Add files using upload-large-folder tool

Browse files

Files changed (5) hide show

README.md +10 -13
chat_template.jinja +101 -0
model.safetensors +1 -1
model.safetensors.index.json +2 -1
tokenizer_config.json +5 -4

README.md CHANGED Viewed

@@ -1,20 +1,17 @@
----
-license: apache-2.0
-library_name: mlx
-tags:
-- mlx
-pipeline_tag: text-generation
-base_model: deepseek-ai/DeepSeek-R1-0528-Qwen3-8B
----
 # mlx-community/DeepSeek-R1-0528-Qwen3-8B-4bit-AWQ
 This model [mlx-community/DeepSeek-R1-0528-Qwen3-8B-4bit-AWQ](https://huggingface.co/mlx-community/DeepSeek-R1-0528-Qwen3-8B-4bit-AWQ) was
 converted to MLX format from [deepseek-ai/DeepSeek-R1-0528-Qwen3-8B](https://huggingface.co/deepseek-ai/DeepSeek-R1-0528-Qwen3-8B)
-using mlx-lm version **0.24.1**.
-AWQ Parameters:
---bits 4 --num-samples 256 --group-size 64 --sequence-length 1024, with a custom calibration dataset
 ## Use with mlx
@@ -36,4 +33,4 @@ if tokenizer.chat_template is not None:
     )
 response = generate(model, tokenizer, prompt=prompt, verbose=True)
-```

+---
+license: mit
+library_name: mlx
+tags:
+- mlx
+base_model: deepseek-ai/DeepSeek-R1-0528-Qwen3-8B
+pipeline_tag: text-generation
+---
 # mlx-community/DeepSeek-R1-0528-Qwen3-8B-4bit-AWQ
 This model [mlx-community/DeepSeek-R1-0528-Qwen3-8B-4bit-AWQ](https://huggingface.co/mlx-community/DeepSeek-R1-0528-Qwen3-8B-4bit-AWQ) was
 converted to MLX format from [deepseek-ai/DeepSeek-R1-0528-Qwen3-8B](https://huggingface.co/deepseek-ai/DeepSeek-R1-0528-Qwen3-8B)
+using mlx-lm version **0.25.2**.
 ## Use with mlx
     )
 response = generate(model, tokenizer, prompt=prompt, verbose=True)
+```

chat_template.jinja ADDED Viewed

	@@ -0,0 +1,101 @@

+{#- Chat prompt template: emits bos_token, the combined system prompt, then each user / assistant / tool message wrapped in the model's special tokens. #}
+{#- Reads: messages, bos_token, and optionally tools and add_generation_prompt. #}
+{%- if not add_generation_prompt is defined %}
+    {%- set add_generation_prompt = false %}
+{%- endif %}
+{#- ns carries state across loop iterations (plain set inside a for loop does not persist). #}
+{%- set ns = namespace(is_first=false, is_tool=false, is_output_first=true, system_prompt='', is_first_sp=true, is_last_user=false) %}
+{#- Pass 1: concatenate every system message into ns.system_prompt, separated by a blank line. #}
+{%- for message in messages %}
+    {%- if message['role'] == 'system' %}
+        {%- if ns.is_first_sp %}
+            {%- set ns.system_prompt = ns.system_prompt + message['content'] %}
+            {%- set ns.is_first_sp = false %}
+        {%- else %}
+            {%- set ns.system_prompt = ns.system_prompt + '\n\n' + message['content'] %}
+        {%- endif %}
+    {%- endif %}
+{%- endfor %}
+{#- Adapted from https://github.com/sgl-project/sglang/blob/main/examples/chat_template/tool_chat_template_deepseekr1.jinja #}
+{#- When tools are supplied, append tool-calling instructions and one JSON block per tool to the system prompt. #}
+{%- if tools is defined and tools is not none %}
+    {%- set tool_ns = namespace(text='You are a helpful assistant with tool calling capabilities. ' + 'When a tool call is needed, you MUST use the following format to issue the call:\n' + '<｜tool▁calls▁begin｜><｜tool▁call▁begin｜>function<｜tool▁sep｜>FUNCTION_NAME\n' + '```json\n{"param1": "value1", "param2": "value2"}\n```<｜tool▁call▁end｜><｜tool▁calls▁end｜>\n\n' + 'Make sure the JSON is valid.' + '## Tools\n\n### Function\n\nYou have the following functions available:\n\n') %}
+    {%- for tool in tools %}
+        {%- set tool_ns.text = tool_ns.text + '\n```json\n' + (tool | tojson) + '\n```\n' %}
+    {%- endfor %}
+    {%- if ns.system_prompt|length != 0 %}
+        {%- set ns.system_prompt = ns.system_prompt + '\n\n' + tool_ns.text %}
+    {%- else %}
+        {%- set ns.system_prompt = tool_ns.text %}
+    {%- endif %}
+{%- endif %}
+{{- bos_token }}
+{{- ns.system_prompt }}
+{%- set last_index = (messages|length - 1) %}
+{#- Pass 2: render the conversation turn by turn. #}
+{%- for message in messages %}
+    {%- set content = message['content'] %}
+    {%- if message['role'] == 'user' %}
+        {%- set ns.is_tool = false -%}
+        {%- set ns.is_first = false -%}
+        {%- set ns.is_last_user = true -%}
+        {#- A trailing user message omits the assistant tag here; it is added at the end only when add_generation_prompt is set. #}
+        {%- if loop.index0 == last_index %}
+            {{- '<｜User｜>' + content }}
+        {%- else %}
+            {{- '<｜User｜>' + content + '<｜Assistant｜>'}}
+        {%- endif %}
+    {%- endif %}
+    {%- if message['role'] == 'assistant' %}
+        {#- Keep only the text after the last think-closing tag. The none check avoids a TypeError on tool-call messages whose content is null. #}
+        {%- if content is not none and '</think>' in content %}
+            {%- set content = (content.split('</think>')|last) %}
+        {%- endif %}
+    {%- endif %}
+    {%- if message['role'] == 'assistant' and message['tool_calls'] is defined and message['tool_calls'] is not none %}
+        {%- set ns.is_last_user = false -%}
+        {#- Close a still-open tool-outputs section before starting a new batch of calls. #}
+        {%- if ns.is_tool %}
+            {{- '<｜tool▁outputs▁end｜>'}}
+        {%- endif %}
+        {%- set ns.is_first = false %}
+        {%- set ns.is_tool = false -%}
+        {%- set ns.is_output_first = true %}
+        {%- for tool in message['tool_calls'] %}
+            {#- Arguments that are not already a string are serialized to JSON so they can be concatenated. #}
+            {%- set arguments = tool['function']['arguments'] %}
+            {%- if arguments is not string %}
+                {%- set arguments = arguments|tojson %}
+            {%- endif %}
+            {#- ns.is_first is false until the first call has been written; that first call also carries the opening tag and any assistant content. #}
+            {%- if not ns.is_first %}
+                {%- if content is none %}
+                    {{- '<｜tool▁calls▁begin｜><｜tool▁call▁begin｜>' + tool['type'] + '<｜tool▁sep｜>' + tool['function']['name'] + '\n' + '```json' + '\n' + arguments + '\n' + '```' + '<｜tool▁call▁end｜>'}}
+                {%- else %}
+                    {{- content + '<｜tool▁calls▁begin｜><｜tool▁call▁begin｜>' + tool['type'] + '<｜tool▁sep｜>' + tool['function']['name'] + '\n' + '```json' + '\n' + arguments + '\n' + '```' + '<｜tool▁call▁end｜>'}}
+                {%- endif %}
+                {%- set ns.is_first = true -%}
+            {%- else %}
+                {{- '\n' + '<｜tool▁call▁begin｜>' + tool['type'] + '<｜tool▁sep｜>' + tool['function']['name'] + '\n' + '```json' + '\n' + arguments + '\n' + '```' + '<｜tool▁call▁end｜>'}}
+            {%- endif %}
+        {%- endfor %}
+        {{- '<｜tool▁calls▁end｜><｜end▁of▁sentence｜>'}}
+    {%- endif %}
+    {%- if message['role'] == 'assistant' and (message['tool_calls'] is not defined or message['tool_calls'] is none) %}
+        {%- set ns.is_last_user = false -%}
+        {#- A plain assistant reply that follows tool outputs must first close the tool-outputs section. #}
+        {%- if ns.is_tool %}
+            {{- '<｜tool▁outputs▁end｜>' + content + '<｜end▁of▁sentence｜>'}}
+            {%- set ns.is_tool = false -%}
+        {%- else %}
+            {{- content + '<｜end▁of▁sentence｜>'}}
+        {%- endif %}
+    {%- endif %}
+    {%- if message['role'] == 'tool' %}
+        {%- set ns.is_last_user = false -%}
+        {%- set ns.is_tool = true -%}
+        {#- Only the first output after a batch of calls writes the section-opening tag; later ones are newline-separated. #}
+        {%- if ns.is_output_first %}
+            {{- '<｜tool▁outputs▁begin｜><｜tool▁output▁begin｜>' + content + '<｜tool▁output▁end｜>'}}
+            {%- set ns.is_output_first = false %}
+        {%- else %}
+            {{- '\n<｜tool▁output▁begin｜>' + content + '<｜tool▁output▁end｜>'}}
+        {%- endif %}
+    {%- endif %}
+{%- endfor -%}
+{#- If the conversation ends on tool output, close the section. #}
+{%- if ns.is_tool %}
+    {{- '<｜tool▁outputs▁end｜>'}}
+{%- endif %}
+{#- if add_generation_prompt and not ns.is_last_user and not ns.is_tool #}
+{%- if add_generation_prompt and not ns.is_tool %}
+    {{- '<｜Assistant｜>'}}
+{%- endif %}

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f6e3b583241de5a9c6ca377239fa56415f42c5338db8bd0016ecce1f84f4d809
 size 4685626408

 version https://git-lfs.github.com/spec/v1
+oid sha256:6855552e30af2a06fcbfaba711352e460ee4df303d3fcea7d1fdae63e2b271fc
 size 4685626408

model.safetensors.index.json CHANGED Viewed

@@ -1,6 +1,7 @@
 {
     "metadata": {
-        "total_size": 4685522944
     },
     "weight_map": {
         "lm_head.biases": "model.safetensors",

 {
     "metadata": {
+        "total_size": 4685522944,
+        "total_parameters": 8190735360
     },
     "weight_map": {
         "lm_head.biases": "model.safetensors",

tokenizer_config.json CHANGED Viewed

@@ -229,15 +229,16 @@
     }
   },
   "bos_token": "<｜begin▁of▁sentence｜>",
-  "chat_template": "{% if not add_generation_prompt is defined %}{% set add_generation_prompt = false %}{% endif %}{% set ns = namespace(is_first=false, is_tool=false, is_output_first=true, system_prompt='', is_first_sp=true, is_last_user=false) %}{%- for message in messages %}{%- if message['role'] == 'system' %}{%- if ns.is_first_sp %}{% set ns.system_prompt = ns.system_prompt + message['content'] %}{% set ns.is_first_sp = false %}{%- else %}{% set ns.system_prompt = ns.system_prompt + '\n\n' + message['content'] %}{%- endif %}{%- endif %}{%- endfor %}{{ bos_token }}{{ ns.system_prompt }}{%- for message in messages %}{% set content = message['content'] %}{%- if message['role'] == 'user' %}{%- set ns.is_tool = false -%}{%- set ns.is_first = false -%}{%- set ns.is_last_user = true -%}{{'<｜User｜>' + content + '<｜Assistant｜>'}}{%- endif %}{%- if message['role'] == 'assistant' %}{% if '</think>' in content %}{% set content = content.split('</think>')[-1] %}{% endif %}{% endif %}{%- if message['role'] == 'assistant' and message['tool_calls'] is defined and message['tool_calls'] is not none %}{%- set ns.is_last_user = false -%}{%- if ns.is_tool %}{{'<｜tool▁outputs▁end｜>'}}{%- endif %}{%- set ns.is_first = false %}{%- set ns.is_tool = false -%}{%- set ns.is_output_first = true %}{%- for tool in message['tool_calls'] %}{%- if not ns.is_first %}{%- if content is none %}{{'<｜tool▁calls▁begin｜><｜tool▁call▁begin｜>' + tool['type'] + '<｜tool▁sep｜>' + tool['function']['name'] + '\n' + '```json' + '\n' + tool['function']['arguments'] + '\n' + '```' + '<｜tool▁call▁end｜>'}}{%- else %}{{content + '<｜tool▁calls▁begin｜><｜tool▁call▁begin｜>' + tool['type'] + '<｜tool▁sep｜>' + tool['function']['name'] + '\n' + '```json' + '\n' + tool['function']['arguments'] + '\n' + '```' + '<｜tool▁call▁end｜>'}}{%- endif %}{%- set ns.is_first = true -%}{%- else %}{{'\n' + '<｜tool▁call▁begin｜>' + tool['type'] + '<｜tool▁sep｜>' + tool['function']['name'] + '\n' + '```json' + '\n' + 
tool['function']['arguments'] + '\n' + '```' + '<｜tool▁call▁end｜>'}}{%- endif %}{%- endfor %}{{'<｜tool▁calls▁end｜><｜end▁of▁sentence｜>'}}{%- endif %}{%- if message['role'] == 'assistant' and (message['tool_calls'] is not defined or message['tool_calls'] is none)%}{%- set ns.is_last_user = false -%}{%- if ns.is_tool %}{{'<｜tool▁outputs▁end｜>' + content + '<｜end▁of▁sentence｜>'}}{%- set ns.is_tool = false -%}{%- else %}{{content + '<｜end▁of▁sentence｜>'}}{%- endif %}{%- endif %}{%- if message['role'] == 'tool' %}{%- set ns.is_last_user = false -%}{%- set ns.is_tool = true -%}{%- if ns.is_output_first %}{{'<｜tool▁outputs▁begin｜><｜tool▁output▁begin｜>' + content + '<｜tool▁output▁end｜>'}}{%- set ns.is_output_first = false %}{%- else %}{{'\n<｜tool▁output▁begin｜>' + content + '<｜tool▁output▁end｜>'}}{%- endif %}{%- endif %}{%- endfor -%}{% if ns.is_tool %}{{'<｜tool▁outputs▁end｜>'}}{% endif %}{% if add_generation_prompt and not ns.is_last_user and not ns.is_tool %}{{'<｜Assistant｜>'}}{% endif %}",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<｜end▁of▁sentence｜>",
   "extra_special_tokens": {},
   "legacy": true,
   "model_max_length": 131072,
-  "pad_token": "<｜end▁of▁sentence｜>",
   "sp_model_kwargs": {},
   "tokenizer_class": "LlamaTokenizerFast",
   "unk_token": null,
-  "use_default_system_prompt": false
-}

     }
   },
   "bos_token": "<｜begin▁of▁sentence｜>",
   "clean_up_tokenization_spaces": false,
   "eos_token": "<｜end▁of▁sentence｜>",
   "extra_special_tokens": {},
   "legacy": true,
   "model_max_length": 131072,
+  "pad_token": "<|vision_pad|>",
+  "padding_side": "left",
   "sp_model_kwargs": {},
   "tokenizer_class": "LlamaTokenizerFast",
   "unk_token": null,
+  "use_default_system_prompt": false,
+  "chat_template": "{%- if not add_generation_prompt is defined %}\n    {%- set add_generation_prompt = false %}\n{%- endif %}\n{%- set ns = namespace(is_first=false, is_tool=false, is_output_first=true, system_prompt='', is_first_sp=true, is_last_user=false) %}\n{%- for message in messages %}\n    {%- if message['role'] == 'system' %}\n        {%- if ns.is_first_sp %}\n            {%- set ns.system_prompt = ns.system_prompt + message['content'] %}\n            {%- set ns.is_first_sp = false %}\n        {%- else %}\n            {%- set ns.system_prompt = ns.system_prompt + '\\n\\n' + message['content'] %}\n        {%- endif %}\n    {%- endif %}\n{%- endfor %}\n\n{#- Adapted from https://github.com/sgl-project/sglang/blob/main/examples/chat_template/tool_chat_template_deepseekr1.jinja #}\n{%- if tools is defined and tools is not none %}\n    {%- set tool_ns = namespace(text='You are a helpful assistant with tool calling capabilities. ' + 'When a tool call is needed, you MUST use the following format to issue the call:\\n' + '<｜tool▁calls▁begin｜><｜tool▁call▁begin｜>function<｜tool▁sep｜>FUNCTION_NAME\\n' + '```json\\n{\"param1\": \"value1\", \"param2\": \"value2\"}\\n```<｜tool▁call▁end｜><｜tool▁calls▁end｜>\\n\\n' + 'Make sure the JSON is valid.' 
+ '## Tools\\n\\n### Function\\n\\nYou have the following functions available:\\n\\n') %}\n    {%- for tool in tools %}\n        {%- set tool_ns.text = tool_ns.text + '\\n```json\\n' + (tool | tojson) + '\\n```\\n' %}\n    {%- endfor %}\n    {%- if ns.system_prompt|length != 0 %}\n        {%- set ns.system_prompt = ns.system_prompt + '\\n\\n' + tool_ns.text %}\n    {%- else %}\n        {%- set ns.system_prompt = tool_ns.text %}\n    {%- endif %}\n{%- endif %}\n{{- bos_token }}\n{{- ns.system_prompt }}\n{%- set last_index = (messages|length - 1) %}\n{%- for message in messages %}\n    {%- set content = message['content'] %}\n    {%- if message['role'] == 'user' %}\n        {%- set ns.is_tool = false -%}\n        {%- set ns.is_first = false -%}\n        {%- set ns.is_last_user = true -%}\n        {%- if loop.index0 == last_index %}\n            {{- '<｜User｜>' + content }}\n        {%- else %}\n            {{- '<｜User｜>' + content + '<｜Assistant｜>'}}\n        {%- endif %}\n    {%- endif %}\n    {%- if message['role'] == 'assistant' %}\n        {%- if '</think>' in content %}\n            {%- set content = (content.split('</think>')|last) %}\n        {%- endif %}\n    {%- endif %}\n    {%- if message['role'] == 'assistant' and message['tool_calls'] is defined and message['tool_calls'] is not none %}\n        {%- set ns.is_last_user = false -%}\n        {%- if ns.is_tool %}\n            {{- '<｜tool▁outputs▁end｜>'}}\n        {%- endif %}\n        {%- set ns.is_first = false %}\n        {%- set ns.is_tool = false -%}\n        {%- set ns.is_output_first = true %}\n        {%- for tool in message['tool_calls'] %}\n            {%- set arguments = tool['function']['arguments'] %}\n            {%- if arguments is not string %}\n                {%- set arguments = arguments|tojson %}\n            {%- endif %}\n            {%- if not ns.is_first %}\n                {%- if content is none %}\n                    {{- '<｜tool▁calls▁begin｜><｜tool▁call▁begin｜>' + tool['type'] + 
'<｜tool▁sep｜>' + tool['function']['name'] + '\\n' + '```json' + '\\n' + arguments + '\\n' + '```' + '<｜tool▁call▁end｜>'}}\n                {%- else %}\n                    {{- content + '<｜tool▁calls▁begin｜><｜tool▁call▁begin｜>' + tool['type'] + '<｜tool▁sep｜>' + tool['function']['name'] + '\\n' + '```json' + '\\n' + arguments + '\\n' + '```' + '<｜tool▁call▁end｜>'}}\n                {%- endif %}\n                {%- set ns.is_first = true -%}\n            {%- else %}\n                {{- '\\n' + '<｜tool▁call▁begin｜>' + tool['type'] + '<｜tool▁sep｜>' + tool['function']['name'] + '\\n' + '```json' + '\\n' + arguments + '\\n' + '```' + '<｜tool▁call▁end｜>'}}\n            {%- endif %}\n        {%- endfor %}\n        {{- '<｜tool▁calls▁end｜><｜end▁of▁sentence｜>'}}\n    {%- endif %}\n    {%- if message['role'] == 'assistant' and (message['tool_calls'] is not defined or message['tool_calls'] is none) %}\n        {%- set ns.is_last_user = false -%}\n        {%- if ns.is_tool %}\n            {{- '<｜tool▁outputs▁end｜>' + content + '<｜end▁of▁sentence｜>'}}\n            {%- set ns.is_tool = false -%}\n        {%- else %}\n            {{- content + '<｜end▁of▁sentence｜>'}}\n        {%- endif %}\n    {%- endif %}\n    {%- if message['role'] == 'tool' %}\n        {%- set ns.is_last_user = false -%}\n        {%- set ns.is_tool = true -%}\n        {%- if ns.is_output_first %}\n            {{- '<｜tool▁outputs▁begin｜><｜tool▁output▁begin｜>' + content + '<｜tool▁output▁end｜>'}}\n            {%- set ns.is_output_first = false %}\n        {%- else %}\n            {{- '\\n<｜tool▁output▁begin｜>' + content + '<｜tool▁output▁end｜>'}}\n        {%- endif %}\n    {%- endif %}\n{%- endfor -%}\n{%- if ns.is_tool %}\n    {{- '<｜tool▁outputs▁end｜>'}}\n{%- endif %}\n{#- if add_generation_prompt and not ns.is_last_user and not ns.is_tool #}\n{%- if add_generation_prompt and not ns.is_tool %}\n    {{- '<｜Assistant｜>'}}\n{%- endif %}"
+}