Add weights
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- README.md +10 -0
- mlc-chat-config.json +76 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
- params_shard_14.bin +3 -0
README.md
CHANGED
@@ -1,3 +1,13 @@
|
|
1 |
---
|
2 |
license: mit
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3 |
---
|
|
|
|
|
|
1 |
---
|
2 |
license: mit
|
3 |
+
language:
|
4 |
+
- en
|
5 |
+
base_model: deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
|
6 |
+
base_model_relation: quantized
|
7 |
+
library_name: mlc-llm
|
8 |
+
pipeline_tag: text-generation
|
9 |
+
tags:
|
10 |
+
- chat
|
11 |
---
|
12 |
+
|
13 |
+
4-bit GPTQ quantized version of [DeepSeek-R1-Distill-Qwen-14B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-14B).
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,76 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "qwen2",
|
4 |
+
"quantization": "GPTQ-Int4",
|
5 |
+
"model_config": {
|
6 |
+
"hidden_act": "silu",
|
7 |
+
"hidden_size": 5120,
|
8 |
+
"intermediate_size": 13824,
|
9 |
+
"num_attention_heads": 40,
|
10 |
+
"num_hidden_layers": 48,
|
11 |
+
"num_key_value_heads": 8,
|
12 |
+
"rms_norm_eps": 1e-05,
|
13 |
+
"rope_theta": 1000000.0,
|
14 |
+
"vocab_size": 152064,
|
15 |
+
"tie_word_embeddings": false,
|
16 |
+
"context_window_size": 8192,
|
17 |
+
"prefill_chunk_size": 128,
|
18 |
+
"tensor_parallel_shards": 1,
|
19 |
+
"head_dim": 128,
|
20 |
+
"dtype": "float32",
|
21 |
+
"max_batch_size": 128
|
22 |
+
},
|
23 |
+
"vocab_size": 152064,
|
24 |
+
"context_window_size": 8192,
|
25 |
+
"sliding_window_size": -1,
|
26 |
+
"prefill_chunk_size": 128,
|
27 |
+
"attention_sink_size": -1,
|
28 |
+
"tensor_parallel_shards": 1,
|
29 |
+
"pipeline_parallel_stages": 1,
|
30 |
+
"temperature": 1.0,
|
31 |
+
"presence_penalty": 0.0,
|
32 |
+
"frequency_penalty": 0.0,
|
33 |
+
"repetition_penalty": 1.0,
|
34 |
+
"top_p": 1.0,
|
35 |
+
"tokenizer_files": [
|
36 |
+
"tokenizer.json",
|
37 |
+
"tokenizer_config.json"
|
38 |
+
],
|
39 |
+
"tokenizer_info": {
|
40 |
+
"token_postproc_method": "byte_level",
|
41 |
+
"prepend_space_in_encode": false,
|
42 |
+
"strip_space_in_decode": false
|
43 |
+
},
|
44 |
+
"conv_template": {
|
45 |
+
"name": "deepseek_r1_qwen",
|
46 |
+
"system_template": "<\uff5cbegin\u2581of\u2581sentence\uff5c>{system_message}",
|
47 |
+
"system_message": "You are a helpful assistant.",
|
48 |
+
"system_prefix_token_ids": null,
|
49 |
+
"add_role_after_system_message": true,
|
50 |
+
"roles": {
|
51 |
+
"user": "<\uff5cUser\uff5c>",
|
52 |
+
"assistant": "<\uff5cAssistant\uff5c>"
|
53 |
+
},
|
54 |
+
"role_templates": {
|
55 |
+
"user": "{user_message}",
|
56 |
+
"assistant": "{assistant_message}",
|
57 |
+
"tool": "{tool_message}"
|
58 |
+
},
|
59 |
+
"messages": [],
|
60 |
+
"seps": [
|
61 |
+
"",
|
62 |
+
"<\uff5cend\u2581of\u2581sentence\uff5c>"
|
63 |
+
],
|
64 |
+
"role_content_sep": "",
|
65 |
+
"role_empty_sep": "",
|
66 |
+
"stop_str": [],
|
67 |
+
"stop_token_ids": [
|
68 |
+
151643
|
69 |
+
],
|
70 |
+
"function_string": "",
|
71 |
+
"use_function_calling": false
|
72 |
+
},
|
73 |
+
"pad_token_id": 0,
|
74 |
+
"bos_token_id": 151643,
|
75 |
+
"eos_token_id": 151643
|
76 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6b077069dfff6eaf8b35ea54715525d28def5bed9b7598e971fbbe7e196a9b4
|
3 |
+
size 389283840
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a311e89f4f75ce982e5766cb9ea83004533668f486ec32acb3b9b94bc5edb1bc
|
3 |
+
size 31102976
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4bfea67143d6de96ca90bc361a292206f7490184a0199e2b2f4074caf1ac0e52
|
3 |
+
size 35389440
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4ff64442b447f24fb1e6718a972babd02f49d2decb7763fbce514dd471bd11a
|
3 |
+
size 35389440
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06a89d57f2ab1256fd199bd3517289cccabef0597f609d28739c3e8a486e17f3
|
3 |
+
size 22685696
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:938b807bd84751503d46361b2d3e4076354a27eeb869c4f3a8c52701a7654f53
|
3 |
+
size 70778880
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:697694ed70b62ba5fa9535603670301785ce5bcf79b6464512ebf0c3256dc115
|
3 |
+
size 35389440
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9949a85ea5c945f7a23d4c90e572505a6f5180ca380dda0ddce6e18434386ee4
|
3 |
+
size 18350080
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f3e40ad3cd2ad67220be3c2fcb6b86faf9c67ff8f351eadd9d85338b9322e782
|
3 |
+
size 70778880
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d5030a9b79d39094a5352885aeb0e6ed3b42f5b1c5e210554dc29103af21f1a
|
3 |
+
size 35389440
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f405d5c2ca881925c0599d7374a13d79d04625d9f5ffa880bf48716a91d4fb5e
|
3 |
+
size 33171456
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81147a86c465792ef02e127b9a64dfbfb0feba6dcc78f8cc3fe61bd8575e874c
|
3 |
+
size 33171456
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93e877d9ecba01659351e34a5a801da25cfb15f2c48567084790fb429690c0d5
|
3 |
+
size 70778880
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ef809684f448c78231eb2a9734416f72591a49015f3fc9d371bdf3e2d07fc6e
|
3 |
+
size 22685696
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ada333314e827370007e018bad6dd7dc4dcd3f636f7335c3858782922ce4f7d
|
3 |
+
size 35389440
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:568c493868ca9861505f7976461513102c22bac0acced85d44793588bb329c46
|
3 |
+
size 22685696
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c0cde261a36a7acb08eeef86d2525519d101bd6c95f3a124070b853e7c59805
|
3 |
+
size 70778880
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d9924e1614e7a923caee512ffd704e991a9473300701796766b567771d18de4
|
3 |
+
size 35389440
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:577abd523eeb442d8b5d21fc5f2bb11123157e92033203ed56e5339e72d2ee91
|
3 |
+
size 18350080
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c8a318b4a9889ca42756619a0ef3df8bb5c3623b108b62f58049069b0877e6e
|
3 |
+
size 70778880
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7949d07a17c40671d9e12a01387e8b2e5b300adf51bdc8aabe0b7342778b78e
|
3 |
+
size 35389440
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:11246b39c54a1054f3b773b25423148681e8a6bcfb7ec6c177aea0b75c0f94f0
|
3 |
+
size 33171456
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc5cf574fd175823c01b4c58d8be8173add4a7f356c151ec7692e9ca75597be3
|
3 |
+
size 33171456
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a680c970a687a72557a98e0b500c1ee5902f1513d30da0e13e888309dfa87b7
|
3 |
+
size 70778880
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8085e25818aea50723fc4c687e049a029a19ea91f32f50ba21a0ad59601ee0a
|
3 |
+
size 70778880
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15b9a5e9208c5e4ed33a8e7c17dd10ca057e88f91a85dbccb32eef5120f18667
|
3 |
+
size 35389440
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b5602c69d9f1291d8184b3c7373ba79360d55ccb874da21200551b3ae4b5601
|
3 |
+
size 22685696
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:171ea1c83616057e7fd285b6e1fbfacdcae1ccad0d479111deb3def6cc2a29b7
|
3 |
+
size 70778880
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:41e450226a1200c121a045b2de6ab7795994dc3c83c427e6893915aa72c7a8ae
|
3 |
+
size 35389440
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d192e807e061643434650645d37c95c656fe8d2e57622f98b51907928e43b2c1
|
3 |
+
size 18350080
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f17fee144b67db35359914f69a73f1d12d239e099d22a78e1a23cb417a7ed672
|
3 |
+
size 70778880
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a5acb11997e75912201972c90b9ba7436f3b27fef307fd8f91c8a90a40477633
|
3 |
+
size 35389440
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7be41733c2b3fd649c886c49778e39f05576a8220eb9679b82b218084473365
|
3 |
+
size 33171456
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:06ef71f65d3cbec845dffe133dc0787a88a2e8ca20e568c716d95065f5865829
|
3 |
+
size 33171456
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e68cb0e1681aeea17e18efb0cd4dd62afa766310a695852b22d1f2e806e3143e
|
3 |
+
size 70778880
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bc7603642a731feadc49f4e8ef00dfc1ba7a023f0eebdc128f44ae962e04aea4
|
3 |
+
size 35389440
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0f4a8c397bbb574f050d36c96d99447df75a7c052d1b1cf37b139cd0fc724669
|
3 |
+
size 35389440
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c93e7f865ea7c91bb76d97f8ea22f5cd8b2304ce0f46d654c2cbd438f82e19bc
|
3 |
+
size 22685696
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:63cd0a7810526bd43232107f42ab2db01eb1e9e5f83c37393a38c73695875974
|
3 |
+
size 70778880
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b6c2d3b303b80175bd9e4d9b308ff11c32870ffa45535adbfbe0e7af2353b4c6
|
3 |
+
size 35389440
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0de0b0068cd4ad767c6e617a92ca848c315e3fd4224d0257fa16bf7f04ec0e56
|
3 |
+
size 18350080
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:802a89e787c1829349a29537e588c8053966691466e85373360c316e58d0c651
|
3 |
+
size 70778880
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:afbdc6055e6c25575fbd40940f05037878a9100bdf6058fab1057c76679a3826
|
3 |
+
size 35389440
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4328f387a6207abd80588e037d71b2b8c06ae7606a8c2fda4c6bacf8b3ff2987
|
3 |
+
size 33171456
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:012f8f8668208b0209dca3722d6f201e928c4445aacdd3e114678573d52b1e7d
|
3 |
+
size 33171456
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1fad20debebf989642578a73fab16640d178c0e009cb41b431ca5e4770822a58
|
3 |
+
size 70778880
|
params_shard_14.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7778e96c23fedfd1a48a7ccad5ae495e8b108736e9edd3e010eaad201ba3994f
|
3 |
+
size 18350080
|