Jeethu committed on
Commit
e318e73
·
1 Parent(s): a97a41c

Add weights

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
README.md CHANGED
@@ -1,3 +1,13 @@
1
  ---
2
  license: mit
 
 
 
 
 
 
 
 
3
  ---
 
 
 
1
  ---
2
  license: mit
3
+ language:
4
+ - en
5
+ base_model: deepseek-ai/DeepSeek-R1-Distill-Qwen-14B
6
+ base_model_relation: quantized
7
+ library_name: mlc-llm
8
+ pipeline_tag: text-generation
9
+ tags:
10
+ - chat
11
  ---
12
+
13
+ 4-bit GPTQ-quantized version of [DeepSeek-R1-Distill-Qwen-14B](https://huggingface.co/deepseek-ai/DeepSeek-R1-Distill-Qwen-14B).
mlc-chat-config.json ADDED
@@ -0,0 +1,76 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "qwen2",
4
+ "quantization": "GPTQ-Int4",
5
+ "model_config": {
6
+ "hidden_act": "silu",
7
+ "hidden_size": 5120,
8
+ "intermediate_size": 13824,
9
+ "num_attention_heads": 40,
10
+ "num_hidden_layers": 48,
11
+ "num_key_value_heads": 8,
12
+ "rms_norm_eps": 1e-05,
13
+ "rope_theta": 1000000.0,
14
+ "vocab_size": 152064,
15
+ "tie_word_embeddings": false,
16
+ "context_window_size": 8192,
17
+ "prefill_chunk_size": 128,
18
+ "tensor_parallel_shards": 1,
19
+ "head_dim": 128,
20
+ "dtype": "float32",
21
+ "max_batch_size": 128
22
+ },
23
+ "vocab_size": 152064,
24
+ "context_window_size": 8192,
25
+ "sliding_window_size": -1,
26
+ "prefill_chunk_size": 128,
27
+ "attention_sink_size": -1,
28
+ "tensor_parallel_shards": 1,
29
+ "pipeline_parallel_stages": 1,
30
+ "temperature": 1.0,
31
+ "presence_penalty": 0.0,
32
+ "frequency_penalty": 0.0,
33
+ "repetition_penalty": 1.0,
34
+ "top_p": 1.0,
35
+ "tokenizer_files": [
36
+ "tokenizer.json",
37
+ "tokenizer_config.json"
38
+ ],
39
+ "tokenizer_info": {
40
+ "token_postproc_method": "byte_level",
41
+ "prepend_space_in_encode": false,
42
+ "strip_space_in_decode": false
43
+ },
44
+ "conv_template": {
45
+ "name": "deepseek_r1_qwen",
46
+ "system_template": "<\uff5cbegin\u2581of\u2581sentence\uff5c>{system_message}",
47
+ "system_message": "You are a helpful assistant.",
48
+ "system_prefix_token_ids": null,
49
+ "add_role_after_system_message": true,
50
+ "roles": {
51
+ "user": "<\uff5cUser\uff5c>",
52
+ "assistant": "<\uff5cAssistant\uff5c>"
53
+ },
54
+ "role_templates": {
55
+ "user": "{user_message}",
56
+ "assistant": "{assistant_message}",
57
+ "tool": "{tool_message}"
58
+ },
59
+ "messages": [],
60
+ "seps": [
61
+ "",
62
+ "<\uff5cend\u2581of\u2581sentence\uff5c>"
63
+ ],
64
+ "role_content_sep": "",
65
+ "role_empty_sep": "",
66
+ "stop_str": [],
67
+ "stop_token_ids": [
68
+ 151643
69
+ ],
70
+ "function_string": "",
71
+ "use_function_calling": false
72
+ },
73
+ "pad_token_id": 0,
74
+ "bos_token_id": 151643,
75
+ "eos_token_id": 151643
76
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f6b077069dfff6eaf8b35ea54715525d28def5bed9b7598e971fbbe7e196a9b4
3
+ size 389283840
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a311e89f4f75ce982e5766cb9ea83004533668f486ec32acb3b9b94bc5edb1bc
3
+ size 31102976
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4bfea67143d6de96ca90bc361a292206f7490184a0199e2b2f4074caf1ac0e52
3
+ size 35389440
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4ff64442b447f24fb1e6718a972babd02f49d2decb7763fbce514dd471bd11a
3
+ size 35389440
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06a89d57f2ab1256fd199bd3517289cccabef0597f609d28739c3e8a486e17f3
3
+ size 22685696
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:938b807bd84751503d46361b2d3e4076354a27eeb869c4f3a8c52701a7654f53
3
+ size 70778880
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:697694ed70b62ba5fa9535603670301785ce5bcf79b6464512ebf0c3256dc115
3
+ size 35389440
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9949a85ea5c945f7a23d4c90e572505a6f5180ca380dda0ddce6e18434386ee4
3
+ size 18350080
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3e40ad3cd2ad67220be3c2fcb6b86faf9c67ff8f351eadd9d85338b9322e782
3
+ size 70778880
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d5030a9b79d39094a5352885aeb0e6ed3b42f5b1c5e210554dc29103af21f1a
3
+ size 35389440
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f405d5c2ca881925c0599d7374a13d79d04625d9f5ffa880bf48716a91d4fb5e
3
+ size 33171456
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81147a86c465792ef02e127b9a64dfbfb0feba6dcc78f8cc3fe61bd8575e874c
3
+ size 33171456
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93e877d9ecba01659351e34a5a801da25cfb15f2c48567084790fb429690c0d5
3
+ size 70778880
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ef809684f448c78231eb2a9734416f72591a49015f3fc9d371bdf3e2d07fc6e
3
+ size 22685696
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ada333314e827370007e018bad6dd7dc4dcd3f636f7335c3858782922ce4f7d
3
+ size 35389440
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:568c493868ca9861505f7976461513102c22bac0acced85d44793588bb329c46
3
+ size 22685696
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c0cde261a36a7acb08eeef86d2525519d101bd6c95f3a124070b853e7c59805
3
+ size 70778880
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d9924e1614e7a923caee512ffd704e991a9473300701796766b567771d18de4
3
+ size 35389440
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:577abd523eeb442d8b5d21fc5f2bb11123157e92033203ed56e5339e72d2ee91
3
+ size 18350080
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c8a318b4a9889ca42756619a0ef3df8bb5c3623b108b62f58049069b0877e6e
3
+ size 70778880
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7949d07a17c40671d9e12a01387e8b2e5b300adf51bdc8aabe0b7342778b78e
3
+ size 35389440
params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11246b39c54a1054f3b773b25423148681e8a6bcfb7ec6c177aea0b75c0f94f0
3
+ size 33171456
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc5cf574fd175823c01b4c58d8be8173add4a7f356c151ec7692e9ca75597be3
3
+ size 33171456
params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a680c970a687a72557a98e0b500c1ee5902f1513d30da0e13e888309dfa87b7
3
+ size 70778880
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d8085e25818aea50723fc4c687e049a029a19ea91f32f50ba21a0ad59601ee0a
3
+ size 70778880
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15b9a5e9208c5e4ed33a8e7c17dd10ca057e88f91a85dbccb32eef5120f18667
3
+ size 35389440
params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8b5602c69d9f1291d8184b3c7373ba79360d55ccb874da21200551b3ae4b5601
3
+ size 22685696
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:171ea1c83616057e7fd285b6e1fbfacdcae1ccad0d479111deb3def6cc2a29b7
3
+ size 70778880
params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41e450226a1200c121a045b2de6ab7795994dc3c83c427e6893915aa72c7a8ae
3
+ size 35389440
params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d192e807e061643434650645d37c95c656fe8d2e57622f98b51907928e43b2c1
3
+ size 18350080
params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f17fee144b67db35359914f69a73f1d12d239e099d22a78e1a23cb417a7ed672
3
+ size 70778880
params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5acb11997e75912201972c90b9ba7436f3b27fef307fd8f91c8a90a40477633
3
+ size 35389440
params_shard_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7be41733c2b3fd649c886c49778e39f05576a8220eb9679b82b218084473365
3
+ size 33171456
params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:06ef71f65d3cbec845dffe133dc0787a88a2e8ca20e568c716d95065f5865829
3
+ size 33171456
params_shard_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e68cb0e1681aeea17e18efb0cd4dd62afa766310a695852b22d1f2e806e3143e
3
+ size 70778880
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc7603642a731feadc49f4e8ef00dfc1ba7a023f0eebdc128f44ae962e04aea4
3
+ size 35389440
params_shard_130.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0f4a8c397bbb574f050d36c96d99447df75a7c052d1b1cf37b139cd0fc724669
3
+ size 35389440
params_shard_131.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c93e7f865ea7c91bb76d97f8ea22f5cd8b2304ce0f46d654c2cbd438f82e19bc
3
+ size 22685696
params_shard_132.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63cd0a7810526bd43232107f42ab2db01eb1e9e5f83c37393a38c73695875974
3
+ size 70778880
params_shard_133.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b6c2d3b303b80175bd9e4d9b308ff11c32870ffa45535adbfbe0e7af2353b4c6
3
+ size 35389440
params_shard_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0de0b0068cd4ad767c6e617a92ca848c315e3fd4224d0257fa16bf7f04ec0e56
3
+ size 18350080
params_shard_135.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:802a89e787c1829349a29537e588c8053966691466e85373360c316e58d0c651
3
+ size 70778880
params_shard_136.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afbdc6055e6c25575fbd40940f05037878a9100bdf6058fab1057c76679a3826
3
+ size 35389440
params_shard_137.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4328f387a6207abd80588e037d71b2b8c06ae7606a8c2fda4c6bacf8b3ff2987
3
+ size 33171456
params_shard_138.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:012f8f8668208b0209dca3722d6f201e928c4445aacdd3e114678573d52b1e7d
3
+ size 33171456
params_shard_139.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1fad20debebf989642578a73fab16640d178c0e009cb41b431ca5e4770822a58
3
+ size 70778880
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7778e96c23fedfd1a48a7ccad5ae495e8b108736e9edd3e010eaad201ba3994f
3
+ size 18350080