riczhou commited on
Commit
e19ead7
·
verified ·
1 Parent(s): 04aa9d0

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
mlc-chat-config.json ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "deepseek_v2",
4
+ "quantization": "q4f16_1",
5
+ "model_config": {
6
+ "vocab_size": 102400,
7
+ "hidden_size": 2048,
8
+ "intermediate_size": 10944,
9
+ "moe_intermediate_size": 1408,
10
+ "num_hidden_layers": 27,
11
+ "num_attention_heads": 16,
12
+ "num_key_value_heads": 16,
13
+ "n_shared_experts": 2,
14
+ "n_routed_experts": 64,
15
+ "num_experts_per_tok": 6,
16
+ "norm_topk_prob": false,
17
+ "first_k_dense_replace": 1,
18
+ "moe_layer_freq": 1,
19
+ "routed_scaling_factor": 1.0,
20
+ "attention_bias": false,
21
+ "kv_lora_rank": 512,
22
+ "qk_rope_head_dim": 64,
23
+ "v_head_dim": 128,
24
+ "qk_nope_head_dim": 128,
25
+ "rms_norm_eps": 1e-06,
26
+ "rope_theta": 10000,
27
+ "q_lora_rank": null,
28
+ "rope_scaling": {
29
+ "beta_fast": 32,
30
+ "beta_slow": 1,
31
+ "factor": 40,
32
+ "mscale": 0.707,
33
+ "mscale_all_dim": 0.707,
34
+ "original_max_position_embeddings": 4096,
35
+ "type": "yarn"
36
+ },
37
+ "context_window_size": 163840,
38
+ "prefill_chunk_size": 8192,
39
+ "tensor_parallel_shards": 1,
40
+ "dtype": "float32",
41
+ "max_batch_size": 128
42
+ },
43
+ "vocab_size": 102400,
44
+ "context_window_size": 163840,
45
+ "sliding_window_size": -1,
46
+ "prefill_chunk_size": 8192,
47
+ "attention_sink_size": -1,
48
+ "tensor_parallel_shards": 1,
49
+ "pipeline_parallel_stages": 1,
50
+ "temperature": 0.3,
51
+ "presence_penalty": 0.0,
52
+ "frequency_penalty": 0.0,
53
+ "repetition_penalty": 1.0,
54
+ "top_p": 0.95,
55
+ "tokenizer_files": [
56
+ "tokenizer.json",
57
+ "tokenizer_config.json"
58
+ ],
59
+ "tokenizer_info": {
60
+ "token_postproc_method": "byte_level",
61
+ "prepend_space_in_encode": false,
62
+ "strip_space_in_decode": false
63
+ },
64
+ "conv_template": {
65
+ "name": "deepseek_v2",
66
+ "system_template": "{system_message}",
67
+ "system_message": "",
68
+ "system_prefix_token_ids": [
69
+ 100000
70
+ ],
71
+ "add_role_after_system_message": true,
72
+ "roles": {
73
+ "user": "User",
74
+ "assistant": "Assistant"
75
+ },
76
+ "role_templates": {
77
+ "user": "{user_message}",
78
+ "assistant": "{assistant_message}",
79
+ "tool": "{tool_message}"
80
+ },
81
+ "messages": [],
82
+ "seps": [
83
+ "\n\n",
84
+ "<\uff5cend\u2581of\u2581sentence\uff5c>"
85
+ ],
86
+ "role_content_sep": ": ",
87
+ "role_empty_sep": ":",
88
+ "stop_str": [
89
+ "<\uff5cend\u2581of\u2581sentence\uff5c>"
90
+ ],
91
+ "stop_token_ids": [
92
+ 100001
93
+ ],
94
+ "function_string": "",
95
+ "use_function_calling": false
96
+ },
97
+ "pad_token_id": 0,
98
+ "bos_token_id": 100000,
99
+ "eos_token_id": 100001
100
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dea775780902e34b2fe56b139732ae03b7d9082c6b463d255355f79ba6205142
3
+ size 104857600
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee9948d56e05798d5113f65d688b0e71048dfa47616dad988be288064a5552d5
3
+ size 104857600
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f3c799eff086f941f3feeea5d95ebe51fe2128ca3d16945e4011a6e51ed64eb
3
+ size 92274688
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98bf83697b161a250c918b7c517fa72e5763ffeafcb08aee26b3d5db8069d315
3
+ size 184549376
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b5560dc29082fb82576e19d2abf25c169bfa4deb979560c18fa9afbbe1ccee0
3
+ size 23068672
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ba7c136fa0cc0adf609a89a060c72a627aee00d038f84427cd41cc14e48c0e9
3
+ size 92274688
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4ece3d672a3b547cd14e9ff0918e80e312fc8fbaf7272087a62eef3ae9503c0d
3
+ size 29279232
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0839e123f575000d7746582936ab7fd276ee5c78fdc1f47855c9f9e2206f8f1d
3
+ size 184549376
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8118c089711f27533dbbfa3751f40baca16086547bccc14bfd748fa162ebb4f4
3
+ size 23068672
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78d2b6d4abdcd3564f6bf2a7e13bd0acc780718ad207e3bef08e1bc3ffc16778
3
+ size 92274688
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:300830f81d6450407068e5c57c8dac6179c93b2b6184d6d232715b5ecb5f61a6
3
+ size 29279232
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed6767b466cbda3ffab11c10a5548b1a9d2712f8dff936168f4555388f520110
3
+ size 11542528
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9f90707c5804ce188af5dc11b197cde12e6a687030bb19604cb8d245a2bf658
3
+ size 29279232
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10deb159c16b095d990e5f9f226f972508d863f15986954a3b6a0fa52db5875b
3
+ size 184549376
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4ac5cd0db89230dd0080f7234f1270a7b9adc4ee14fc33a716c1c7c112dcb08
3
+ size 23068672
params_shard_14.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5ff7aa84705c26bd5630afb55734412aa856c6bf448255a1e1ea5b350f9d7c0
3
+ size 92274688
params_shard_15.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d126aff355210888a34b7d7d328ef18e1dea219e86eb847e864ad2f075a5d7ae
3
+ size 29279232
params_shard_16.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25e318e4a9b3cab494dd5b3b132b06ff8406841a44339827b1f2456ef6c93e6a
3
+ size 184549376
params_shard_17.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:71e963ebe21400fc1776e3cfa977d365cc9b82352fef507c38f1d1153713e36c
3
+ size 23068672
params_shard_18.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cef8ab14a6e74f6aa48f36201bcb05062fe9669382eefe2df0c861c39a39f15
3
+ size 92274688
params_shard_19.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:513c20045affb01450c86edf3fe8fcc15d9a8e45800add5ea1f66878c10b3978
3
+ size 29279232
params_shard_2.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a262afb8c598add92dc9dae205473357c8d1e6ce3de561740d42bca2f4f7e606
3
+ size 31601664
params_shard_20.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1764ee53318f3d1bbaead1c90a7fd4ec2c54a1d51a16b0753efeeaded7551abb
3
+ size 184549376
params_shard_21.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1cb1694d030a99ad74d9b4bd48c42b94440bde9597faf8d25eb5ccebc85a48b1
3
+ size 23068672
params_shard_22.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:481f3b4e174334c1cd3f92fd89bf530197ade1c7bd9ece27a867cc28a7b60a19
3
+ size 92274688
params_shard_23.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:355da7d65416505768af4c01bc00b6a600f75aa1bda3ce304138fb8c1246595f
3
+ size 29279232
params_shard_24.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b602ca4b646d300126ec41bd50e87ba1120b39868f12b2fd205fc9e66910f1d8
3
+ size 184549376
params_shard_25.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d711893eb680229c49938c8154deaaa93f0e41a1f50cd9c43526f1ce72c3f7b
3
+ size 23068672
params_shard_26.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:60af96a46caaab86d61e23ea521e0231460e6562479d99ca0467f2ff82bd94da
3
+ size 92274688
params_shard_27.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3aa33be07f87128795e4e8c34064c00000394e0520320ddb8a50d08cd0015b22
3
+ size 29279232
params_shard_28.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5fab43d72b680a6b1a0dc78d45ac2abff2ca41a26ce76d68c5febe672b9b095c
3
+ size 184549376
params_shard_29.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c25cec021de12f75b1a54f3c657e5a4c1bddacb2eb62f55a447b0b3d0978fbbc
3
+ size 23068672
params_shard_3.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:52353c334e622d01b583ad14159017758fb32e28eb4fe5137f777fe41a8635eb
3
+ size 27574272
params_shard_30.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e849a70b538ec74764aa680b0d8200a5aebdc02e3e9ae644bf7ed7d1c2d040f
3
+ size 92274688
params_shard_31.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20dd6e4736327ea3caef14a8e0d60e28f5b5bbeaef238956808a42696545d347
3
+ size 29279232
params_shard_32.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bf5c41861c40855efccda07d3faa085aed92e10f03c03df2dfabb988e7c7b61
3
+ size 184549376
params_shard_33.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1537f1711104756e4fb15ad07984e7f49a0be21c71d4e49e83e86b47a4a25020
3
+ size 23068672
params_shard_34.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3a81af774a839ec99cfbc322c60efa4449a6880137ef24f7c056e627a2115b5f
3
+ size 92274688
params_shard_35.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:57c077d75d1fdaaeba8fee16f56b869d523bc633b9bb84e54ec3a4d9f1f2f04e
3
+ size 29279232
params_shard_36.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd90499714d1a9771cf56175635806b64249a76df407377d56341d4a1c8fa480
3
+ size 184549376
params_shard_37.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f3a35f81f6d0be11b2146b10881fef440ab4b55099a13d4007f6c867a8e03be2
3
+ size 23068672
params_shard_38.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aecdcdb48971c2534f73292546a0dd5b93d27cead604c44eb71ae97b0c16bae6
3
+ size 92274688
params_shard_39.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:503849d08889f8b1c20e5a3e3932e6683cc9c0cd561d492c12f28033ced3e704
3
+ size 29279232
params_shard_4.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:334389ad9bfb6054dd1feb9f2daf189031b89d86b9aa44382a59148b80c98bd7
3
+ size 184549376
params_shard_40.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:490276df5068a06831a20716be0ae9fccbce68fd1a534bbf8c7e8aa27ae12f3a
3
+ size 184549376
params_shard_41.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:509db06593ffbb2ce5dbcd355e419cffb80092d82245afc56f283bb74c3e6d58
3
+ size 23068672
params_shard_42.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ad33a56c052ae3dc0b5d5adddd4a16c1b9b9d36624a590d83a5a32741c3a593
3
+ size 92274688
params_shard_43.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03935f41332b8f435c2257044ebe3c647c83c5bfcfe40344ab849820214f37cb
3
+ size 29279232