riczhou committed on
Commit
963a0cd
·
verified ·
1 Parent(s): 63f1da5

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "<image_soft_token>": 262144
3
+ }
mlc-chat-config.json ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "gemma3",
4
+ "quantization": "q0f32",
5
+ "model_config": {
6
+ "text_config": {
7
+ "hidden_size": 5376,
8
+ "intermediate_size": 21504,
9
+ "num_hidden_layers": 62,
10
+ "attention_bias": false,
11
+ "num_attention_heads": 32,
12
+ "num_key_value_heads": 16,
13
+ "head_dim": 128,
14
+ "rms_norm_eps": 1e-06,
15
+ "hidden_activation": "gelu_pytorch_tanh",
16
+ "position_embedding_base": 10000,
17
+ "context_window_size": 8192,
18
+ "prefill_chunk_size": 8192,
19
+ "query_pre_attn_scalar": 168,
20
+ "sliding_window": 1024,
21
+ "kwargs": {
22
+ "model_type": "gemma3_text",
23
+ "rope_scaling": {
24
+ "factor": 8.0,
25
+ "rope_type": "linear"
26
+ }
27
+ }
28
+ },
29
+ "vocab_size": 262208,
30
+ "tensor_parallel_shards": 1,
31
+ "max_batch_size": 128,
32
+ "context_window_size": 8192,
33
+ "sliding_window_size": -1,
34
+ "prefill_chunk_size": 8192,
35
+ "is_text_model": false
36
+ },
37
+ "vocab_size": 262208,
38
+ "context_window_size": 8192,
39
+ "sliding_window_size": -1,
40
+ "prefill_chunk_size": 8192,
41
+ "attention_sink_size": -1,
42
+ "tensor_parallel_shards": 1,
43
+ "pipeline_parallel_stages": 1,
44
+ "temperature": 1.0,
45
+ "presence_penalty": 0.0,
46
+ "frequency_penalty": 0.0,
47
+ "repetition_penalty": 1.0,
48
+ "top_p": 0.95,
49
+ "tokenizer_files": [
50
+ "tokenizer.model",
51
+ "tokenizer.json",
52
+ "added_tokens.json",
53
+ "tokenizer_config.json"
54
+ ],
55
+ "tokenizer_info": {
56
+ "token_postproc_method": "byte_fallback",
57
+ "prepend_space_in_encode": false,
58
+ "strip_space_in_decode": false
59
+ },
60
+ "conv_template": {
61
+ "name": "gemma_instruction",
62
+ "system_template": "{system_message}",
63
+ "system_message": "",
64
+ "system_prefix_token_ids": [
65
+ 2
66
+ ],
67
+ "add_role_after_system_message": true,
68
+ "roles": {
69
+ "user": "<start_of_turn>user",
70
+ "assistant": "<start_of_turn>model"
71
+ },
72
+ "role_templates": {
73
+ "user": "{user_message}",
74
+ "assistant": "{assistant_message}",
75
+ "tool": "{tool_message}"
76
+ },
77
+ "messages": [],
78
+ "seps": [
79
+ "<end_of_turn>\n"
80
+ ],
81
+ "role_content_sep": "\n",
82
+ "role_empty_sep": "\n",
83
+ "stop_str": [
84
+ "<end_of_turn>"
85
+ ],
86
+ "stop_token_ids": [
87
+ 1,
88
+ 106
89
+ ],
90
+ "function_string": "",
91
+ "use_function_calling": false
92
+ },
93
+ "pad_token_id": 0,
94
+ "bos_token_id": 2,
95
+ "eos_token_id": [
96
+ 1,
97
+ 106
98
+ ]
99
+ }
ndarray-cache-b16.json ADDED
The diff for this file is too large to render. See raw diff
 
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:956bea43ffd41cfbe994fc946afa939848903a224d4259687caa9ea10fcacee1
3
+ size 2819260416
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:77c8bff8512e36b6d826d4b4c71a2e2208c32663e78531a699b3744c166f2407
3
+ size 231211008
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ceb704b252bf8f621831508ee8ff8c032dc93a378aa707f7ed198c056e028f7c
3
+ size 22020096
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f40727de772da7848ab91fa7309eab07ca60c88adc4e86b22320bd147e631b9
3
+ size 44040192
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20de1d74151edcd184ca0e0538eb37dd709e2df6eae10430b0072b8e96498c8b
3
+ size 22020096
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9efca4514bd6273d819a3d9390d8555d00f2d491be86a104913d248ba1cd5b09
3
+ size 231211008
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e3a3431b97440b3c872d68e3794439bd4dd36b53e5ebf7fdcfe60139d512f4f
3
+ size 462422016
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf60b587c11118f8f6cb70d4efb6326282a97f22641eddcdd849342d5c42b375
3
+ size 22020096
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7babdba80584b38efaee95094eeb451ba7dc698964684fe35c9b59477e5095ba
3
+ size 44040192
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a3c680f0e541525dd47f31b1fa733c73274e4cf3231622c15a1266c942f9e60c
3
+ size 44040192
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eab3d65eee12bd4ba9eb8e9ad8fd864ee7ae55128503ab9904fa5d6e3d5beecb
3
+ size 22020096
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ad766223d2d32908bc3baa13e34c5a7cedc39784f636def6c4029aa80db2fcd
3
+ size 231211008
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f94fa6de84325ca1d98298e1c96edcc2e15e51cb40953bf3d123ad4abd2c6c1
3
+ size 462422016
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c3746323772979da387aa8878c6733cef9f040c5cd985ec46a71fb697840b0b
3
+ size 231211008
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02f8464908884043ad8072f7940297b45bd9be51d21c1b7284818e5a74fe6d01
3
+ size 22020096
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6d88f4660fa5bced9613296be17eac50df8b6afd42251753ade9c1766a579b7e
3
+ size 44040192
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7a9be42ff50e155bbbfd4ccdb1ad96f5aaf4ca5a141af614b5ce7581c9ab5a72
3
+ size 44040192
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e3bf9f09c0c2e4baade972eec82c07ad5c9c4549b882179bd7362dfc15a712fe
3
+ size 22020096
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:96b5d1d61cb407f7591e30886beec7577cc9dc28e0cf0d39f76688ccd1b2eeaf
3
+ size 462422016
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:250df95870a41bd6c5d718c11d13c8dcf4b58965949db4263beff18c7675cb0b
3
+ size 22020096
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:754550356615daf341015669739da15178bf224ab09b46874ae570352cc09fa2
3
+ size 44040192
params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5b04787b94558add239989acdbcd2b2bae6afe9bde6a47154cc9225ae626b329
3
+ size 44040192
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8ae37920f3cbb56f5a8905aa155c5bc8288f09a78142af694c6f8e0642bd4fc
3
+ size 22020096
params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c05e2220f331f47bbe0c6bea085119a8ecf65004632755937ac97407013e8f9
3
+ size 231211008
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28760469b76b1d0e20911f3ee168b2e812556f2f1e69008caa83718fb1722787
3
+ size 231211008
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:15650b1335e3ce8c5a2745c6db6d0e33becf16e29d3194a70555758a38aa126a
3
+ size 231211008
params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d93d5769e74e5a3936065bcd916cd299628ea358e24c89c4ecdcd80bdd5d80a4
3
+ size 462422016
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8bc11d9640cdeb10c768a1ec92e5780edd62ae2832cab2b5a7f686d89a5c124
3
+ size 22020096
params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a09cad7198c7de7b72f7e6927a459b3a2624b7fd9b70c8e894832f162c2c47a
3
+ size 44040192
params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a6b5e8d5f96ba27b8406acc1e6462c09461ef60fe54442011d80b4e98d3e017
3
+ size 44040192
params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d1acdab22f8e30a3b2a96a612eaf222c7ef2ad8ab0db81c3492760dbc0ae241
3
+ size 22020096
params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff2763b8147048dcfa2c28471b1f0af2d15ab95b481499467d6012d504a30700
3
+ size 231211008
params_shard_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:579a07475453490914ef4aff81ce4c79fd03752770f816320edfb93213832783
3
+ size 462422016
params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d37ebc444434bada0ad09e5d5cf671b92833cb3b62adb565d6618e678971045
3
+ size 22020096
params_shard_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a45c4d07a741f3a4edf52d79215f062e8469299fd5c25841de31b5ac70e91fd
3
+ size 44040192
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c70f22e9d6a1971e9faacecd95fe03dfb198afc1bf5178a907525dbe2092b01d
3
+ size 462422016
params_shard_130.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8824c30e047cbd0b9452846a0f53c81e13397bb3c6e70bbebc9c01066b2241fa
3
+ size 44040192
params_shard_131.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:50b52ce54e5322d456a344a880428bdcd375f808fbacf738f08f6b66ff4f018b
3
+ size 22020096
params_shard_132.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:602356317ffc5fd46dd4b58ffda1b04bf7ccdea4ff7e5047703df13fdcc3db83
3
+ size 231211008
params_shard_133.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3ff94319d22ad417e1d2b9731743e61ad8488e3abf8390960fe157f22ceb856d
3
+ size 462422016
params_shard_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eacd23aae203a2661bb16ada469417d5b4caad424e4558b576b915fed285e73a
3
+ size 22020096
params_shard_135.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:254d852452343fee2522ecc63da0ca3fc2714817c72fa1cecd48a11d6bad71ca
3
+ size 44040192
params_shard_136.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:07aa7eaeb96d109a0861e45b380efee308d97b553faf86f1bb22fda737bd60d8
3
+ size 44040192
params_shard_137.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ff943433b3ead3d2702b4c704e58b69bf018a118045419a7b81add5148ce63ce
3
+ size 22020096
params_shard_138.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3bcd91340a2b603f33b0b417d48a6962c9d83fddf58c7bc5398a6fc8678e626f
3
+ size 231211008