Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- added_tokens.json +3 -0
- mlc-chat-config.json +99 -0
- ndarray-cache-b16.json +0 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
added_tokens.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<image_soft_token>": 262144
|
3 |
+
}
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,99 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "gemma3",
|
4 |
+
"quantization": "q0f32",
|
5 |
+
"model_config": {
|
6 |
+
"text_config": {
|
7 |
+
"hidden_size": 5376,
|
8 |
+
"intermediate_size": 21504,
|
9 |
+
"num_hidden_layers": 62,
|
10 |
+
"attention_bias": false,
|
11 |
+
"num_attention_heads": 32,
|
12 |
+
"num_key_value_heads": 16,
|
13 |
+
"head_dim": 128,
|
14 |
+
"rms_norm_eps": 1e-06,
|
15 |
+
"hidden_activation": "gelu_pytorch_tanh",
|
16 |
+
"position_embedding_base": 10000,
|
17 |
+
"context_window_size": 8192,
|
18 |
+
"prefill_chunk_size": 8192,
|
19 |
+
"query_pre_attn_scalar": 168,
|
20 |
+
"sliding_window": 1024,
|
21 |
+
"kwargs": {
|
22 |
+
"model_type": "gemma3_text",
|
23 |
+
"rope_scaling": {
|
24 |
+
"factor": 8.0,
|
25 |
+
"rope_type": "linear"
|
26 |
+
}
|
27 |
+
}
|
28 |
+
},
|
29 |
+
"vocab_size": 262208,
|
30 |
+
"tensor_parallel_shards": 1,
|
31 |
+
"max_batch_size": 128,
|
32 |
+
"context_window_size": 8192,
|
33 |
+
"sliding_window_size": -1,
|
34 |
+
"prefill_chunk_size": 8192,
|
35 |
+
"is_text_model": false
|
36 |
+
},
|
37 |
+
"vocab_size": 262208,
|
38 |
+
"context_window_size": 8192,
|
39 |
+
"sliding_window_size": -1,
|
40 |
+
"prefill_chunk_size": 8192,
|
41 |
+
"attention_sink_size": -1,
|
42 |
+
"tensor_parallel_shards": 1,
|
43 |
+
"pipeline_parallel_stages": 1,
|
44 |
+
"temperature": 1.0,
|
45 |
+
"presence_penalty": 0.0,
|
46 |
+
"frequency_penalty": 0.0,
|
47 |
+
"repetition_penalty": 1.0,
|
48 |
+
"top_p": 0.95,
|
49 |
+
"tokenizer_files": [
|
50 |
+
"tokenizer.model",
|
51 |
+
"tokenizer.json",
|
52 |
+
"added_tokens.json",
|
53 |
+
"tokenizer_config.json"
|
54 |
+
],
|
55 |
+
"tokenizer_info": {
|
56 |
+
"token_postproc_method": "byte_fallback",
|
57 |
+
"prepend_space_in_encode": false,
|
58 |
+
"strip_space_in_decode": false
|
59 |
+
},
|
60 |
+
"conv_template": {
|
61 |
+
"name": "gemma_instruction",
|
62 |
+
"system_template": "{system_message}",
|
63 |
+
"system_message": "",
|
64 |
+
"system_prefix_token_ids": [
|
65 |
+
2
|
66 |
+
],
|
67 |
+
"add_role_after_system_message": true,
|
68 |
+
"roles": {
|
69 |
+
"user": "<start_of_turn>user",
|
70 |
+
"assistant": "<start_of_turn>model"
|
71 |
+
},
|
72 |
+
"role_templates": {
|
73 |
+
"user": "{user_message}",
|
74 |
+
"assistant": "{assistant_message}",
|
75 |
+
"tool": "{tool_message}"
|
76 |
+
},
|
77 |
+
"messages": [],
|
78 |
+
"seps": [
|
79 |
+
"<end_of_turn>\n"
|
80 |
+
],
|
81 |
+
"role_content_sep": "\n",
|
82 |
+
"role_empty_sep": "\n",
|
83 |
+
"stop_str": [
|
84 |
+
"<end_of_turn>"
|
85 |
+
],
|
86 |
+
"stop_token_ids": [
|
87 |
+
1,
|
88 |
+
107
|
89 |
+
],
|
90 |
+
"function_string": "",
|
91 |
+
"use_function_calling": false
|
92 |
+
},
|
93 |
+
"pad_token_id": 0,
|
94 |
+
"bos_token_id": 2,
|
95 |
+
"eos_token_id": [
|
96 |
+
1,
|
97 |
+
106
|
98 |
+
]
|
99 |
+
}
|
ndarray-cache-b16.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:956bea43ffd41cfbe994fc946afa939848903a224d4259687caa9ea10fcacee1
|
3 |
+
size 2819260416
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77c8bff8512e36b6d826d4b4c71a2e2208c32663e78531a699b3744c166f2407
|
3 |
+
size 231211008
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ceb704b252bf8f621831508ee8ff8c032dc93a378aa707f7ed198c056e028f7c
|
3 |
+
size 22020096
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f40727de772da7848ab91fa7309eab07ca60c88adc4e86b22320bd147e631b9
|
3 |
+
size 44040192
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:20de1d74151edcd184ca0e0538eb37dd709e2df6eae10430b0072b8e96498c8b
|
3 |
+
size 22020096
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9efca4514bd6273d819a3d9390d8555d00f2d491be86a104913d248ba1cd5b09
|
3 |
+
size 231211008
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5e3a3431b97440b3c872d68e3794439bd4dd36b53e5ebf7fdcfe60139d512f4f
|
3 |
+
size 462422016
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf60b587c11118f8f6cb70d4efb6326282a97f22641eddcdd849342d5c42b375
|
3 |
+
size 22020096
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7babdba80584b38efaee95094eeb451ba7dc698964684fe35c9b59477e5095ba
|
3 |
+
size 44040192
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a3c680f0e541525dd47f31b1fa733c73274e4cf3231622c15a1266c942f9e60c
|
3 |
+
size 44040192
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eab3d65eee12bd4ba9eb8e9ad8fd864ee7ae55128503ab9904fa5d6e3d5beecb
|
3 |
+
size 22020096
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ad766223d2d32908bc3baa13e34c5a7cedc39784f636def6c4029aa80db2fcd
|
3 |
+
size 231211008
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f94fa6de84325ca1d98298e1c96edcc2e15e51cb40953bf3d123ad4abd2c6c1
|
3 |
+
size 462422016
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c3746323772979da387aa8878c6733cef9f040c5cd985ec46a71fb697840b0b
|
3 |
+
size 231211008
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02f8464908884043ad8072f7940297b45bd9be51d21c1b7284818e5a74fe6d01
|
3 |
+
size 22020096
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6d88f4660fa5bced9613296be17eac50df8b6afd42251753ade9c1766a579b7e
|
3 |
+
size 44040192
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7a9be42ff50e155bbbfd4ccdb1ad96f5aaf4ca5a141af614b5ce7581c9ab5a72
|
3 |
+
size 44040192
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e3bf9f09c0c2e4baade972eec82c07ad5c9c4549b882179bd7362dfc15a712fe
|
3 |
+
size 22020096
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96b5d1d61cb407f7591e30886beec7577cc9dc28e0cf0d39f76688ccd1b2eeaf
|
3 |
+
size 462422016
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:250df95870a41bd6c5d718c11d13c8dcf4b58965949db4263beff18c7675cb0b
|
3 |
+
size 22020096
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:754550356615daf341015669739da15178bf224ab09b46874ae570352cc09fa2
|
3 |
+
size 44040192
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5b04787b94558add239989acdbcd2b2bae6afe9bde6a47154cc9225ae626b329
|
3 |
+
size 44040192
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8ae37920f3cbb56f5a8905aa155c5bc8288f09a78142af694c6f8e0642bd4fc
|
3 |
+
size 22020096
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c05e2220f331f47bbe0c6bea085119a8ecf65004632755937ac97407013e8f9
|
3 |
+
size 231211008
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:28760469b76b1d0e20911f3ee168b2e812556f2f1e69008caa83718fb1722787
|
3 |
+
size 231211008
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15650b1335e3ce8c5a2745c6db6d0e33becf16e29d3194a70555758a38aa126a
|
3 |
+
size 231211008
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d93d5769e74e5a3936065bcd916cd299628ea358e24c89c4ecdcd80bdd5d80a4
|
3 |
+
size 462422016
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8bc11d9640cdeb10c768a1ec92e5780edd62ae2832cab2b5a7f686d89a5c124
|
3 |
+
size 22020096
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a09cad7198c7de7b72f7e6927a459b3a2624b7fd9b70c8e894832f162c2c47a
|
3 |
+
size 44040192
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a6b5e8d5f96ba27b8406acc1e6462c09461ef60fe54442011d80b4e98d3e017
|
3 |
+
size 44040192
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d1acdab22f8e30a3b2a96a612eaf222c7ef2ad8ab0db81c3492760dbc0ae241
|
3 |
+
size 22020096
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff2763b8147048dcfa2c28471b1f0af2d15ab95b481499467d6012d504a30700
|
3 |
+
size 231211008
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:579a07475453490914ef4aff81ce4c79fd03752770f816320edfb93213832783
|
3 |
+
size 462422016
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d37ebc444434bada0ad09e5d5cf671b92833cb3b62adb565d6618e678971045
|
3 |
+
size 22020096
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1a45c4d07a741f3a4edf52d79215f062e8469299fd5c25841de31b5ac70e91fd
|
3 |
+
size 44040192
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c70f22e9d6a1971e9faacecd95fe03dfb198afc1bf5178a907525dbe2092b01d
|
3 |
+
size 462422016
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8824c30e047cbd0b9452846a0f53c81e13397bb3c6e70bbebc9c01066b2241fa
|
3 |
+
size 44040192
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50b52ce54e5322d456a344a880428bdcd375f808fbacf738f08f6b66ff4f018b
|
3 |
+
size 22020096
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:602356317ffc5fd46dd4b58ffda1b04bf7ccdea4ff7e5047703df13fdcc3db83
|
3 |
+
size 231211008
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3ff94319d22ad417e1d2b9731743e61ad8488e3abf8390960fe157f22ceb856d
|
3 |
+
size 462422016
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eacd23aae203a2661bb16ada469417d5b4caad424e4558b576b915fed285e73a
|
3 |
+
size 22020096
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:254d852452343fee2522ecc63da0ca3fc2714817c72fa1cecd48a11d6bad71ca
|
3 |
+
size 44040192
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07aa7eaeb96d109a0861e45b380efee308d97b553faf86f1bb22fda737bd60d8
|
3 |
+
size 44040192
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ff943433b3ead3d2702b4c704e58b69bf018a118045419a7b81add5148ce63ce
|
3 |
+
size 22020096
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3bcd91340a2b603f33b0b417d48a6962c9d83fddf58c7bc5398a6fc8678e626f
|
3 |
+
size 231211008
|