Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +1 -0
- added_tokens.json +3 -0
- mlc-chat-config.json +99 -0
- ndarray-cache.json +0 -0
- params_shard_0.bin +3 -0
- params_shard_1.bin +3 -0
- params_shard_10.bin +3 -0
- params_shard_100.bin +3 -0
- params_shard_101.bin +3 -0
- params_shard_102.bin +3 -0
- params_shard_103.bin +3 -0
- params_shard_104.bin +3 -0
- params_shard_105.bin +3 -0
- params_shard_106.bin +3 -0
- params_shard_107.bin +3 -0
- params_shard_108.bin +3 -0
- params_shard_109.bin +3 -0
- params_shard_11.bin +3 -0
- params_shard_110.bin +3 -0
- params_shard_111.bin +3 -0
- params_shard_112.bin +3 -0
- params_shard_113.bin +3 -0
- params_shard_114.bin +3 -0
- params_shard_115.bin +3 -0
- params_shard_116.bin +3 -0
- params_shard_117.bin +3 -0
- params_shard_118.bin +3 -0
- params_shard_119.bin +3 -0
- params_shard_12.bin +3 -0
- params_shard_120.bin +3 -0
- params_shard_121.bin +3 -0
- params_shard_122.bin +3 -0
- params_shard_123.bin +3 -0
- params_shard_124.bin +3 -0
- params_shard_125.bin +3 -0
- params_shard_126.bin +3 -0
- params_shard_127.bin +3 -0
- params_shard_128.bin +3 -0
- params_shard_129.bin +3 -0
- params_shard_13.bin +3 -0
- params_shard_130.bin +3 -0
- params_shard_131.bin +3 -0
- params_shard_132.bin +3 -0
- params_shard_133.bin +3 -0
- params_shard_134.bin +3 -0
- params_shard_135.bin +3 -0
- params_shard_136.bin +3 -0
- params_shard_137.bin +3 -0
- params_shard_138.bin +3 -0
- params_shard_139.bin +3 -0
.gitattributes
CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
tokenizer.json filter=lfs diff=lfs merge=lfs -text
|
added_tokens.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"<image_soft_token>": 262144
|
3 |
+
}
|
mlc-chat-config.json
ADDED
@@ -0,0 +1,99 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"version": "0.1.0",
|
3 |
+
"model_type": "gemma3",
|
4 |
+
"quantization": "q0bf16",
|
5 |
+
"model_config": {
|
6 |
+
"text_config": {
|
7 |
+
"hidden_size": 3840,
|
8 |
+
"intermediate_size": 15360,
|
9 |
+
"num_hidden_layers": 48,
|
10 |
+
"attention_bias": false,
|
11 |
+
"num_attention_heads": 16,
|
12 |
+
"num_key_value_heads": 8,
|
13 |
+
"head_dim": 256,
|
14 |
+
"rms_norm_eps": 1e-06,
|
15 |
+
"hidden_activation": "gelu_pytorch_tanh",
|
16 |
+
"position_embedding_base": 10000,
|
17 |
+
"context_window_size": 8192,
|
18 |
+
"prefill_chunk_size": 8192,
|
19 |
+
"query_pre_attn_scalar": 256,
|
20 |
+
"sliding_window": 1024,
|
21 |
+
"kwargs": {
|
22 |
+
"model_type": "gemma3_text",
|
23 |
+
"rope_scaling": {
|
24 |
+
"factor": 8.0,
|
25 |
+
"rope_type": "linear"
|
26 |
+
}
|
27 |
+
}
|
28 |
+
},
|
29 |
+
"vocab_size": 262208,
|
30 |
+
"tensor_parallel_shards": 1,
|
31 |
+
"max_batch_size": 128,
|
32 |
+
"context_window_size": 8192,
|
33 |
+
"sliding_window_size": -1,
|
34 |
+
"prefill_chunk_size": 8192,
|
35 |
+
"is_text_model": false
|
36 |
+
},
|
37 |
+
"vocab_size": 262208,
|
38 |
+
"context_window_size": 8192,
|
39 |
+
"sliding_window_size": -1,
|
40 |
+
"prefill_chunk_size": 8192,
|
41 |
+
"attention_sink_size": -1,
|
42 |
+
"tensor_parallel_shards": 1,
|
43 |
+
"pipeline_parallel_stages": 1,
|
44 |
+
"temperature": 1.0,
|
45 |
+
"presence_penalty": 0.0,
|
46 |
+
"frequency_penalty": 0.0,
|
47 |
+
"repetition_penalty": 1.0,
|
48 |
+
"top_p": 1.0,
|
49 |
+
"tokenizer_files": [
|
50 |
+
"tokenizer.model",
|
51 |
+
"tokenizer.json",
|
52 |
+
"added_tokens.json",
|
53 |
+
"tokenizer_config.json"
|
54 |
+
],
|
55 |
+
"tokenizer_info": {
|
56 |
+
"token_postproc_method": "byte_fallback",
|
57 |
+
"prepend_space_in_encode": false,
|
58 |
+
"strip_space_in_decode": false
|
59 |
+
},
|
60 |
+
"conv_template": {
|
61 |
+
"name": "gemma_instruction",
|
62 |
+
"system_template": "{system_message}",
|
63 |
+
"system_message": "",
|
64 |
+
"system_prefix_token_ids": [
|
65 |
+
2
|
66 |
+
],
|
67 |
+
"add_role_after_system_message": true,
|
68 |
+
"roles": {
|
69 |
+
"user": "<start_of_turn>user",
|
70 |
+
"assistant": "<start_of_turn>model"
|
71 |
+
},
|
72 |
+
"role_templates": {
|
73 |
+
"user": "{user_message}",
|
74 |
+
"assistant": "{assistant_message}",
|
75 |
+
"tool": "{tool_message}"
|
76 |
+
},
|
77 |
+
"messages": [],
|
78 |
+
"seps": [
|
79 |
+
"<end_of_turn>\n"
|
80 |
+
],
|
81 |
+
"role_content_sep": "\n",
|
82 |
+
"role_empty_sep": "\n",
|
83 |
+
"stop_str": [
|
84 |
+
"<end_of_turn>"
|
85 |
+
],
|
86 |
+
"stop_token_ids": [
|
87 |
+
1,
|
88 |
+
107
|
89 |
+
],
|
90 |
+
"function_string": "",
|
91 |
+
"use_function_calling": false
|
92 |
+
},
|
93 |
+
"pad_token_id": 0,
|
94 |
+
"bos_token_id": 2,
|
95 |
+
"eos_token_id": [
|
96 |
+
1,
|
97 |
+
106
|
98 |
+
]
|
99 |
+
}
|
ndarray-cache.json
ADDED
The diff for this file is too large to render.
See raw diff
|
|
params_shard_0.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cdc61e6e8c46552326bdd0f45f8e906788f8b8adc9abdadf8452b6137158f43
|
3 |
+
size 2013757440
|
params_shard_1.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01f7821e986950a1cb851b024b29c79efdd4046876620900b6a0279dd9bb5039
|
3 |
+
size 117964800
|
params_shard_10.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f7926fb6b21053f03ba0b89ab024b1ff5aefb244740ad34708582f29f778c87e
|
3 |
+
size 117964800
|
params_shard_100.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:005f1d7a42101cb8d610e95c0cb3edcc4f28c13206f910851b56d971afb5c07e
|
3 |
+
size 117964800
|
params_shard_101.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f901c7ffa59de593782b7443268ddd46fa18838846936d665017e3101be37837
|
3 |
+
size 235929600
|
params_shard_102.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:997c265f191935dc920706baedaf0d85db35fc069420088931760a36b5604be0
|
3 |
+
size 31489024
|
params_shard_103.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ec0e699adf1f1ec3437482c042576280cd5477d40e717d39b3f9f3b1c150496
|
3 |
+
size 31457280
|
params_shard_104.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d39eee7837d0095633af07722dbfbe64d6c43899703b6da89b384c987ad98c2a
|
3 |
+
size 31457280
|
params_shard_105.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:18baed78ecf1ae623404c33d87e615b4f0ded5745b6a084db3c0f5a93322f932
|
3 |
+
size 117964800
|
params_shard_106.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2daf75386c8ad8582a3d04442ef3678e034d2deb04e3aa1fd4dcb09a91254ced
|
3 |
+
size 235929600
|
params_shard_107.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:80cc4d7b2cb77fd8dfcf392b016a5665a3cad903e3dd3e99679ee612f087038d
|
3 |
+
size 31489024
|
params_shard_108.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f832e6b5811207f2f028911e6c23df7a6d2798672130377fd85b98c3c1ab21d
|
3 |
+
size 31457280
|
params_shard_109.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82d8c565e943bee47933aeebc50afbdb3d31036879e60b5ecb31232623f32b5a
|
3 |
+
size 31457280
|
params_shard_11.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ad5937ecda487b9be7a75b113b7de99f631dd2dbbca7e42cb39122acaeece99a
|
3 |
+
size 235929600
|
params_shard_110.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c1de89ba20ae2f6caa24f3e3aed7659184d017d7baaa43a3f547a05931788fa5
|
3 |
+
size 117964800
|
params_shard_111.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:097bd99b9bfcd6d2750b30b8c3e2ff97d21afa2c64f0f1669356492f945f538e
|
3 |
+
size 235929600
|
params_shard_112.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88ce82e8784b7b74c8f4bc5811f712c7858dfb8e28b211f023deca43c57c8f9b
|
3 |
+
size 31489024
|
params_shard_113.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8f3e775b85b14eab6be9e4a530ee63dc4abb6d800ba2ef5ae26fe738989e854
|
3 |
+
size 31457280
|
params_shard_114.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25f635140a2c838c49d6e3285e249967a90374aaf0beeb912e0cc380f07adc07
|
3 |
+
size 31457280
|
params_shard_115.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1307ee98cc9b002e433d821e0364ca37ce8e6d066cdb6b110167ae45924acffe
|
3 |
+
size 117964800
|
params_shard_116.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7aea866e5ae733d994a66511cb8a767802a90a5f9e62342e9afb051b8c5264fc
|
3 |
+
size 235929600
|
params_shard_117.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:157bd14eb00b1b1708b8e52dfcd02eab10361f1e651caa72947448556246c3e4
|
3 |
+
size 31489024
|
params_shard_118.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e149c2b96ff53882260bd18d237b77bec481c2c073ea5750db71bc7e642c8654
|
3 |
+
size 31457280
|
params_shard_119.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8149a1d1f26a7a8fe63a72f6935837e7d391546b792a2c52b47add179cc7185
|
3 |
+
size 31457280
|
params_shard_12.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:03540367e7c8e898da5c952f839dcbf342d2efefb5928c31f8d3afe45353631b
|
3 |
+
size 31489024
|
params_shard_120.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a8a1a373f48232f94a30a9bd39359eb9056d34059b12c94ace91756cef772a31
|
3 |
+
size 117964800
|
params_shard_121.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89722d2678957ef529eaf0894dce64fbdb8ad68a2a2db463ee007af1eeda5fcc
|
3 |
+
size 235929600
|
params_shard_122.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:adf72218987252cce754f3f8942746f331ced5276d3e7561713d87edcbbf18f2
|
3 |
+
size 31489024
|
params_shard_123.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0bd26446133800430be5a739457cc19deaaae9df14f321b8781151a9662680e
|
3 |
+
size 31457280
|
params_shard_124.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81994fc829d68acfbb1188cbe71d34dbe64386a25491a024e59f39b599634af5
|
3 |
+
size 31457280
|
params_shard_125.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b6e2c4fd716ec7780a1dc0ffc5de99641a2ea2e47a4cde36e4c81ef619c79e2
|
3 |
+
size 117964800
|
params_shard_126.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eabe6e409e4b6ee1b9fed59b790bbe7588511444f1442560b08c09dc46b7cb7a
|
3 |
+
size 235929600
|
params_shard_127.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cacef8490d1165d740cdb7d7b81855669f05cd3f77f65abe3c06be5337df3537
|
3 |
+
size 31489024
|
params_shard_128.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:097551450fb857a3159e8d533b553abe92878ecdf2264d245dd7e0cff8b6a086
|
3 |
+
size 31457280
|
params_shard_129.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b5337b8e28539dfc0326cf32c4872da596c708c4fb2606bde2d4ee4451fcbd99
|
3 |
+
size 31457280
|
params_shard_13.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ce551ff40fe091f490d8f0bc384311be3dec6861e82ca50d4dbadb365fbe6dcb
|
3 |
+
size 31457280
|
params_shard_130.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f587a3d9de5fb8ba0b58f7d81d6d280fda1fa1f491fb7eff80912e15e1c5bf0
|
3 |
+
size 235929600
|
params_shard_131.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b83f044869e1f1255ce9889f8ced631885b10529683ba1c6665bdd6f1094746a
|
3 |
+
size 31458304
|
params_shard_132.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe8d40ef8c4da3b33f83e5a5bf9d309499748d2dfc7c23a1426f314c277a8d6e
|
3 |
+
size 31457280
|
params_shard_133.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4e11c69e148143720d2e5d7440dbb33445d53503b2dc1fb6e6f786ebdfab584
|
3 |
+
size 31457280
|
params_shard_134.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:561c31a94a7b6492860863d5609575f062cb3114bc7213456c962f9646cb202c
|
3 |
+
size 117964800
|
params_shard_135.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4cb996ff6012765476c9e43730493f64a6a6fa83ed2ecc8b048e5dc960cf3b64
|
3 |
+
size 117964800
|
params_shard_136.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5ef2b93f159943dd8f4a7f5bf4eb9950db7eff6cdd702446fe6983cc300a6a64
|
3 |
+
size 235929600
|
params_shard_137.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4450d959fd9b91b1fbc3d51af7b2fcb799df052a06229011862b23ec40b41460
|
3 |
+
size 31519744
|
params_shard_138.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00771522ac672462678dc4736693aa02cdedc7bb10c72307dd73e83e475b8c76
|
3 |
+
size 31457280
|
params_shard_139.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7cb6e7aaffcf4ec0392baeac40927bcc485973fd07121dc49e4426fad932bd72
|
3 |
+
size 31457280
|