riczhou committed on
Commit
e7a8437
·
verified ·
1 Parent(s): a327d4e

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "<image_soft_token>": 262144
3
+ }
mlc-chat-config.json ADDED
@@ -0,0 +1,99 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "version": "0.1.0",
3
+ "model_type": "gemma3",
4
+ "quantization": "q0bf16",
5
+ "model_config": {
6
+ "text_config": {
7
+ "hidden_size": 3840,
8
+ "intermediate_size": 15360,
9
+ "num_hidden_layers": 48,
10
+ "attention_bias": false,
11
+ "num_attention_heads": 16,
12
+ "num_key_value_heads": 8,
13
+ "head_dim": 256,
14
+ "rms_norm_eps": 1e-06,
15
+ "hidden_activation": "gelu_pytorch_tanh",
16
+ "position_embedding_base": 10000,
17
+ "context_window_size": 8192,
18
+ "prefill_chunk_size": 8192,
19
+ "query_pre_attn_scalar": 256,
20
+ "sliding_window": 1024,
21
+ "kwargs": {
22
+ "model_type": "gemma3_text",
23
+ "rope_scaling": {
24
+ "factor": 8.0,
25
+ "rope_type": "linear"
26
+ }
27
+ }
28
+ },
29
+ "vocab_size": 262208,
30
+ "tensor_parallel_shards": 1,
31
+ "max_batch_size": 128,
32
+ "context_window_size": 8192,
33
+ "sliding_window_size": -1,
34
+ "prefill_chunk_size": 8192,
35
+ "is_text_model": false
36
+ },
37
+ "vocab_size": 262208,
38
+ "context_window_size": 8192,
39
+ "sliding_window_size": -1,
40
+ "prefill_chunk_size": 8192,
41
+ "attention_sink_size": -1,
42
+ "tensor_parallel_shards": 1,
43
+ "pipeline_parallel_stages": 1,
44
+ "temperature": 1.0,
45
+ "presence_penalty": 0.0,
46
+ "frequency_penalty": 0.0,
47
+ "repetition_penalty": 1.0,
48
+ "top_p": 1.0,
49
+ "tokenizer_files": [
50
+ "tokenizer.model",
51
+ "tokenizer.json",
52
+ "added_tokens.json",
53
+ "tokenizer_config.json"
54
+ ],
55
+ "tokenizer_info": {
56
+ "token_postproc_method": "byte_fallback",
57
+ "prepend_space_in_encode": false,
58
+ "strip_space_in_decode": false
59
+ },
60
+ "conv_template": {
61
+ "name": "gemma_instruction",
62
+ "system_template": "{system_message}",
63
+ "system_message": "",
64
+ "system_prefix_token_ids": [
65
+ 2
66
+ ],
67
+ "add_role_after_system_message": true,
68
+ "roles": {
69
+ "user": "<start_of_turn>user",
70
+ "assistant": "<start_of_turn>model"
71
+ },
72
+ "role_templates": {
73
+ "user": "{user_message}",
74
+ "assistant": "{assistant_message}",
75
+ "tool": "{tool_message}"
76
+ },
77
+ "messages": [],
78
+ "seps": [
79
+ "<end_of_turn>\n"
80
+ ],
81
+ "role_content_sep": "\n",
82
+ "role_empty_sep": "\n",
83
+ "stop_str": [
84
+ "<end_of_turn>"
85
+ ],
86
+ "stop_token_ids": [
87
+ 1,
88
+ 106
89
+ ],
90
+ "function_string": "",
91
+ "use_function_calling": false
92
+ },
93
+ "pad_token_id": 0,
94
+ "bos_token_id": 2,
95
+ "eos_token_id": [
96
+ 1,
97
+ 106
98
+ ]
99
+ }
ndarray-cache.json ADDED
The diff for this file is too large to render. See raw diff
 
params_shard_0.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cdc61e6e8c46552326bdd0f45f8e906788f8b8adc9abdadf8452b6137158f43
3
+ size 2013757440
params_shard_1.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01f7821e986950a1cb851b024b29c79efdd4046876620900b6a0279dd9bb5039
3
+ size 117964800
params_shard_10.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7926fb6b21053f03ba0b89ab024b1ff5aefb244740ad34708582f29f778c87e
3
+ size 117964800
params_shard_100.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:005f1d7a42101cb8d610e95c0cb3edcc4f28c13206f910851b56d971afb5c07e
3
+ size 117964800
params_shard_101.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f901c7ffa59de593782b7443268ddd46fa18838846936d665017e3101be37837
3
+ size 235929600
params_shard_102.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:997c265f191935dc920706baedaf0d85db35fc069420088931760a36b5604be0
3
+ size 31489024
params_shard_103.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6ec0e699adf1f1ec3437482c042576280cd5477d40e717d39b3f9f3b1c150496
3
+ size 31457280
params_shard_104.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d39eee7837d0095633af07722dbfbe64d6c43899703b6da89b384c987ad98c2a
3
+ size 31457280
params_shard_105.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18baed78ecf1ae623404c33d87e615b4f0ded5745b6a084db3c0f5a93322f932
3
+ size 117964800
params_shard_106.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2daf75386c8ad8582a3d04442ef3678e034d2deb04e3aa1fd4dcb09a91254ced
3
+ size 235929600
params_shard_107.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80cc4d7b2cb77fd8dfcf392b016a5665a3cad903e3dd3e99679ee612f087038d
3
+ size 31489024
params_shard_108.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f832e6b5811207f2f028911e6c23df7a6d2798672130377fd85b98c3c1ab21d
3
+ size 31457280
params_shard_109.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82d8c565e943bee47933aeebc50afbdb3d31036879e60b5ecb31232623f32b5a
3
+ size 31457280
params_shard_11.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ad5937ecda487b9be7a75b113b7de99f631dd2dbbca7e42cb39122acaeece99a
3
+ size 235929600
params_shard_110.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c1de89ba20ae2f6caa24f3e3aed7659184d017d7baaa43a3f547a05931788fa5
3
+ size 117964800
params_shard_111.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:097bd99b9bfcd6d2750b30b8c3e2ff97d21afa2c64f0f1669356492f945f538e
3
+ size 235929600
params_shard_112.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88ce82e8784b7b74c8f4bc5811f712c7858dfb8e28b211f023deca43c57c8f9b
3
+ size 31489024
params_shard_113.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8f3e775b85b14eab6be9e4a530ee63dc4abb6d800ba2ef5ae26fe738989e854
3
+ size 31457280
params_shard_114.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25f635140a2c838c49d6e3285e249967a90374aaf0beeb912e0cc380f07adc07
3
+ size 31457280
params_shard_115.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1307ee98cc9b002e433d821e0364ca37ce8e6d066cdb6b110167ae45924acffe
3
+ size 117964800
params_shard_116.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7aea866e5ae733d994a66511cb8a767802a90a5f9e62342e9afb051b8c5264fc
3
+ size 235929600
params_shard_117.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:157bd14eb00b1b1708b8e52dfcd02eab10361f1e651caa72947448556246c3e4
3
+ size 31489024
params_shard_118.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e149c2b96ff53882260bd18d237b77bec481c2c073ea5750db71bc7e642c8654
3
+ size 31457280
params_shard_119.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8149a1d1f26a7a8fe63a72f6935837e7d391546b792a2c52b47add179cc7185
3
+ size 31457280
params_shard_12.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:03540367e7c8e898da5c952f839dcbf342d2efefb5928c31f8d3afe45353631b
3
+ size 31489024
params_shard_120.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8a1a373f48232f94a30a9bd39359eb9056d34059b12c94ace91756cef772a31
3
+ size 117964800
params_shard_121.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89722d2678957ef529eaf0894dce64fbdb8ad68a2a2db463ee007af1eeda5fcc
3
+ size 235929600
params_shard_122.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:adf72218987252cce754f3f8942746f331ced5276d3e7561713d87edcbbf18f2
3
+ size 31489024
params_shard_123.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c0bd26446133800430be5a739457cc19deaaae9df14f321b8781151a9662680e
3
+ size 31457280
params_shard_124.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81994fc829d68acfbb1188cbe71d34dbe64386a25491a024e59f39b599634af5
3
+ size 31457280
params_shard_125.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b6e2c4fd716ec7780a1dc0ffc5de99641a2ea2e47a4cde36e4c81ef619c79e2
3
+ size 117964800
params_shard_126.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eabe6e409e4b6ee1b9fed59b790bbe7588511444f1442560b08c09dc46b7cb7a
3
+ size 235929600
params_shard_127.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cacef8490d1165d740cdb7d7b81855669f05cd3f77f65abe3c06be5337df3537
3
+ size 31489024
params_shard_128.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:097551450fb857a3159e8d533b553abe92878ecdf2264d245dd7e0cff8b6a086
3
+ size 31457280
params_shard_129.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5337b8e28539dfc0326cf32c4872da596c708c4fb2606bde2d4ee4451fcbd99
3
+ size 31457280
params_shard_13.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ce551ff40fe091f490d8f0bc384311be3dec6861e82ca50d4dbadb365fbe6dcb
3
+ size 31457280
params_shard_130.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f587a3d9de5fb8ba0b58f7d81d6d280fda1fa1f491fb7eff80912e15e1c5bf0
3
+ size 235929600
params_shard_131.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b83f044869e1f1255ce9889f8ced631885b10529683ba1c6665bdd6f1094746a
3
+ size 31458304
params_shard_132.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fe8d40ef8c4da3b33f83e5a5bf9d309499748d2dfc7c23a1426f314c277a8d6e
3
+ size 31457280
params_shard_133.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4e11c69e148143720d2e5d7440dbb33445d53503b2dc1fb6e6f786ebdfab584
3
+ size 31457280
params_shard_134.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:561c31a94a7b6492860863d5609575f062cb3114bc7213456c962f9646cb202c
3
+ size 117964800
params_shard_135.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cb996ff6012765476c9e43730493f64a6a6fa83ed2ecc8b048e5dc960cf3b64
3
+ size 117964800
params_shard_136.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ef2b93f159943dd8f4a7f5bf4eb9950db7eff6cdd702446fe6983cc300a6a64
3
+ size 235929600
params_shard_137.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4450d959fd9b91b1fbc3d51af7b2fcb799df052a06229011862b23ec40b41460
3
+ size 31519744
params_shard_138.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00771522ac672462678dc4736693aa02cdedc7bb10c72307dd73e83e475b8c76
3
+ size 31457280
params_shard_139.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7cb6e7aaffcf4ec0392baeac40927bcc485973fd07121dc49e4426fad932bd72
3
+ size 31457280