Upload folder using huggingface_hub
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +30 -0
- generation_config.json +6 -0
- model-00001-of-00059.safetensors +3 -0
- model-00002-of-00059.safetensors +3 -0
- model-00003-of-00059.safetensors +3 -0
- model-00004-of-00059.safetensors +3 -0
- model-00005-of-00059.safetensors +3 -0
- model-00006-of-00059.safetensors +3 -0
- model-00007-of-00059.safetensors +3 -0
- model-00008-of-00059.safetensors +3 -0
- model-00009-of-00059.safetensors +3 -0
- model-00010-of-00059.safetensors +3 -0
- model-00011-of-00059.safetensors +3 -0
- model-00012-of-00059.safetensors +3 -0
- model-00013-of-00059.safetensors +3 -0
- model-00014-of-00059.safetensors +3 -0
- model-00015-of-00059.safetensors +3 -0
- model-00016-of-00059.safetensors +3 -0
- model-00017-of-00059.safetensors +3 -0
- model-00018-of-00059.safetensors +3 -0
- model-00019-of-00059.safetensors +3 -0
- model-00020-of-00059.safetensors +3 -0
- model-00021-of-00059.safetensors +3 -0
- model-00022-of-00059.safetensors +3 -0
- model-00023-of-00059.safetensors +3 -0
- model-00024-of-00059.safetensors +3 -0
- model-00025-of-00059.safetensors +3 -0
- model-00026-of-00059.safetensors +3 -0
- model-00027-of-00059.safetensors +3 -0
- model-00028-of-00059.safetensors +3 -0
- model-00029-of-00059.safetensors +3 -0
- model-00030-of-00059.safetensors +3 -0
- model-00031-of-00059.safetensors +3 -0
- model-00032-of-00059.safetensors +3 -0
- model-00033-of-00059.safetensors +3 -0
- model-00034-of-00059.safetensors +3 -0
- model-00035-of-00059.safetensors +3 -0
- model-00036-of-00059.safetensors +3 -0
- model-00037-of-00059.safetensors +3 -0
- model-00038-of-00059.safetensors +3 -0
- model-00039-of-00059.safetensors +3 -0
- model-00040-of-00059.safetensors +3 -0
- model-00041-of-00059.safetensors +3 -0
- model-00042-of-00059.safetensors +3 -0
- model-00043-of-00059.safetensors +3 -0
- model-00044-of-00059.safetensors +3 -0
- model-00045-of-00059.safetensors +3 -0
- model-00046-of-00059.safetensors +3 -0
- model-00047-of-00059.safetensors +3 -0
- model-00048-of-00059.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,30 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"MixtralForCausalLM"
|
4 |
+
],
|
5 |
+
"attention_dropout": 0.0,
|
6 |
+
"bos_token_id": 1,
|
7 |
+
"eos_token_id": 2,
|
8 |
+
"hidden_act": "silu",
|
9 |
+
"hidden_size": 6144,
|
10 |
+
"initializer_range": 0.02,
|
11 |
+
"intermediate_size": 16384,
|
12 |
+
"max_position_embeddings": 65536,
|
13 |
+
"model_type": "mixtral",
|
14 |
+
"num_attention_heads": 48,
|
15 |
+
"num_experts_per_tok": 2,
|
16 |
+
"num_hidden_layers": 56,
|
17 |
+
"num_key_value_heads": 8,
|
18 |
+
"num_local_experts": 8,
|
19 |
+
"output_router_logits": false,
|
20 |
+
"rms_norm_eps": 1e-05,
|
21 |
+
"rope_theta": 1000000,
|
22 |
+
"router_aux_loss_coef": 0.001,
|
23 |
+
"router_jitter_noise": 0.0,
|
24 |
+
"sliding_window": null,
|
25 |
+
"tie_word_embeddings": false,
|
26 |
+
"torch_dtype": "bfloat16",
|
27 |
+
"transformers_version": "4.40.0.dev0",
|
28 |
+
"use_cache": true,
|
29 |
+
"vocab_size": 32000
|
30 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"transformers_version": "4.40.0.dev0"
|
6 |
+
}
|
model-00001-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:959215668dd6848473ea880a260766bd84d49f3091a1b5f41be1b3b2f7bf35c4
|
3 |
+
size 4998663696
|
model-00002-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:800f904fea1a126f9a032f0f5b24cc66233eef9b66e5896d0361e8871ca64981
|
3 |
+
size 4806799120
|
model-00003-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:69d479a3893bc011da056deb52e1b4f1f70b802a0538968cd63eedb55d067925
|
3 |
+
size 4806799120
|
model-00004-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74ea035e0138a2bfbabf942fbc843f1191037ed27e0062a6c0f02ff1c6102e3b
|
3 |
+
size 4806799120
|
model-00005-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56002e6eded8e1a494e07f833a16512a01f99f1da734e2dc13268d134ad4a383
|
3 |
+
size 4806799120
|
model-00006-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91178c8d09cd0dae938ce81fea1507a36cf2b28a2d0f995f765c246fca90825b
|
3 |
+
size 4806799120
|
model-00007-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bd272e4a82b0de29a563069b470912d860f5fdceed800889948155b8dada2c2f
|
3 |
+
size 4806799120
|
model-00008-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9248cd047634f2c5c540556d0d4b396a3e3f11988dac72c8e074ade51cbe22a9
|
3 |
+
size 4806799120
|
model-00009-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:19d8ac7544629355e147b17469214f18b79c3c43c70fb48563cc200aedd1e8cb
|
3 |
+
size 4806799120
|
model-00010-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cbc3658591e93d488518d8cc46c2ce09ed19e28950dc9a8918438a386a36f08a
|
3 |
+
size 4806799120
|
model-00011-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d12b9677f2ef087ad3c52c3a97c8ddb87673e9614486ac4f2077846436a40dc
|
3 |
+
size 4806799136
|
model-00012-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:504cbcc3c1b6918fe52713d764ec2e9cb70bc12436bd89466b987b0d05ddf1bd
|
3 |
+
size 4806799152
|
model-00013-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8c4e20accd34d8f8c51e6c8ae6fbc23cebbc7519c7c6242abe82be69d0b324ea
|
3 |
+
size 4806799152
|
model-00014-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4a06577994c4117e5398be33e53b0b8f25949bb5046432fbc30442fea9fded54
|
3 |
+
size 4806799152
|
model-00015-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c590ff45831d065390b8e5ba86cc9aec9bb6906677a79a3cf2fbde3760ab4c74
|
3 |
+
size 4806799152
|
model-00016-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66f3ca30927595ba1a53439a3258660548e7e01b60e2e6455439991344675059
|
3 |
+
size 4806799152
|
model-00017-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bb0a3a4d51305c48f3fcef1055be70ea752b01468c3f9da8ad71c3cba452c2b5
|
3 |
+
size 4806799152
|
model-00018-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d5fe7294be953c69007cb8c482c68a3e69e253dda478dbf04df7bd073a83fa43
|
3 |
+
size 4806799152
|
model-00019-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:664059b8a83121d16b19a9231fd81adbe5ef2f48bb5c6eaf8d4a40934269b524
|
3 |
+
size 4806799152
|
model-00020-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0821243522d3542a127f2cfe0ed17b778f4f17dd50202be53ef40d14fcdba648
|
3 |
+
size 4806799152
|
model-00021-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:68f1e1e1895674a6810adb48931d3a9711e10fac510859851e7bda8ee9a18000
|
3 |
+
size 4806799152
|
model-00022-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77d1c0bc279b7f4bf89c5a2929bc2f194dfc90a7ca962ec4bfb4e18085482eaf
|
3 |
+
size 4806799152
|
model-00023-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:120b4205c1823e72d11f7772cdc6a37414f447da13f641c91b3d40d17e5eb4eb
|
3 |
+
size 4806799152
|
model-00024-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:16c61d525809d1320387c5592ab98f05cc2ab3d1187d66e546cb9e1188b812aa
|
3 |
+
size 4932529864
|
model-00025-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f761c6570988d5b6bdf7f511fbc9c994ef9d3faa6408fd6f562c1a729429dba
|
3 |
+
size 4995542848
|
model-00026-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:879fe13767d964005b9fa8bfa1b5ba0899ec6529dd44a4e41c8a47dfbdb47967
|
3 |
+
size 4995542848
|
model-00027-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee959271ba7d2323ae1081f3e51440cd48fbffd6473c643ff27c54a1ac6c02d4
|
3 |
+
size 4932628288
|
model-00028-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4fa0860fea0341ee0044a1b23fc4872c16b0d7cbc3b086a3796b26c27160007d
|
3 |
+
size 4806774344
|
model-00029-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cef3e592eda756117188740eae81d27028dccee47d0777b0ea7911d68da4a971
|
3 |
+
size 4806799144
|
model-00030-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6ac4814702cf7083f1082dec351cea3137a136f8d6f2844f2364f2db576c2667
|
3 |
+
size 4806799144
|
model-00031-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66eacaddda00ed6286e91930ab2a07f4a90997335dd4b8ce618dd5354b082f74
|
3 |
+
size 4806799144
|
model-00032-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d55dbbf151e5a8da0c178fbafcd204a758b56eb62428433a6d1de0bcfa306fbe
|
3 |
+
size 4806799144
|
model-00033-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9861a4561cb309a6c41559b966d57581ce4502c1c69dadf8767419c10d311c16
|
3 |
+
size 4806799152
|
model-00034-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0db8de1ab89311fad868185498e7733e873e9cdcc7f7204e8dc2af38d5f8256b
|
3 |
+
size 4806799152
|
model-00035-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b7f097c59c32acfa28f31cfa9fd357563b35c48d3c9a2773948e374beef2b62f
|
3 |
+
size 4806799152
|
model-00036-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b14337938ed54763155528e16bb66a4436967e68a630683db1a890264fd4e5a
|
3 |
+
size 4806799152
|
model-00037-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:56adc089068f1b680d18ab038b2a92db63bb2d6155688e670ad46de66441b65c
|
3 |
+
size 4806799152
|
model-00038-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:545a85e71d61ddf175f50324ff655485a59dd640dafaff5a9b7b77d7bf812113
|
3 |
+
size 4806799152
|
model-00039-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:484e246d71f782b9f2f71f0a9d2ae18d6780f74a8fc657dd28c65bba614987fa
|
3 |
+
size 4806799152
|
model-00040-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9ed8c78a8e1f2cc786ceb6e06b2a362cbea71a738b4e2211a4ce6af5b9afec74
|
3 |
+
size 4806799152
|
model-00041-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:567e34b5f751e9c6d0d6c83887b85d7700f860c70df88f204cc0a7df9d9017fb
|
3 |
+
size 4806799152
|
model-00042-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1b3b34903f58d50d83fb28c0906ebdb567525020b79162d8ef70392e8231eef
|
3 |
+
size 4806799152
|
model-00043-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9331cbc59ddf8277728e5fd955f0a99eb88b6a0d3d876f415abcfd3197d36543
|
3 |
+
size 4806799152
|
model-00044-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ca409e96ac060028d1ebcf604663f2913f0ea9965bbe3d0e92d3e1772c666186
|
3 |
+
size 4806799152
|
model-00045-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0674c49ba7d91f376d0c639d0f27db271f8462d669170e33e4029cc256040926
|
3 |
+
size 4806799152
|
model-00046-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b291db3505669ebb9ff38aab8fb1b8b2ec39a7841557fdbccfe045b737568ee6
|
3 |
+
size 4806799152
|
model-00047-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bb412d255b48bdb6ff41962426e30519e56313f99c7b784091f0d4ec0c46063
|
3 |
+
size 4806799152
|
model-00048-of-00059.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:471c7534a519ae1c525b2109b0a86aee581a46ef1f65e079ed9a3fd3869e957e
|
3 |
+
size 4806799152
|