Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- config.json +38 -0
- generation_config.json +6 -0
- model-00001-of-00189.safetensors +3 -0
- model-00002-of-00189.safetensors +3 -0
- model-00003-of-00189.safetensors +3 -0
- model-00004-of-00189.safetensors +3 -0
- model-00005-of-00189.safetensors +3 -0
- model-00006-of-00189.safetensors +3 -0
- model-00007-of-00189.safetensors +3 -0
- model-00008-of-00189.safetensors +3 -0
- model-00009-of-00189.safetensors +3 -0
- model-00010-of-00189.safetensors +3 -0
- model-00011-of-00189.safetensors +3 -0
- model-00012-of-00189.safetensors +3 -0
- model-00013-of-00189.safetensors +3 -0
- model-00014-of-00189.safetensors +3 -0
- model-00015-of-00189.safetensors +3 -0
- model-00016-of-00189.safetensors +3 -0
- model-00017-of-00189.safetensors +3 -0
- model-00018-of-00189.safetensors +3 -0
- model-00019-of-00189.safetensors +3 -0
- model-00020-of-00189.safetensors +3 -0
- model-00021-of-00189.safetensors +3 -0
- model-00022-of-00189.safetensors +3 -0
- model-00023-of-00189.safetensors +3 -0
- model-00024-of-00189.safetensors +3 -0
- model-00025-of-00189.safetensors +3 -0
- model-00026-of-00189.safetensors +3 -0
- model-00027-of-00189.safetensors +3 -0
- model-00028-of-00189.safetensors +3 -0
- model-00029-of-00189.safetensors +3 -0
- model-00030-of-00189.safetensors +3 -0
- model-00031-of-00189.safetensors +3 -0
- model-00032-of-00189.safetensors +3 -0
- model-00033-of-00189.safetensors +3 -0
- model-00034-of-00189.safetensors +3 -0
- model-00035-of-00189.safetensors +3 -0
- model-00036-of-00189.safetensors +3 -0
- model-00037-of-00189.safetensors +3 -0
- model-00038-of-00189.safetensors +3 -0
- model-00039-of-00189.safetensors +3 -0
- model-00040-of-00189.safetensors +3 -0
- model-00041-of-00189.safetensors +3 -0
- model-00042-of-00189.safetensors +3 -0
- model-00043-of-00189.safetensors +3 -0
- model-00044-of-00189.safetensors +3 -0
- model-00045-of-00189.safetensors +3 -0
- model-00046-of-00189.safetensors +3 -0
- model-00047-of-00189.safetensors +3 -0
- model-00048-of-00189.safetensors +3 -0
config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "Nemotron-4-340B-Instruct-hf",
|
3 |
+
"architectures": [
|
4 |
+
"NemotronForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 2,
|
9 |
+
"eos_token_id": 3,
|
10 |
+
"head_dim": 192,
|
11 |
+
"hidden_act": "relu2",
|
12 |
+
"hidden_size": 18432,
|
13 |
+
"initializer_range": 0.0063,
|
14 |
+
"intermediate_size": 73728,
|
15 |
+
"max_position_embeddings": 4096,
|
16 |
+
"mlp_bias": false,
|
17 |
+
"model_type": "nemotron",
|
18 |
+
"norm_eps": 1e-05,
|
19 |
+
"num_attention_heads": 96,
|
20 |
+
"num_hidden_layers": 96,
|
21 |
+
"num_key_value_heads": 8,
|
22 |
+
"quantization_config": {
|
23 |
+
"activation_scheme": "dynamic",
|
24 |
+
"ignored_layers": [
|
25 |
+
"lm_head"
|
26 |
+
],
|
27 |
+
"quant_method": "fp8"
|
28 |
+
},
|
29 |
+
"rope_percent": 0.5,
|
30 |
+
"rope_percentage": 0.5,
|
31 |
+
"rope_scaling": null,
|
32 |
+
"rope_theta": 10000,
|
33 |
+
"tie_word_embeddings": false,
|
34 |
+
"torch_dtype": "bfloat16",
|
35 |
+
"transformers_version": "4.43.0.dev0",
|
36 |
+
"use_cache": true,
|
37 |
+
"vocab_size": 256000
|
38 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,6 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 2,
|
4 |
+
"eos_token_id": 3,
|
5 |
+
"transformers_version": "4.43.0.dev0"
|
6 |
+
}
|
model-00001-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3acc010dae170bb2e747754807e46f8210bbcb8020b6d4f7c60d953ea147c0d5
|
3 |
+
size 9437184112
|
model-00002-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1241cb0e1c6bef6670a378c7c969b051aed5cff6d09ae884ee97e98a14a383f9
|
3 |
+
size 2095055948
|
model-00003-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9e2b4bc51db835ef4dec7496bcb396b1edc6b10f34edc27d88fa69c691a52052
|
3 |
+
size 2095203836
|
model-00004-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:81d1c3f14142563bb4a866b916aec8bcdfaf9124daf4a39ae01e87c57b64eda1
|
3 |
+
size 1358954708
|
model-00005-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:705f8828b4f753269814308145de39324aaf019e4e964d3252b14a53f57d81f2
|
3 |
+
size 2095203836
|
model-00006-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30bff5938b807eea5d757ba42bcae23bdd851309fa0a63c28798cfc4795ec59c
|
3 |
+
size 1358954708
|
model-00007-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ba4d876816ab715e82b3cbd590bca26607cc80435be87aa1b34e8b4879a8c71a
|
3 |
+
size 2095203836
|
model-00008-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:956379d7ebf47042d0515343dd07abc961761974a26b293155c1353ad4dc79f3
|
3 |
+
size 1358954708
|
model-00009-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:35a904ddb2bd0608faf308ae114d19ba866d2ee230ddfbf7361a6ab32a21f155
|
3 |
+
size 2095203836
|
model-00010-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3fd71156f376b05d311369b0448d8ac92374256a3f58f96e39297e5e6cd5a66d
|
3 |
+
size 1358954708
|
model-00011-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f9d995d696ff479079e4eb2cbfda822620b6565ad393382e920876ec816a7f7b
|
3 |
+
size 2095203836
|
model-00012-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:295995dfdefb76f9915731fbaf0779b7acaa2540fa1c3b52b14f66d78b1f3d45
|
3 |
+
size 1358954708
|
model-00013-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:053ad3dfc43503e4b44631eb51d837b3f08c01dbdb44bbb1516e69017967fc83
|
3 |
+
size 2095203836
|
model-00014-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9fb57eba81ee64c8c6e661e3113a63470c0c9a87e2049d1efa18f44ffdfe1953
|
3 |
+
size 1358954708
|
model-00015-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4d3fa0722515d8dbab46f7787f69d4dab4528f3b85512389e52d06ef9d8f23af
|
3 |
+
size 2095203836
|
model-00016-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:32d4703552bafa6af8abfde29ebca5c9188c76aea6a01c538ad56c41698151c2
|
3 |
+
size 1358954708
|
model-00017-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2f42520344ddf8d3623ff183db863903c1887fa4043b8abd8d2969223182a67
|
3 |
+
size 2095203836
|
model-00018-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4e60bb195f7a89f3ce350f3dd3eaaab44dfc2ce3eda8a6842428b6834b8f222
|
3 |
+
size 1358954708
|
model-00019-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d78907097c3dd061e20bdd069c380f2b8c936c72a32bbc8573c25445866d783a
|
3 |
+
size 2095203836
|
model-00020-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:30564d2900e111d7a12c4413548c3f4e4dbe701e7ad156b257ce691ef4e4bbe2
|
3 |
+
size 1358954708
|
model-00021-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53eb12fde483fd0cc9ce9a010e74d443bd3f007eb556adbbc6a228a217b29216
|
3 |
+
size 2095203836
|
model-00022-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf3d8e9f1308ec0e7ae25e7e0bc8c8b58ad895d830d9eb3c2ffba0608ff06a5b
|
3 |
+
size 1358954716
|
model-00023-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7e124bc9daafbe95d926b6f1aee1d1707bec80f4bf34ad930ef2faaa4484f6ce
|
3 |
+
size 2095203852
|
model-00024-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:177ca5c3def9898b2e848e096d8e835a646194ac70059f99d5378e9abccc98fb
|
3 |
+
size 1358954716
|
model-00025-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c8425b9192b8d81a7768ca39036b945d82120df5dbb32171b5e229e26390775e
|
3 |
+
size 2095203852
|
model-00026-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fad56578b0306c3bf9685f276692c1da378880af876b4c6d8b4f91277abcb561
|
3 |
+
size 1358954716
|
model-00027-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:601fa83dc9bea36ab1bbd3fded2092737f12eb5820cb6c1812fc4772b5e191a0
|
3 |
+
size 2095203852
|
model-00028-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4afeacd8653af6e30f1bcca18bce2488451e7678efb8595c6e9d7f399fbebcc
|
3 |
+
size 1358954716
|
model-00029-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:974b92a564f3044c31d221f964069f7afa39eb4795db70f01c441ad4f0e4bc62
|
3 |
+
size 2095203852
|
model-00030-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:df044bb15845c94511169782387829e0f86ec76faa624e8cc730f2ad958ecb4c
|
3 |
+
size 1358954716
|
model-00031-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01b5321072213be3510952662088fe206a56aaf13020076b6b37b0fb5f9f1370
|
3 |
+
size 2095203852
|
model-00032-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:65ecd6b00a57a54f9b9f856311f9637d99663000014302f54c36297fa8edda1b
|
3 |
+
size 1358954716
|
model-00033-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45454e5dc4f630f0ad3bdd55e65570c91c6665211b3b095be94a8550b43ab33e
|
3 |
+
size 2095203852
|
model-00034-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e32f6c316129612855ccfc9ea8a2635fc30545cfb9f22fb2f178e01537846f7e
|
3 |
+
size 1358954716
|
model-00035-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0da9a282090aaf8dd5e02468b89b71f8ed16c8b830d42a941e30470976b07c1
|
3 |
+
size 2095203852
|
model-00036-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a76de48532a89f6f0986a2827c3f0a79ec51a24c7a7088885d742d4a543cc8e
|
3 |
+
size 1358954716
|
model-00037-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e32eee7f6f95cc5a5ee279433659ad6b1463d488f1fefa2cc4c7fe677884a490
|
3 |
+
size 2095203852
|
model-00038-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f6f1918e4ff4095d942458288e2f4a1f9fa51a09321bba7fe043d53744c4886
|
3 |
+
size 1358954716
|
model-00039-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bbba97b91379b6d4c51e4bb0636231dc0735848b41fb2b376e8c23df1baaac4a
|
3 |
+
size 2095203852
|
model-00040-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f92c091572ff317063ec352b0190ae9c654e67bccac623d4298980c02ff15f1
|
3 |
+
size 1358954716
|
model-00041-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b760acd1baa08564d006fbd5506e3c327ba0808a48c85cf532064f868a32bbfe
|
3 |
+
size 2095203852
|
model-00042-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ded4f3360b3c85a14c7e3a55b60e2c4ec8ae9fc7c7f9030c36436348d13423c9
|
3 |
+
size 1358954716
|
model-00043-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f3f1a4d732e41751b65dc0566abb5daf04d2746204511d76e262d47f3076447
|
3 |
+
size 2095203852
|
model-00044-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:74a4a2b4096e276890ff25b779b653535ce4cb3c5dbeb39f6b7be408d997900f
|
3 |
+
size 1358954716
|
model-00045-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b2c0c82b56ac317fdfc36ceff7257a731732326e7700d8a38329f520ac09c403
|
3 |
+
size 2095203852
|
model-00046-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:82e62e7a891fe44ae1d5a237b0f0285ea60a5ee1bb117bb83cf10e92322dd021
|
3 |
+
size 1358954716
|
model-00047-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8eca8f41a8eebc4a8e08ab59041c2942895ccdea4d7f8dcb003e1f878ad699fd
|
3 |
+
size 2095203852
|
model-00048-of-00189.safetensors
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2d1cfbad5360619e143ef08010e81496c71f49432f78928da1c86c0b0c1a7285
|
3 |
+
size 1358954716
|