mgoin committed on
Commit
5c7b184
1 Parent(s): dd1ec1f

Upload folder using huggingface_hub

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. config.json +38 -0
  2. generation_config.json +6 -0
  3. model-00001-of-00189.safetensors +3 -0
  4. model-00002-of-00189.safetensors +3 -0
  5. model-00003-of-00189.safetensors +3 -0
  6. model-00004-of-00189.safetensors +3 -0
  7. model-00005-of-00189.safetensors +3 -0
  8. model-00006-of-00189.safetensors +3 -0
  9. model-00007-of-00189.safetensors +3 -0
  10. model-00008-of-00189.safetensors +3 -0
  11. model-00009-of-00189.safetensors +3 -0
  12. model-00010-of-00189.safetensors +3 -0
  13. model-00011-of-00189.safetensors +3 -0
  14. model-00012-of-00189.safetensors +3 -0
  15. model-00013-of-00189.safetensors +3 -0
  16. model-00014-of-00189.safetensors +3 -0
  17. model-00015-of-00189.safetensors +3 -0
  18. model-00016-of-00189.safetensors +3 -0
  19. model-00017-of-00189.safetensors +3 -0
  20. model-00018-of-00189.safetensors +3 -0
  21. model-00019-of-00189.safetensors +3 -0
  22. model-00020-of-00189.safetensors +3 -0
  23. model-00021-of-00189.safetensors +3 -0
  24. model-00022-of-00189.safetensors +3 -0
  25. model-00023-of-00189.safetensors +3 -0
  26. model-00024-of-00189.safetensors +3 -0
  27. model-00025-of-00189.safetensors +3 -0
  28. model-00026-of-00189.safetensors +3 -0
  29. model-00027-of-00189.safetensors +3 -0
  30. model-00028-of-00189.safetensors +3 -0
  31. model-00029-of-00189.safetensors +3 -0
  32. model-00030-of-00189.safetensors +3 -0
  33. model-00031-of-00189.safetensors +3 -0
  34. model-00032-of-00189.safetensors +3 -0
  35. model-00033-of-00189.safetensors +3 -0
  36. model-00034-of-00189.safetensors +3 -0
  37. model-00035-of-00189.safetensors +3 -0
  38. model-00036-of-00189.safetensors +3 -0
  39. model-00037-of-00189.safetensors +3 -0
  40. model-00038-of-00189.safetensors +3 -0
  41. model-00039-of-00189.safetensors +3 -0
  42. model-00040-of-00189.safetensors +3 -0
  43. model-00041-of-00189.safetensors +3 -0
  44. model-00042-of-00189.safetensors +3 -0
  45. model-00043-of-00189.safetensors +3 -0
  46. model-00044-of-00189.safetensors +3 -0
  47. model-00045-of-00189.safetensors +3 -0
  48. model-00046-of-00189.safetensors +3 -0
  49. model-00047-of-00189.safetensors +3 -0
  50. model-00048-of-00189.safetensors +3 -0
config.json ADDED
@@ -0,0 +1,38 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "_name_or_path": "Nemotron-4-340B-Instruct-hf",
3
+ "architectures": [
4
+ "NemotronForCausalLM"
5
+ ],
6
+ "attention_bias": false,
7
+ "attention_dropout": 0.0,
8
+ "bos_token_id": 2,
9
+ "eos_token_id": 3,
10
+ "head_dim": 192,
11
+ "hidden_act": "relu2",
12
+ "hidden_size": 18432,
13
+ "initializer_range": 0.0063,
14
+ "intermediate_size": 73728,
15
+ "max_position_embeddings": 4096,
16
+ "mlp_bias": false,
17
+ "model_type": "nemotron",
18
+ "norm_eps": 1e-05,
19
+ "num_attention_heads": 96,
20
+ "num_hidden_layers": 96,
21
+ "num_key_value_heads": 8,
22
+ "quantization_config": {
23
+ "activation_scheme": "dynamic",
24
+ "ignored_layers": [
25
+ "lm_head"
26
+ ],
27
+ "quant_method": "fp8"
28
+ },
29
+ "rope_percent": 0.5,
30
+ "rope_percentage": 0.5,
31
+ "rope_scaling": null,
32
+ "rope_theta": 10000,
33
+ "tie_word_embeddings": false,
34
+ "torch_dtype": "bfloat16",
35
+ "transformers_version": "4.43.0.dev0",
36
+ "use_cache": true,
37
+ "vocab_size": 256000
38
+ }
generation_config.json ADDED
@@ -0,0 +1,6 @@
 
 
 
 
 
 
 
1
+ {
2
+ "_from_model_config": true,
3
+ "bos_token_id": 2,
4
+ "eos_token_id": 3,
5
+ "transformers_version": "4.43.0.dev0"
6
+ }
model-00001-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3acc010dae170bb2e747754807e46f8210bbcb8020b6d4f7c60d953ea147c0d5
3
+ size 9437184112
model-00002-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1241cb0e1c6bef6670a378c7c969b051aed5cff6d09ae884ee97e98a14a383f9
3
+ size 2095055948
model-00003-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9e2b4bc51db835ef4dec7496bcb396b1edc6b10f34edc27d88fa69c691a52052
3
+ size 2095203836
model-00004-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:81d1c3f14142563bb4a866b916aec8bcdfaf9124daf4a39ae01e87c57b64eda1
3
+ size 1358954708
model-00005-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:705f8828b4f753269814308145de39324aaf019e4e964d3252b14a53f57d81f2
3
+ size 2095203836
model-00006-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30bff5938b807eea5d757ba42bcae23bdd851309fa0a63c28798cfc4795ec59c
3
+ size 1358954708
model-00007-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ba4d876816ab715e82b3cbd590bca26607cc80435be87aa1b34e8b4879a8c71a
3
+ size 2095203836
model-00008-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:956379d7ebf47042d0515343dd07abc961761974a26b293155c1353ad4dc79f3
3
+ size 1358954708
model-00009-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:35a904ddb2bd0608faf308ae114d19ba866d2ee230ddfbf7361a6ab32a21f155
3
+ size 2095203836
model-00010-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fd71156f376b05d311369b0448d8ac92374256a3f58f96e39297e5e6cd5a66d
3
+ size 1358954708
model-00011-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f9d995d696ff479079e4eb2cbfda822620b6565ad393382e920876ec816a7f7b
3
+ size 2095203836
model-00012-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:295995dfdefb76f9915731fbaf0779b7acaa2540fa1c3b52b14f66d78b1f3d45
3
+ size 1358954708
model-00013-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:053ad3dfc43503e4b44631eb51d837b3f08c01dbdb44bbb1516e69017967fc83
3
+ size 2095203836
model-00014-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9fb57eba81ee64c8c6e661e3113a63470c0c9a87e2049d1efa18f44ffdfe1953
3
+ size 1358954708
model-00015-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d3fa0722515d8dbab46f7787f69d4dab4528f3b85512389e52d06ef9d8f23af
3
+ size 2095203836
model-00016-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32d4703552bafa6af8abfde29ebca5c9188c76aea6a01c538ad56c41698151c2
3
+ size 1358954708
model-00017-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c2f42520344ddf8d3623ff183db863903c1887fa4043b8abd8d2969223182a67
3
+ size 2095203836
model-00018-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4e60bb195f7a89f3ce350f3dd3eaaab44dfc2ce3eda8a6842428b6834b8f222
3
+ size 1358954708
model-00019-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d78907097c3dd061e20bdd069c380f2b8c936c72a32bbc8573c25445866d783a
3
+ size 2095203836
model-00020-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:30564d2900e111d7a12c4413548c3f4e4dbe701e7ad156b257ce691ef4e4bbe2
3
+ size 1358954708
model-00021-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53eb12fde483fd0cc9ce9a010e74d443bd3f007eb556adbbc6a228a217b29216
3
+ size 2095203836
model-00022-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf3d8e9f1308ec0e7ae25e7e0bc8c8b58ad895d830d9eb3c2ffba0608ff06a5b
3
+ size 1358954716
model-00023-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e124bc9daafbe95d926b6f1aee1d1707bec80f4bf34ad930ef2faaa4484f6ce
3
+ size 2095203852
model-00024-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:177ca5c3def9898b2e848e096d8e835a646194ac70059f99d5378e9abccc98fb
3
+ size 1358954716
model-00025-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8425b9192b8d81a7768ca39036b945d82120df5dbb32171b5e229e26390775e
3
+ size 2095203852
model-00026-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fad56578b0306c3bf9685f276692c1da378880af876b4c6d8b4f91277abcb561
3
+ size 1358954716
model-00027-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:601fa83dc9bea36ab1bbd3fded2092737f12eb5820cb6c1812fc4772b5e191a0
3
+ size 2095203852
model-00028-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c4afeacd8653af6e30f1bcca18bce2488451e7678efb8595c6e9d7f399fbebcc
3
+ size 1358954716
model-00029-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:974b92a564f3044c31d221f964069f7afa39eb4795db70f01c441ad4f0e4bc62
3
+ size 2095203852
model-00030-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df044bb15845c94511169782387829e0f86ec76faa624e8cc730f2ad958ecb4c
3
+ size 1358954716
model-00031-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01b5321072213be3510952662088fe206a56aaf13020076b6b37b0fb5f9f1370
3
+ size 2095203852
model-00032-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65ecd6b00a57a54f9b9f856311f9637d99663000014302f54c36297fa8edda1b
3
+ size 1358954716
model-00033-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45454e5dc4f630f0ad3bdd55e65570c91c6665211b3b095be94a8550b43ab33e
3
+ size 2095203852
model-00034-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e32f6c316129612855ccfc9ea8a2635fc30545cfb9f22fb2f178e01537846f7e
3
+ size 1358954716
model-00035-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f0da9a282090aaf8dd5e02468b89b71f8ed16c8b830d42a941e30470976b07c1
3
+ size 2095203852
model-00036-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0a76de48532a89f6f0986a2827c3f0a79ec51a24c7a7088885d742d4a543cc8e
3
+ size 1358954716
model-00037-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e32eee7f6f95cc5a5ee279433659ad6b1463d488f1fefa2cc4c7fe677884a490
3
+ size 2095203852
model-00038-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8f6f1918e4ff4095d942458288e2f4a1f9fa51a09321bba7fe043d53744c4886
3
+ size 1358954716
model-00039-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bbba97b91379b6d4c51e4bb0636231dc0735848b41fb2b376e8c23df1baaac4a
3
+ size 2095203852
model-00040-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f92c091572ff317063ec352b0190ae9c654e67bccac623d4298980c02ff15f1
3
+ size 1358954716
model-00041-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b760acd1baa08564d006fbd5506e3c327ba0808a48c85cf532064f868a32bbfe
3
+ size 2095203852
model-00042-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ded4f3360b3c85a14c7e3a55b60e2c4ec8ae9fc7c7f9030c36436348d13423c9
3
+ size 1358954716
model-00043-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f3f1a4d732e41751b65dc0566abb5daf04d2746204511d76e262d47f3076447
3
+ size 2095203852
model-00044-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74a4a2b4096e276890ff25b779b653535ce4cb3c5dbeb39f6b7be408d997900f
3
+ size 1358954716
model-00045-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b2c0c82b56ac317fdfc36ceff7257a731732326e7700d8a38329f520ac09c403
3
+ size 2095203852
model-00046-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:82e62e7a891fe44ae1d5a237b0f0285ea60a5ee1bb117bb83cf10e92322dd021
3
+ size 1358954716
model-00047-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8eca8f41a8eebc4a8e08ab59041c2942895ccdea4d7f8dcb003e1f878ad699fd
3
+ size 2095203852
model-00048-of-00189.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2d1cfbad5360619e143ef08010e81496c71f49432f78928da1c86c0b0c1a7285
3
+ size 1358954716