Upload folder using huggingface_hub
Browse files
- .gitattributes +10 -0
- compiled/02303aa7a8919611746e.neff +3 -0
- compiled/62ccc72e2188dd36c0ac.neff +3 -0
- compiled/7a59f63dad73b3a6850d.neff +3 -0
- compiled/a020eebfabaf2eb952de.neff +3 -0
- compiled/a74eace73605307c877e.neff +3 -0
- compiled/af5adbbdb5a3e1743a9a.neff +3 -0
- compiled/b395f57f89b246c69e20.neff +3 -0
- compiled/b6ef21232aa80f4998ee.neff +3 -0
- compiled/cbb482ade0566ea4d9b8.neff +3 -0
- compiled/d601d278537d61e59c36.neff +3 -0
- config.json +40 -0
- generation_config.json +7 -0
.gitattributes
CHANGED
@@ -33,3 +33,13 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
compiled/02303aa7a8919611746e.neff filter=lfs diff=lfs merge=lfs -text
|
37 |
+
compiled/62ccc72e2188dd36c0ac.neff filter=lfs diff=lfs merge=lfs -text
|
38 |
+
compiled/7a59f63dad73b3a6850d.neff filter=lfs diff=lfs merge=lfs -text
|
39 |
+
compiled/a020eebfabaf2eb952de.neff filter=lfs diff=lfs merge=lfs -text
|
40 |
+
compiled/a74eace73605307c877e.neff filter=lfs diff=lfs merge=lfs -text
|
41 |
+
compiled/af5adbbdb5a3e1743a9a.neff filter=lfs diff=lfs merge=lfs -text
|
42 |
+
compiled/b395f57f89b246c69e20.neff filter=lfs diff=lfs merge=lfs -text
|
43 |
+
compiled/b6ef21232aa80f4998ee.neff filter=lfs diff=lfs merge=lfs -text
|
44 |
+
compiled/cbb482ade0566ea4d9b8.neff filter=lfs diff=lfs merge=lfs -text
|
45 |
+
compiled/d601d278537d61e59c36.neff filter=lfs diff=lfs merge=lfs -text
|
compiled/02303aa7a8919611746e.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4df2eb617ca2d4c699699b0302294b40f0a363eb9007220e3da9da7994cdc893
|
3 |
+
size 2520064
|
compiled/62ccc72e2188dd36c0ac.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9576a88d78f32adf27e08ebfd574a54ce5a6d56fb8715125dac9d051e0ae4183
|
3 |
+
size 2110464
|
compiled/7a59f63dad73b3a6850d.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:77da165344c2d4eef40b91604617bfaebaafb01d422368da98eebe63f25c7f83
|
3 |
+
size 2038784
|
compiled/a020eebfabaf2eb952de.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:90b24840fef4b9c24dfd7739daeb7afc8eb5665ab092f414785c595d3b662d41
|
3 |
+
size 1987584
|
compiled/a74eace73605307c877e.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f35a001742a46e8718fc626902bdfb3210233daee5ea23ad1e2807af88708a8b
|
3 |
+
size 2008064
|
compiled/af5adbbdb5a3e1743a9a.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b6ee80486e654f61907d6f770639ffbcfebe78077cfdad335f2816aa7e407c0
|
3 |
+
size 2284544
|
compiled/b395f57f89b246c69e20.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb094aeb99ecfa066ed683684ebb88853d8f87eb29ebf5528f5d4d9834f12b1e
|
3 |
+
size 2223104
|
compiled/b6ef21232aa80f4998ee.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d8f320779523e8ea55504aa9c160da8d400de3c22021bd3dd60de46ebcb90db4
|
3 |
+
size 2857984
|
compiled/cbb482ade0566ea4d9b8.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:101abf993b2656cb6b45baa5b40d9f41b8f6406feb3c923f73f44a470393dbb0
|
3 |
+
size 2345984
|
compiled/d601d278537d61e59c36.neff
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8a13bee97bd0ad42d74cb1df4c03cb682e4b0454bacab61438e95ef1bc0a52f1
|
3 |
+
size 6349824
|
config.json
ADDED
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "elyza/ELYZA-japanese-Llama-2-13b-instruct",
|
3 |
+
"architectures": [
|
4 |
+
"LlamaForCausalLM"
|
5 |
+
],
|
6 |
+
"attention_bias": false,
|
7 |
+
"attention_dropout": 0.0,
|
8 |
+
"bos_token_id": 1,
|
9 |
+
"eos_token_id": 2,
|
10 |
+
"hidden_act": "silu",
|
11 |
+
"hidden_size": 5120,
|
12 |
+
"initializer_range": 0.02,
|
13 |
+
"intermediate_size": 13824,
|
14 |
+
"max_position_embeddings": 4096,
|
15 |
+
"model_type": "llama",
|
16 |
+
"neuron": {
|
17 |
+
"auto_cast_type": "bf16",
|
18 |
+
"batch_size": 1,
|
19 |
+
"checkpoint_id": "elyza/ELYZA-japanese-Llama-2-13b-instruct",
|
20 |
+
"checkpoint_revision": "ed15089024f3ecad9a8c4ce1db302cc01aa9f4ee",
|
21 |
+
"compiler_type": "neuronx-cc",
|
22 |
+
"compiler_version": "2.12.68.0+4480452af",
|
23 |
+
"num_cores": 24,
|
24 |
+
"sequence_length": 2048,
|
25 |
+
"task": "text-generation"
|
26 |
+
},
|
27 |
+
"num_attention_heads": 40,
|
28 |
+
"num_hidden_layers": 40,
|
29 |
+
"num_key_value_heads": 40,
|
30 |
+
"pad_token_id": 2,
|
31 |
+
"pretraining_tp": 1,
|
32 |
+
"rms_norm_eps": 1e-05,
|
33 |
+
"rope_scaling": null,
|
34 |
+
"rope_theta": 10000.0,
|
35 |
+
"tie_word_embeddings": false,
|
36 |
+
"torch_dtype": "bfloat16",
|
37 |
+
"transformers_version": "4.36.2",
|
38 |
+
"use_cache": true,
|
39 |
+
"vocab_size": 32000
|
40 |
+
}
|
generation_config.json
ADDED
@@ -0,0 +1,7 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_from_model_config": true,
|
3 |
+
"bos_token_id": 1,
|
4 |
+
"eos_token_id": 2,
|
5 |
+
"pad_token_id": 2,
|
6 |
+
"transformers_version": "4.36.2"
|
7 |
+
}
|