Upload Qwen3ForCausalLM
Browse files
- config.json +14 -7
- generation_config.json +1 -1
- pytorch_model-00001-of-00007.bin +2 -2
- pytorch_model-00002-of-00007.bin +2 -2
- pytorch_model-00003-of-00007.bin +2 -2
- pytorch_model-00004-of-00007.bin +2 -2
- pytorch_model-00005-of-00007.bin +2 -2
- pytorch_model-00006-of-00007.bin +2 -2
- pytorch_model-00007-of-00007.bin +2 -2
config.json
CHANGED
@@ -18,7 +18,7 @@
|
|
18 |
"num_hidden_layers": 64,
|
19 |
"num_key_value_heads": 8,
|
20 |
"quantization_config": {
|
21 |
-
"
|
22 |
"modules_to_not_convert": null,
|
23 |
"quant_method": "torchao",
|
24 |
"quant_type": {
|
@@ -28,11 +28,18 @@
|
|
28 |
"_data": "float8_e4m3fn",
|
29 |
"_type": "torch.dtype"
|
30 |
},
|
31 |
-
"granularity":
|
32 |
-
|
33 |
-
|
34 |
-
|
35 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
36 |
"mm_config": {
|
37 |
"_data": {
|
38 |
"emulate": false,
|
@@ -61,7 +68,7 @@
|
|
61 |
"sliding_window": null,
|
62 |
"tie_word_embeddings": false,
|
63 |
"torch_dtype": "bfloat16",
|
64 |
-
"transformers_version": "4.52.
|
65 |
"use_cache": true,
|
66 |
"use_sliding_window": false,
|
67 |
"vocab_size": 151936
|
|
|
18 |
"num_hidden_layers": 64,
|
19 |
"num_key_value_heads": 8,
|
20 |
"quantization_config": {
|
21 |
+
"include_input_output_embeddings": false,
|
22 |
"modules_to_not_convert": null,
|
23 |
"quant_method": "torchao",
|
24 |
"quant_type": {
|
|
|
28 |
"_data": "float8_e4m3fn",
|
29 |
"_type": "torch.dtype"
|
30 |
},
|
31 |
+
"granularity": [
|
32 |
+
{
|
33 |
+
"_data": {},
|
34 |
+
"_type": "PerRow",
|
35 |
+
"_version": 1
|
36 |
+
},
|
37 |
+
{
|
38 |
+
"_data": {},
|
39 |
+
"_type": "PerRow",
|
40 |
+
"_version": 1
|
41 |
+
}
|
42 |
+
],
|
43 |
"mm_config": {
|
44 |
"_data": {
|
45 |
"emulate": false,
|
|
|
68 |
"sliding_window": null,
|
69 |
"tie_word_embeddings": false,
|
70 |
"torch_dtype": "bfloat16",
|
71 |
+
"transformers_version": "4.52.3",
|
72 |
"use_cache": true,
|
73 |
"use_sliding_window": false,
|
74 |
"vocab_size": 151936
|
generation_config.json
CHANGED
@@ -9,5 +9,5 @@
|
|
9 |
"temperature": 0.6,
|
10 |
"top_k": 20,
|
11 |
"top_p": 0.95,
|
12 |
-
"transformers_version": "4.52.
|
13 |
}
|
|
|
9 |
"temperature": 0.6,
|
10 |
"top_k": 20,
|
11 |
"top_p": 0.95,
|
12 |
+
"transformers_version": "4.52.3"
|
13 |
}
|
pytorch_model-00001-of-00007.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eed0a42c41196d852a0ad630145156d1f25ebbd5503f308233b211b81604c03e
|
3 |
+
size 4971155870
|
pytorch_model-00002-of-00007.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3e647e9ddf448a623b78897e10808f3a1c971453ab1a719eae153fb628e5e51c
|
3 |
+
size 4973482027
|
pytorch_model-00003-of-00007.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:787b871f002495b07948640c6c2268c57dda22c12e8084194d751522c99e53b5
|
3 |
+
size 4879043437
|
pytorch_model-00004-of-00007.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34d6f19c4295c04255fcdebccd83b9a7768584d33db6426350dce44c9d2bebc4
|
3 |
+
size 4879043437
|
pytorch_model-00005-of-00007.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e584b23cec40945a33df1465d9df128b01f08780ce06d75793c787ad2199bf94
|
3 |
+
size 4879043437
|
pytorch_model-00006-of-00007.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f728859761efca7d6e8ea7a0385ced26e22b2c3e3cd18f4aa4206e363e49a9ab
|
3 |
+
size 4879043437
|
pytorch_model-00007-of-00007.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:403de3a4d63a3fbc964476f7cdee8aa8349242eac732621b199330d1b41e0ecd
|
3 |
+
size 4876727583
|