Update models
Browse files- .gitattributes +15 -0
- Qwen3-30B-A3B-Q2_K.gguf +3 -0
- Qwen3-30B-A3B-Q3_K_L.gguf +3 -0
- Qwen3-30B-A3B-Q3_K_M.gguf +3 -0
- Qwen3-30B-A3B-Q3_K_S.gguf +3 -0
- Qwen3-30B-A3B-Q4_0.gguf +3 -0
- Qwen3-30B-A3B-Q4_K_M.gguf +3 -0
- Qwen3-30B-A3B-Q4_K_S.gguf +3 -0
- Qwen3-30B-A3B-Q5_0.gguf +3 -0
- Qwen3-30B-A3B-Q5_K_M.gguf +3 -0
- Qwen3-30B-A3B-Q5_K_S.gguf +3 -0
- Qwen3-30B-A3B-Q6_K.gguf +3 -0
- Qwen3-30B-A3B-Q8_0.gguf +3 -0
- Qwen3-30B-A3B-f16-00001-of-00003.gguf +3 -0
- Qwen3-30B-A3B-f16-00002-of-00003.gguf +3 -0
- Qwen3-30B-A3B-f16-00003-of-00003.gguf +3 -0
- config.json +38 -0
.gitattributes
CHANGED
@@ -33,3 +33,18 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
33 |
*.zip filter=lfs diff=lfs merge=lfs -text
|
34 |
*.zst filter=lfs diff=lfs merge=lfs -text
|
35 |
*tfevents* filter=lfs diff=lfs merge=lfs -text
|
36 |
+
Qwen3-30B-A3B-Q2_K.gguf filter=lfs diff=lfs merge=lfs -text
|
37 |
+
Qwen3-30B-A3B-Q3_K_L.gguf filter=lfs diff=lfs merge=lfs -text
|
38 |
+
Qwen3-30B-A3B-Q3_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
39 |
+
Qwen3-30B-A3B-Q3_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
40 |
+
Qwen3-30B-A3B-Q4_0.gguf filter=lfs diff=lfs merge=lfs -text
|
41 |
+
Qwen3-30B-A3B-Q4_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
42 |
+
Qwen3-30B-A3B-Q4_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
43 |
+
Qwen3-30B-A3B-Q5_0.gguf filter=lfs diff=lfs merge=lfs -text
|
44 |
+
Qwen3-30B-A3B-Q5_K_M.gguf filter=lfs diff=lfs merge=lfs -text
|
45 |
+
Qwen3-30B-A3B-Q5_K_S.gguf filter=lfs diff=lfs merge=lfs -text
|
46 |
+
Qwen3-30B-A3B-Q6_K.gguf filter=lfs diff=lfs merge=lfs -text
|
47 |
+
Qwen3-30B-A3B-Q8_0.gguf filter=lfs diff=lfs merge=lfs -text
|
48 |
+
Qwen3-30B-A3B-f16-00001-of-00003.gguf filter=lfs diff=lfs merge=lfs -text
|
49 |
+
Qwen3-30B-A3B-f16-00002-of-00003.gguf filter=lfs diff=lfs merge=lfs -text
|
50 |
+
Qwen3-30B-A3B-f16-00003-of-00003.gguf filter=lfs diff=lfs merge=lfs -text
|
Qwen3-30B-A3B-Q2_K.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f5504ab72182288f7d794aeb9647647496754c0a777c3eb5faf4045f3b8b2bfb
|
3 |
+
size 11258609568
|
Qwen3-30B-A3B-Q3_K_L.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e2f1592c6a0e54dbf98dc2f0876cd75b006010e954abb0bfd54f5ef6490164df
|
3 |
+
size 15900669856
|
Qwen3-30B-A3B-Q3_K_M.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c4bf314a2505fbc78637a83e87fed061964ef79b3bcc508a8d4d1f23dc9e46df
|
3 |
+
size 14711846816
|
Qwen3-30B-A3B-Q3_K_S.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4b689267ba923035bf51be1381a610a5349f6f72962be20f56934d534882326
|
3 |
+
size 13292468128
|
Qwen3-30B-A3B-Q4_0.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f2cc7707c7fba2fe2cbc4d74dec0aefeffcf163cf9ac8c8f08d7fcf9644ac260
|
3 |
+
size 17304489888
|
Qwen3-30B-A3B-Q4_K_M.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c2dcb989171190cb65ca4b2663fd3d17c6b17fa074e8c3e712bbb0c8b67bef9b
|
3 |
+
size 18556686240
|
Qwen3-30B-A3B-Q4_K_S.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5bfa4cad6dc1fcd79d58de0d0443c8c759cc7bb4d6176fb0b7c780f45d7b793a
|
3 |
+
size 17456009120
|
Qwen3-30B-A3B-Q5_0.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1b47c6609f4ca8f08ed4ae3e0a4f00fb41c720c1a9cba1af60490d8eabc1fba6
|
3 |
+
size 21080510368
|
Qwen3-30B-A3B-Q5_K_M.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e664ed4aa9f79e7160cdf09eeb0f4d18d19aa5faec03cb5495747aec35814b9e
|
3 |
+
size 21725581216
|
Qwen3-30B-A3B-Q5_K_S.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cf5dbeadb910b95f14ebe3e93ebc1e7c2315a5f1738a86a4174101d320d08de1
|
3 |
+
size 21080510368
|
Qwen3-30B-A3B-Q6_K.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f0d7f357d25782b6faba0d64bc7912942e7360c4c346ca7e1fb0cbf40fb0fef9
|
3 |
+
size 25092532128
|
Qwen3-30B-A3B-Q8_0.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f804d1c2d37e5c7929bd3541428a471d69a84aa5023d1a7a47fd5941c34475df
|
3 |
+
size 32483932064
|
Qwen3-30B-A3B-f16-00001-of-00003.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d81c3fdfabe25eef69f831a11a14c61b1ab1fc95fd83a7333f76a210345f656
|
3 |
+
size 29706750496
|
Qwen3-30B-A3B-f16-00002-of-00003.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3fd1799712bc147cea24e82f8670d85e425b1ae6e8406c87a26867f14b3787f3
|
3 |
+
size 29558738080
|
Qwen3-30B-A3B-f16-00003-of-00003.gguf
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6011ea3b4306a739a5b56208ed4d929a324bd7cce3db80c3cbee1404a60dc48e
|
3 |
+
size 1830314528
|
config.json
ADDED
@@ -0,0 +1,38 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"architectures": [
|
3 |
+
"Qwen3MoeForCausalLM"
|
4 |
+
],
|
5 |
+
"attention_bias": false,
|
6 |
+
"attention_dropout": 0.0,
|
7 |
+
"bos_token_id": 151643,
|
8 |
+
"decoder_sparse_step": 1,
|
9 |
+
"eos_token_id": 151645,
|
10 |
+
"head_dim": 128,
|
11 |
+
"hidden_act": "silu",
|
12 |
+
"hidden_size": 2048,
|
13 |
+
"initializer_range": 0.02,
|
14 |
+
"intermediate_size": 6144,
|
15 |
+
"max_position_embeddings": 40960,
|
16 |
+
"max_window_layers": 48,
|
17 |
+
"mlp_only_layers": [],
|
18 |
+
"model_type": "qwen3_moe",
|
19 |
+
"moe_intermediate_size": 768,
|
20 |
+
"norm_topk_prob": true,
|
21 |
+
"num_attention_heads": 32,
|
22 |
+
"num_experts": 128,
|
23 |
+
"num_experts_per_tok": 8,
|
24 |
+
"num_hidden_layers": 48,
|
25 |
+
"num_key_value_heads": 4,
|
26 |
+
"output_router_logits": false,
|
27 |
+
"rms_norm_eps": 1e-06,
|
28 |
+
"rope_scaling": null,
|
29 |
+
"rope_theta": 1000000.0,
|
30 |
+
"router_aux_loss_coef": 0.001,
|
31 |
+
"sliding_window": null,
|
32 |
+
"tie_word_embeddings": false,
|
33 |
+
"torch_dtype": "bfloat16",
|
34 |
+
"transformers_version": "4.51.0",
|
35 |
+
"use_cache": true,
|
36 |
+
"use_sliding_window": false,
|
37 |
+
"vocab_size": 151936
|
38 |
+
}
|