Upload 11 files
Browse files- DeepSeek-v2.5-1210-UD-iq1_m-00001-of-00002.gguf.tensors.txt +540 -0
- DeepSeek-v2.5-1210-UD-iq1_m-00002-of-00002.gguf.tensors.txt +489 -0
- DeepSeek-v2.5-1210-UD-iq1_s-00001-of-00002.gguf.tensors.txt +540 -0
- DeepSeek-v2.5-1210-UD-iq1_s-00002-of-00002.gguf.tensors.txt +489 -0
- DeepSeek-v2.5-1210-UD-iq2_s-00001-of-00002.gguf.tensors.txt +540 -0
- DeepSeek-v2.5-1210-UD-iq2_s-00002-of-00002.gguf.tensors.txt +489 -0
- DeepSeek-v2.5-1210-UD-iq2_xxs-00001-of-00002.gguf.tensors.txt +537 -0
- DeepSeek-v2.5-1210-UD-iq2_xxs-00002-of-00002.gguf.tensors.txt +492 -0
- DeepSeek-v2.5-1210-UD-iq3_m-00001-of-00003.gguf.tensors.txt +380 -0
- DeepSeek-v2.5-1210-UD-iq3_m-00002-of-00003.gguf.tensors.txt +330 -0
- DeepSeek-v2.5-1210-UD-iq3_m-00003-of-00003.gguf.tensors.txt +329 -0
DeepSeek-v2.5-1210-UD-iq1_m-00001-of-00002.gguf.tensors.txt
ADDED
@@ -0,0 +1,540 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
INFO:gguf-dump:* Loading: DeepSeek-v2.5-1210-UD-iq1_m-00001-of-00002.gguf
|
2 |
+
* File is LITTLE endian, script is running on a LITTLE endian host.
|
3 |
+
* Dumping 56 key/value pair(s)
|
4 |
+
1: UINT32 | 1 | GGUF.version = 3
|
5 |
+
2: UINT64 | 1 | GGUF.tensor_count = 480
|
6 |
+
3: UINT64 | 1 | GGUF.kv_count = 53
|
7 |
+
4: STRING | 1 | general.architecture = 'deepseek2'
|
8 |
+
5: STRING | 1 | general.type = 'model'
|
9 |
+
6: STRING | 1 | general.name = 'Dsv25'
|
10 |
+
7: STRING | 1 | general.size_label = '160x14B'
|
11 |
+
8: STRING | 1 | general.license = 'other'
|
12 |
+
9: STRING | 1 | general.license.name = 'deepseek'
|
13 |
+
10: STRING | 1 | general.license.link = 'https://github.com/deepseek-ai/DeepSeek-V2/blob/main/LICENSE'
|
14 |
+
11: UINT32 | 1 | deepseek2.block_count = 60
|
15 |
+
12: UINT32 | 1 | deepseek2.context_length = 163840
|
16 |
+
13: UINT32 | 1 | deepseek2.embedding_length = 5120
|
17 |
+
14: UINT32 | 1 | deepseek2.feed_forward_length = 12288
|
18 |
+
15: UINT32 | 1 | deepseek2.attention.head_count = 128
|
19 |
+
16: UINT32 | 1 | deepseek2.attention.head_count_kv = 128
|
20 |
+
17: FLOAT32 | 1 | deepseek2.rope.freq_base = 10000.0
|
21 |
+
18: FLOAT32 | 1 | deepseek2.attention.layer_norm_rms_epsilon = 9.999999974752427e-07
|
22 |
+
19: UINT32 | 1 | deepseek2.expert_used_count = 6
|
23 |
+
20: UINT32 | 1 | deepseek2.leading_dense_block_count = 1
|
24 |
+
21: UINT32 | 1 | deepseek2.vocab_size = 102400
|
25 |
+
22: UINT32 | 1 | deepseek2.attention.q_lora_rank = 1536
|
26 |
+
23: UINT32 | 1 | deepseek2.attention.kv_lora_rank = 512
|
27 |
+
24: UINT32 | 1 | deepseek2.attention.key_length = 192
|
28 |
+
25: UINT32 | 1 | deepseek2.attention.value_length = 128
|
29 |
+
26: UINT32 | 1 | deepseek2.expert_feed_forward_length = 1536
|
30 |
+
27: UINT32 | 1 | deepseek2.expert_count = 160
|
31 |
+
28: UINT32 | 1 | deepseek2.expert_shared_count = 2
|
32 |
+
29: FLOAT32 | 1 | deepseek2.expert_weights_scale = 16.0
|
33 |
+
30: BOOL | 1 | deepseek2.expert_weights_norm = False
|
34 |
+
31: UINT32 | 1 | deepseek2.expert_gating_func = 1
|
35 |
+
32: UINT32 | 1 | deepseek2.rope.dimension_count = 64
|
36 |
+
33: STRING | 1 | deepseek2.rope.scaling.type = 'yarn'
|
37 |
+
34: FLOAT32 | 1 | deepseek2.rope.scaling.factor = 40.0
|
38 |
+
35: UINT32 | 1 | deepseek2.rope.scaling.original_context_length = 4096
|
39 |
+
36: FLOAT32 | 1 | deepseek2.rope.scaling.yarn_log_multiplier = 0.10000000149011612
|
40 |
+
37: STRING | 1 | tokenizer.ggml.model = 'gpt2'
|
41 |
+
38: STRING | 1 | tokenizer.ggml.pre = 'deepseek-llm'
|
42 |
+
39: [STRING] | 102400 | tokenizer.ggml.tokens
|
43 |
+
40: [INT32] | 102400 | tokenizer.ggml.token_type
|
44 |
+
41: [STRING] | 99757 | tokenizer.ggml.merges
|
45 |
+
42: UINT32 | 1 | tokenizer.ggml.bos_token_id = 100000
|
46 |
+
43: UINT32 | 1 | tokenizer.ggml.eos_token_id = 100001
|
47 |
+
44: UINT32 | 1 | tokenizer.ggml.padding_token_id = 100001
|
48 |
+
45: BOOL | 1 | tokenizer.ggml.add_bos_token = True
|
49 |
+
46: BOOL | 1 | tokenizer.ggml.add_eos_token = False
|
50 |
+
47: STRING | 1 | tokenizer.chat_template = '{% if not add_generation_prompt is defined %}{% set add_gene'
|
51 |
+
48: UINT32 | 1 | general.quantization_version = 2
|
52 |
+
49: UINT32 | 1 | general.file_type = 31
|
53 |
+
50: STRING | 1 | quantize.imatrix.file = '/archive/nuc/LLM/raw/imatrix-DeepSeek-V2.5-1210-bartowski.da'
|
54 |
+
51: STRING | 1 | quantize.imatrix.dataset = '/training_dir/calibration_datav3.txt'
|
55 |
+
52: INT32 | 1 | quantize.imatrix.entries_count = 716
|
56 |
+
53: INT32 | 1 | quantize.imatrix.chunks_count = 139
|
57 |
+
54: UINT16 | 1 | split.no = 0
|
58 |
+
55: INT32 | 1 | split.tensors.count = 959
|
59 |
+
56: UINT16 | 1 | split.count = 2
|
60 |
+
* Dumping 480 tensor(s)
|
61 |
+
1: 524288000 | 5120, 102400, 1, 1 | Q6_K | output.weight
|
62 |
+
2: 5120 | 5120, 1, 1, 1 | F32 | output_norm.weight
|
63 |
+
3: 524288000 | 5120, 102400, 1, 1 | Q6_K | token_embd.weight
|
64 |
+
4: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.0.attn_kv_a_mqa.weight
|
65 |
+
5: 512 | 512, 1, 1, 1 | F32 | blk.0.attn_kv_a_norm.weight
|
66 |
+
6: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.0.attn_kv_b.weight
|
67 |
+
7: 5120 | 5120, 1, 1, 1 | F32 | blk.0.attn_norm.weight
|
68 |
+
8: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.0.attn_output.weight
|
69 |
+
9: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.0.attn_q_a.weight
|
70 |
+
10: 1536 | 1536, 1, 1, 1 | F32 | blk.0.attn_q_a_norm.weight
|
71 |
+
11: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.0.attn_q_b.weight
|
72 |
+
12: 62914560 | 12288, 5120, 1, 1 | Q6_K | blk.0.ffn_down.weight
|
73 |
+
13: 62914560 | 5120, 12288, 1, 1 | Q4_K | blk.0.ffn_gate.weight
|
74 |
+
14: 5120 | 5120, 1, 1, 1 | F32 | blk.0.ffn_norm.weight
|
75 |
+
15: 62914560 | 5120, 12288, 1, 1 | Q4_K | blk.0.ffn_up.weight
|
76 |
+
16: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.1.attn_kv_a_mqa.weight
|
77 |
+
17: 512 | 512, 1, 1, 1 | F32 | blk.1.attn_kv_a_norm.weight
|
78 |
+
18: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.1.attn_kv_b.weight
|
79 |
+
19: 5120 | 5120, 1, 1, 1 | F32 | blk.1.attn_norm.weight
|
80 |
+
20: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.1.attn_output.weight
|
81 |
+
21: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.1.attn_q_a.weight
|
82 |
+
22: 1536 | 1536, 1, 1, 1 | F32 | blk.1.attn_q_a_norm.weight
|
83 |
+
23: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.1.attn_q_b.weight
|
84 |
+
24: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.1.ffn_down_exps.weight
|
85 |
+
25: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.1.ffn_down_shexp.weight
|
86 |
+
26: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.1.ffn_gate_exps.weight
|
87 |
+
27: 819200 | 5120, 160, 1, 1 | F32 | blk.1.ffn_gate_inp.weight
|
88 |
+
28: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.1.ffn_gate_shexp.weight
|
89 |
+
29: 5120 | 5120, 1, 1, 1 | F32 | blk.1.ffn_norm.weight
|
90 |
+
30: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.1.ffn_up_exps.weight
|
91 |
+
31: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.1.ffn_up_shexp.weight
|
92 |
+
32: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.2.attn_kv_a_mqa.weight
|
93 |
+
33: 512 | 512, 1, 1, 1 | F32 | blk.2.attn_kv_a_norm.weight
|
94 |
+
34: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.2.attn_kv_b.weight
|
95 |
+
35: 5120 | 5120, 1, 1, 1 | F32 | blk.2.attn_norm.weight
|
96 |
+
36: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.2.attn_output.weight
|
97 |
+
37: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.2.attn_q_a.weight
|
98 |
+
38: 1536 | 1536, 1, 1, 1 | F32 | blk.2.attn_q_a_norm.weight
|
99 |
+
39: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.2.attn_q_b.weight
|
100 |
+
40: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.2.ffn_down_exps.weight
|
101 |
+
41: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.2.ffn_down_shexp.weight
|
102 |
+
42: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.2.ffn_gate_exps.weight
|
103 |
+
43: 819200 | 5120, 160, 1, 1 | F32 | blk.2.ffn_gate_inp.weight
|
104 |
+
44: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.2.ffn_gate_shexp.weight
|
105 |
+
45: 5120 | 5120, 1, 1, 1 | F32 | blk.2.ffn_norm.weight
|
106 |
+
46: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.2.ffn_up_exps.weight
|
107 |
+
47: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.2.ffn_up_shexp.weight
|
108 |
+
48: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.3.attn_kv_a_mqa.weight
|
109 |
+
49: 512 | 512, 1, 1, 1 | F32 | blk.3.attn_kv_a_norm.weight
|
110 |
+
50: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.3.attn_kv_b.weight
|
111 |
+
51: 5120 | 5120, 1, 1, 1 | F32 | blk.3.attn_norm.weight
|
112 |
+
52: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.3.attn_output.weight
|
113 |
+
53: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.3.attn_q_a.weight
|
114 |
+
54: 1536 | 1536, 1, 1, 1 | F32 | blk.3.attn_q_a_norm.weight
|
115 |
+
55: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.3.attn_q_b.weight
|
116 |
+
56: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.3.ffn_down_exps.weight
|
117 |
+
57: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.3.ffn_down_shexp.weight
|
118 |
+
58: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.3.ffn_gate_exps.weight
|
119 |
+
59: 819200 | 5120, 160, 1, 1 | F32 | blk.3.ffn_gate_inp.weight
|
120 |
+
60: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.3.ffn_gate_shexp.weight
|
121 |
+
61: 5120 | 5120, 1, 1, 1 | F32 | blk.3.ffn_norm.weight
|
122 |
+
62: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.3.ffn_up_exps.weight
|
123 |
+
63: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.3.ffn_up_shexp.weight
|
124 |
+
64: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.4.attn_kv_a_mqa.weight
|
125 |
+
65: 512 | 512, 1, 1, 1 | F32 | blk.4.attn_kv_a_norm.weight
|
126 |
+
66: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.4.attn_kv_b.weight
|
127 |
+
67: 5120 | 5120, 1, 1, 1 | F32 | blk.4.attn_norm.weight
|
128 |
+
68: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.4.attn_output.weight
|
129 |
+
69: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.4.attn_q_a.weight
|
130 |
+
70: 1536 | 1536, 1, 1, 1 | F32 | blk.4.attn_q_a_norm.weight
|
131 |
+
71: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.4.attn_q_b.weight
|
132 |
+
72: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.4.ffn_down_exps.weight
|
133 |
+
73: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.4.ffn_down_shexp.weight
|
134 |
+
74: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.4.ffn_gate_exps.weight
|
135 |
+
75: 819200 | 5120, 160, 1, 1 | F32 | blk.4.ffn_gate_inp.weight
|
136 |
+
76: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.4.ffn_gate_shexp.weight
|
137 |
+
77: 5120 | 5120, 1, 1, 1 | F32 | blk.4.ffn_norm.weight
|
138 |
+
78: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.4.ffn_up_exps.weight
|
139 |
+
79: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.4.ffn_up_shexp.weight
|
140 |
+
80: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.5.attn_kv_a_mqa.weight
|
141 |
+
81: 512 | 512, 1, 1, 1 | F32 | blk.5.attn_kv_a_norm.weight
|
142 |
+
82: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.5.attn_kv_b.weight
|
143 |
+
83: 5120 | 5120, 1, 1, 1 | F32 | blk.5.attn_norm.weight
|
144 |
+
84: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.5.attn_output.weight
|
145 |
+
85: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.5.attn_q_a.weight
|
146 |
+
86: 1536 | 1536, 1, 1, 1 | F32 | blk.5.attn_q_a_norm.weight
|
147 |
+
87: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.5.attn_q_b.weight
|
148 |
+
88: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.5.ffn_down_exps.weight
|
149 |
+
89: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.5.ffn_down_shexp.weight
|
150 |
+
90: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.5.ffn_gate_exps.weight
|
151 |
+
91: 819200 | 5120, 160, 1, 1 | F32 | blk.5.ffn_gate_inp.weight
|
152 |
+
92: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.5.ffn_gate_shexp.weight
|
153 |
+
93: 5120 | 5120, 1, 1, 1 | F32 | blk.5.ffn_norm.weight
|
154 |
+
94: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.5.ffn_up_exps.weight
|
155 |
+
95: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.5.ffn_up_shexp.weight
|
156 |
+
96: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.6.attn_kv_a_mqa.weight
|
157 |
+
97: 512 | 512, 1, 1, 1 | F32 | blk.6.attn_kv_a_norm.weight
|
158 |
+
98: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.6.attn_kv_b.weight
|
159 |
+
99: 5120 | 5120, 1, 1, 1 | F32 | blk.6.attn_norm.weight
|
160 |
+
100: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.6.attn_output.weight
|
161 |
+
101: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.6.attn_q_a.weight
|
162 |
+
102: 1536 | 1536, 1, 1, 1 | F32 | blk.6.attn_q_a_norm.weight
|
163 |
+
103: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.6.attn_q_b.weight
|
164 |
+
104: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.6.ffn_down_exps.weight
|
165 |
+
105: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.6.ffn_down_shexp.weight
|
166 |
+
106: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.6.ffn_gate_exps.weight
|
167 |
+
107: 819200 | 5120, 160, 1, 1 | F32 | blk.6.ffn_gate_inp.weight
|
168 |
+
108: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.6.ffn_gate_shexp.weight
|
169 |
+
109: 5120 | 5120, 1, 1, 1 | F32 | blk.6.ffn_norm.weight
|
170 |
+
110: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.6.ffn_up_exps.weight
|
171 |
+
111: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.6.ffn_up_shexp.weight
|
172 |
+
112: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.7.attn_kv_a_mqa.weight
|
173 |
+
113: 512 | 512, 1, 1, 1 | F32 | blk.7.attn_kv_a_norm.weight
|
174 |
+
114: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.7.attn_kv_b.weight
|
175 |
+
115: 5120 | 5120, 1, 1, 1 | F32 | blk.7.attn_norm.weight
|
176 |
+
116: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.7.attn_output.weight
|
177 |
+
117: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.7.attn_q_a.weight
|
178 |
+
118: 1536 | 1536, 1, 1, 1 | F32 | blk.7.attn_q_a_norm.weight
|
179 |
+
119: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.7.attn_q_b.weight
|
180 |
+
120: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.7.ffn_down_exps.weight
|
181 |
+
121: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.7.ffn_down_shexp.weight
|
182 |
+
122: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.7.ffn_gate_exps.weight
|
183 |
+
123: 819200 | 5120, 160, 1, 1 | F32 | blk.7.ffn_gate_inp.weight
|
184 |
+
124: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.7.ffn_gate_shexp.weight
|
185 |
+
125: 5120 | 5120, 1, 1, 1 | F32 | blk.7.ffn_norm.weight
|
186 |
+
126: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.7.ffn_up_exps.weight
|
187 |
+
127: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.7.ffn_up_shexp.weight
|
188 |
+
128: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.8.attn_kv_a_mqa.weight
|
189 |
+
129: 512 | 512, 1, 1, 1 | F32 | blk.8.attn_kv_a_norm.weight
|
190 |
+
130: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.8.attn_kv_b.weight
|
191 |
+
131: 5120 | 5120, 1, 1, 1 | F32 | blk.8.attn_norm.weight
|
192 |
+
132: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.8.attn_output.weight
|
193 |
+
133: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.8.attn_q_a.weight
|
194 |
+
134: 1536 | 1536, 1, 1, 1 | F32 | blk.8.attn_q_a_norm.weight
|
195 |
+
135: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.8.attn_q_b.weight
|
196 |
+
136: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.8.ffn_down_exps.weight
|
197 |
+
137: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.8.ffn_down_shexp.weight
|
198 |
+
138: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.8.ffn_gate_exps.weight
|
199 |
+
139: 819200 | 5120, 160, 1, 1 | F32 | blk.8.ffn_gate_inp.weight
|
200 |
+
140: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.8.ffn_gate_shexp.weight
|
201 |
+
141: 5120 | 5120, 1, 1, 1 | F32 | blk.8.ffn_norm.weight
|
202 |
+
142: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.8.ffn_up_exps.weight
|
203 |
+
143: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.8.ffn_up_shexp.weight
|
204 |
+
144: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.9.attn_kv_a_mqa.weight
|
205 |
+
145: 512 | 512, 1, 1, 1 | F32 | blk.9.attn_kv_a_norm.weight
|
206 |
+
146: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.9.attn_kv_b.weight
|
207 |
+
147: 5120 | 5120, 1, 1, 1 | F32 | blk.9.attn_norm.weight
|
208 |
+
148: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.9.attn_output.weight
|
209 |
+
149: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.9.attn_q_a.weight
|
210 |
+
150: 1536 | 1536, 1, 1, 1 | F32 | blk.9.attn_q_a_norm.weight
|
211 |
+
151: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.9.attn_q_b.weight
|
212 |
+
152: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.9.ffn_down_exps.weight
|
213 |
+
153: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.9.ffn_down_shexp.weight
|
214 |
+
154: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.9.ffn_gate_exps.weight
|
215 |
+
155: 819200 | 5120, 160, 1, 1 | F32 | blk.9.ffn_gate_inp.weight
|
216 |
+
156: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.9.ffn_gate_shexp.weight
|
217 |
+
157: 5120 | 5120, 1, 1, 1 | F32 | blk.9.ffn_norm.weight
|
218 |
+
158: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.9.ffn_up_exps.weight
|
219 |
+
159: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.9.ffn_up_shexp.weight
|
220 |
+
160: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.10.attn_kv_a_mqa.weight
|
221 |
+
161: 512 | 512, 1, 1, 1 | F32 | blk.10.attn_kv_a_norm.weight
|
222 |
+
162: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.10.attn_kv_b.weight
|
223 |
+
163: 5120 | 5120, 1, 1, 1 | F32 | blk.10.attn_norm.weight
|
224 |
+
164: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.10.attn_output.weight
|
225 |
+
165: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.10.attn_q_a.weight
|
226 |
+
166: 1536 | 1536, 1, 1, 1 | F32 | blk.10.attn_q_a_norm.weight
|
227 |
+
167: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.10.attn_q_b.weight
|
228 |
+
168: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.10.ffn_down_exps.weight
|
229 |
+
169: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.10.ffn_down_shexp.weight
|
230 |
+
170: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.10.ffn_gate_exps.weight
|
231 |
+
171: 819200 | 5120, 160, 1, 1 | F32 | blk.10.ffn_gate_inp.weight
|
232 |
+
172: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.10.ffn_gate_shexp.weight
|
233 |
+
173: 5120 | 5120, 1, 1, 1 | F32 | blk.10.ffn_norm.weight
|
234 |
+
174: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.10.ffn_up_exps.weight
|
235 |
+
175: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.10.ffn_up_shexp.weight
|
236 |
+
176: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.11.attn_kv_a_mqa.weight
|
237 |
+
177: 512 | 512, 1, 1, 1 | F32 | blk.11.attn_kv_a_norm.weight
|
238 |
+
178: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.11.attn_kv_b.weight
|
239 |
+
179: 5120 | 5120, 1, 1, 1 | F32 | blk.11.attn_norm.weight
|
240 |
+
180: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.11.attn_output.weight
|
241 |
+
181: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.11.attn_q_a.weight
|
242 |
+
182: 1536 | 1536, 1, 1, 1 | F32 | blk.11.attn_q_a_norm.weight
|
243 |
+
183: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.11.attn_q_b.weight
|
244 |
+
184: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.11.ffn_down_exps.weight
|
245 |
+
185: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.11.ffn_down_shexp.weight
|
246 |
+
186: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.11.ffn_gate_exps.weight
|
247 |
+
187: 819200 | 5120, 160, 1, 1 | F32 | blk.11.ffn_gate_inp.weight
|
248 |
+
188: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.11.ffn_gate_shexp.weight
|
249 |
+
189: 5120 | 5120, 1, 1, 1 | F32 | blk.11.ffn_norm.weight
|
250 |
+
190: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.11.ffn_up_exps.weight
|
251 |
+
191: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.11.ffn_up_shexp.weight
|
252 |
+
192: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.12.attn_kv_a_mqa.weight
|
253 |
+
193: 512 | 512, 1, 1, 1 | F32 | blk.12.attn_kv_a_norm.weight
|
254 |
+
194: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.12.attn_kv_b.weight
|
255 |
+
195: 5120 | 5120, 1, 1, 1 | F32 | blk.12.attn_norm.weight
|
256 |
+
196: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.12.attn_output.weight
|
257 |
+
197: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.12.attn_q_a.weight
|
258 |
+
198: 1536 | 1536, 1, 1, 1 | F32 | blk.12.attn_q_a_norm.weight
|
259 |
+
199: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.12.attn_q_b.weight
|
260 |
+
200: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.12.ffn_down_exps.weight
|
261 |
+
201: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.12.ffn_down_shexp.weight
|
262 |
+
202: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.12.ffn_gate_exps.weight
|
263 |
+
203: 819200 | 5120, 160, 1, 1 | F32 | blk.12.ffn_gate_inp.weight
|
264 |
+
204: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.12.ffn_gate_shexp.weight
|
265 |
+
205: 5120 | 5120, 1, 1, 1 | F32 | blk.12.ffn_norm.weight
|
266 |
+
206: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.12.ffn_up_exps.weight
|
267 |
+
207: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.12.ffn_up_shexp.weight
|
268 |
+
208: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.13.attn_kv_a_mqa.weight
|
269 |
+
209: 512 | 512, 1, 1, 1 | F32 | blk.13.attn_kv_a_norm.weight
|
270 |
+
210: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.13.attn_kv_b.weight
|
271 |
+
211: 5120 | 5120, 1, 1, 1 | F32 | blk.13.attn_norm.weight
|
272 |
+
212: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.13.attn_output.weight
|
273 |
+
213: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.13.attn_q_a.weight
|
274 |
+
214: 1536 | 1536, 1, 1, 1 | F32 | blk.13.attn_q_a_norm.weight
|
275 |
+
215: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.13.attn_q_b.weight
|
276 |
+
216: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.13.ffn_down_exps.weight
|
277 |
+
217: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.13.ffn_down_shexp.weight
|
278 |
+
218: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.13.ffn_gate_exps.weight
|
279 |
+
219: 819200 | 5120, 160, 1, 1 | F32 | blk.13.ffn_gate_inp.weight
|
280 |
+
220: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.13.ffn_gate_shexp.weight
|
281 |
+
221: 5120 | 5120, 1, 1, 1 | F32 | blk.13.ffn_norm.weight
|
282 |
+
222: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.13.ffn_up_exps.weight
|
283 |
+
223: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.13.ffn_up_shexp.weight
|
284 |
+
224: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.14.attn_kv_a_mqa.weight
|
285 |
+
225: 512 | 512, 1, 1, 1 | F32 | blk.14.attn_kv_a_norm.weight
|
286 |
+
226: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.14.attn_kv_b.weight
|
287 |
+
227: 5120 | 5120, 1, 1, 1 | F32 | blk.14.attn_norm.weight
|
288 |
+
228: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.14.attn_output.weight
|
289 |
+
229: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.14.attn_q_a.weight
|
290 |
+
230: 1536 | 1536, 1, 1, 1 | F32 | blk.14.attn_q_a_norm.weight
|
291 |
+
231: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.14.attn_q_b.weight
|
292 |
+
232: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.14.ffn_down_exps.weight
|
293 |
+
233: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.14.ffn_down_shexp.weight
|
294 |
+
234: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.14.ffn_gate_exps.weight
|
295 |
+
235: 819200 | 5120, 160, 1, 1 | F32 | blk.14.ffn_gate_inp.weight
|
296 |
+
236: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.14.ffn_gate_shexp.weight
|
297 |
+
237: 5120 | 5120, 1, 1, 1 | F32 | blk.14.ffn_norm.weight
|
298 |
+
238: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.14.ffn_up_exps.weight
|
299 |
+
239: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.14.ffn_up_shexp.weight
|
300 |
+
240: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.15.attn_kv_a_mqa.weight
|
301 |
+
241: 512 | 512, 1, 1, 1 | F32 | blk.15.attn_kv_a_norm.weight
|
302 |
+
242: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.15.attn_kv_b.weight
|
303 |
+
243: 5120 | 5120, 1, 1, 1 | F32 | blk.15.attn_norm.weight
|
304 |
+
244: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.15.attn_output.weight
|
305 |
+
245: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.15.attn_q_a.weight
|
306 |
+
246: 1536 | 1536, 1, 1, 1 | F32 | blk.15.attn_q_a_norm.weight
|
307 |
+
247: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.15.attn_q_b.weight
|
308 |
+
248: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.15.ffn_down_exps.weight
|
309 |
+
249: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.15.ffn_down_shexp.weight
|
310 |
+
250: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.15.ffn_gate_exps.weight
|
311 |
+
251: 819200 | 5120, 160, 1, 1 | F32 | blk.15.ffn_gate_inp.weight
|
312 |
+
252: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.15.ffn_gate_shexp.weight
|
313 |
+
253: 5120 | 5120, 1, 1, 1 | F32 | blk.15.ffn_norm.weight
|
314 |
+
254: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.15.ffn_up_exps.weight
|
315 |
+
255: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.15.ffn_up_shexp.weight
|
316 |
+
256: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.16.attn_kv_a_mqa.weight
|
317 |
+
257: 512 | 512, 1, 1, 1 | F32 | blk.16.attn_kv_a_norm.weight
|
318 |
+
258: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.16.attn_kv_b.weight
|
319 |
+
259: 5120 | 5120, 1, 1, 1 | F32 | blk.16.attn_norm.weight
|
320 |
+
260: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.16.attn_output.weight
|
321 |
+
261: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.16.attn_q_a.weight
|
322 |
+
262: 1536 | 1536, 1, 1, 1 | F32 | blk.16.attn_q_a_norm.weight
|
323 |
+
263: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.16.attn_q_b.weight
|
324 |
+
264: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.16.ffn_down_exps.weight
|
325 |
+
265: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.16.ffn_down_shexp.weight
|
326 |
+
266: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.16.ffn_gate_exps.weight
|
327 |
+
267: 819200 | 5120, 160, 1, 1 | F32 | blk.16.ffn_gate_inp.weight
|
328 |
+
268: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.16.ffn_gate_shexp.weight
|
329 |
+
269: 5120 | 5120, 1, 1, 1 | F32 | blk.16.ffn_norm.weight
|
330 |
+
270: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.16.ffn_up_exps.weight
|
331 |
+
271: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.16.ffn_up_shexp.weight
|
332 |
+
272: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.17.attn_kv_a_mqa.weight
|
333 |
+
273: 512 | 512, 1, 1, 1 | F32 | blk.17.attn_kv_a_norm.weight
|
334 |
+
274: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.17.attn_kv_b.weight
|
335 |
+
275: 5120 | 5120, 1, 1, 1 | F32 | blk.17.attn_norm.weight
|
336 |
+
276: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.17.attn_output.weight
|
337 |
+
277: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.17.attn_q_a.weight
|
338 |
+
278: 1536 | 1536, 1, 1, 1 | F32 | blk.17.attn_q_a_norm.weight
|
339 |
+
279: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.17.attn_q_b.weight
|
340 |
+
280: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.17.ffn_down_exps.weight
|
341 |
+
281: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.17.ffn_down_shexp.weight
|
342 |
+
282: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.17.ffn_gate_exps.weight
|
343 |
+
283: 819200 | 5120, 160, 1, 1 | F32 | blk.17.ffn_gate_inp.weight
|
344 |
+
284: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.17.ffn_gate_shexp.weight
|
345 |
+
285: 5120 | 5120, 1, 1, 1 | F32 | blk.17.ffn_norm.weight
|
346 |
+
286: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.17.ffn_up_exps.weight
|
347 |
+
287: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.17.ffn_up_shexp.weight
|
348 |
+
288: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.18.attn_kv_a_mqa.weight
|
349 |
+
289: 512 | 512, 1, 1, 1 | F32 | blk.18.attn_kv_a_norm.weight
|
350 |
+
290: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.18.attn_kv_b.weight
|
351 |
+
291: 5120 | 5120, 1, 1, 1 | F32 | blk.18.attn_norm.weight
|
352 |
+
292: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.18.attn_output.weight
|
353 |
+
293: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.18.attn_q_a.weight
|
354 |
+
294: 1536 | 1536, 1, 1, 1 | F32 | blk.18.attn_q_a_norm.weight
|
355 |
+
295: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.18.attn_q_b.weight
|
356 |
+
296: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.18.ffn_down_exps.weight
|
357 |
+
297: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.18.ffn_down_shexp.weight
|
358 |
+
298: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.18.ffn_gate_exps.weight
|
359 |
+
299: 819200 | 5120, 160, 1, 1 | F32 | blk.18.ffn_gate_inp.weight
|
360 |
+
300: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.18.ffn_gate_shexp.weight
|
361 |
+
301: 5120 | 5120, 1, 1, 1 | F32 | blk.18.ffn_norm.weight
|
362 |
+
302: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.18.ffn_up_exps.weight
|
363 |
+
303: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.18.ffn_up_shexp.weight
|
364 |
+
304: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.19.attn_kv_a_mqa.weight
|
365 |
+
305: 512 | 512, 1, 1, 1 | F32 | blk.19.attn_kv_a_norm.weight
|
366 |
+
306: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.19.attn_kv_b.weight
|
367 |
+
307: 5120 | 5120, 1, 1, 1 | F32 | blk.19.attn_norm.weight
|
368 |
+
308: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.19.attn_output.weight
|
369 |
+
309: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.19.attn_q_a.weight
|
370 |
+
310: 1536 | 1536, 1, 1, 1 | F32 | blk.19.attn_q_a_norm.weight
|
371 |
+
311: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.19.attn_q_b.weight
|
372 |
+
312: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.19.ffn_down_exps.weight
|
373 |
+
313: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.19.ffn_down_shexp.weight
|
374 |
+
314: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.19.ffn_gate_exps.weight
|
375 |
+
315: 819200 | 5120, 160, 1, 1 | F32 | blk.19.ffn_gate_inp.weight
|
376 |
+
316: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.19.ffn_gate_shexp.weight
|
377 |
+
317: 5120 | 5120, 1, 1, 1 | F32 | blk.19.ffn_norm.weight
|
378 |
+
318: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.19.ffn_up_exps.weight
|
379 |
+
319: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.19.ffn_up_shexp.weight
|
380 |
+
320: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.20.attn_kv_a_mqa.weight
|
381 |
+
321: 512 | 512, 1, 1, 1 | F32 | blk.20.attn_kv_a_norm.weight
|
382 |
+
322: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.20.attn_kv_b.weight
|
383 |
+
323: 5120 | 5120, 1, 1, 1 | F32 | blk.20.attn_norm.weight
|
384 |
+
324: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.20.attn_output.weight
|
385 |
+
325: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.20.attn_q_a.weight
|
386 |
+
326: 1536 | 1536, 1, 1, 1 | F32 | blk.20.attn_q_a_norm.weight
|
387 |
+
327: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.20.attn_q_b.weight
|
388 |
+
328: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.20.ffn_down_exps.weight
|
389 |
+
329: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.20.ffn_down_shexp.weight
|
390 |
+
330: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.20.ffn_gate_exps.weight
|
391 |
+
331: 819200 | 5120, 160, 1, 1 | F32 | blk.20.ffn_gate_inp.weight
|
392 |
+
332: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.20.ffn_gate_shexp.weight
|
393 |
+
333: 5120 | 5120, 1, 1, 1 | F32 | blk.20.ffn_norm.weight
|
394 |
+
334: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.20.ffn_up_exps.weight
|
395 |
+
335: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.20.ffn_up_shexp.weight
|
396 |
+
336: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.21.attn_kv_a_mqa.weight
|
397 |
+
337: 512 | 512, 1, 1, 1 | F32 | blk.21.attn_kv_a_norm.weight
|
398 |
+
338: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.21.attn_kv_b.weight
|
399 |
+
339: 5120 | 5120, 1, 1, 1 | F32 | blk.21.attn_norm.weight
|
400 |
+
340: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.21.attn_output.weight
|
401 |
+
341: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.21.attn_q_a.weight
|
402 |
+
342: 1536 | 1536, 1, 1, 1 | F32 | blk.21.attn_q_a_norm.weight
|
403 |
+
343: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.21.attn_q_b.weight
|
404 |
+
344: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.21.ffn_down_exps.weight
|
405 |
+
345: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.21.ffn_down_shexp.weight
|
406 |
+
346: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.21.ffn_gate_exps.weight
|
407 |
+
347: 819200 | 5120, 160, 1, 1 | F32 | blk.21.ffn_gate_inp.weight
|
408 |
+
348: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.21.ffn_gate_shexp.weight
|
409 |
+
349: 5120 | 5120, 1, 1, 1 | F32 | blk.21.ffn_norm.weight
|
410 |
+
350: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.21.ffn_up_exps.weight
|
411 |
+
351: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.21.ffn_up_shexp.weight
|
412 |
+
352: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.22.attn_kv_a_mqa.weight
|
413 |
+
353: 512 | 512, 1, 1, 1 | F32 | blk.22.attn_kv_a_norm.weight
|
414 |
+
354: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.22.attn_kv_b.weight
|
415 |
+
355: 5120 | 5120, 1, 1, 1 | F32 | blk.22.attn_norm.weight
|
416 |
+
356: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.22.attn_output.weight
|
417 |
+
357: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.22.attn_q_a.weight
|
418 |
+
358: 1536 | 1536, 1, 1, 1 | F32 | blk.22.attn_q_a_norm.weight
|
419 |
+
359: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.22.attn_q_b.weight
|
420 |
+
360: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.22.ffn_down_exps.weight
|
421 |
+
361: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.22.ffn_down_shexp.weight
|
422 |
+
362: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.22.ffn_gate_exps.weight
|
423 |
+
363: 819200 | 5120, 160, 1, 1 | F32 | blk.22.ffn_gate_inp.weight
|
424 |
+
364: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.22.ffn_gate_shexp.weight
|
425 |
+
365: 5120 | 5120, 1, 1, 1 | F32 | blk.22.ffn_norm.weight
|
426 |
+
366: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.22.ffn_up_exps.weight
|
427 |
+
367: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.22.ffn_up_shexp.weight
|
428 |
+
368: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.23.attn_kv_a_mqa.weight
|
429 |
+
369: 512 | 512, 1, 1, 1 | F32 | blk.23.attn_kv_a_norm.weight
|
430 |
+
370: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.23.attn_kv_b.weight
|
431 |
+
371: 5120 | 5120, 1, 1, 1 | F32 | blk.23.attn_norm.weight
|
432 |
+
372: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.23.attn_output.weight
|
433 |
+
373: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.23.attn_q_a.weight
|
434 |
+
374: 1536 | 1536, 1, 1, 1 | F32 | blk.23.attn_q_a_norm.weight
|
435 |
+
375: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.23.attn_q_b.weight
|
436 |
+
376: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.23.ffn_down_exps.weight
|
437 |
+
377: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.23.ffn_down_shexp.weight
|
438 |
+
378: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.23.ffn_gate_exps.weight
|
439 |
+
379: 819200 | 5120, 160, 1, 1 | F32 | blk.23.ffn_gate_inp.weight
|
440 |
+
380: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.23.ffn_gate_shexp.weight
|
441 |
+
381: 5120 | 5120, 1, 1, 1 | F32 | blk.23.ffn_norm.weight
|
442 |
+
382: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.23.ffn_up_exps.weight
|
443 |
+
383: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.23.ffn_up_shexp.weight
|
444 |
+
384: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.24.attn_kv_a_mqa.weight
|
445 |
+
385: 512 | 512, 1, 1, 1 | F32 | blk.24.attn_kv_a_norm.weight
|
446 |
+
386: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.24.attn_kv_b.weight
|
447 |
+
387: 5120 | 5120, 1, 1, 1 | F32 | blk.24.attn_norm.weight
|
448 |
+
388: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.24.attn_output.weight
|
449 |
+
389: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.24.attn_q_a.weight
|
450 |
+
390: 1536 | 1536, 1, 1, 1 | F32 | blk.24.attn_q_a_norm.weight
|
451 |
+
391: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.24.attn_q_b.weight
|
452 |
+
392: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.24.ffn_down_exps.weight
|
453 |
+
393: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.24.ffn_down_shexp.weight
|
454 |
+
394: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.24.ffn_gate_exps.weight
|
455 |
+
395: 819200 | 5120, 160, 1, 1 | F32 | blk.24.ffn_gate_inp.weight
|
456 |
+
396: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.24.ffn_gate_shexp.weight
|
457 |
+
397: 5120 | 5120, 1, 1, 1 | F32 | blk.24.ffn_norm.weight
|
458 |
+
398: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.24.ffn_up_exps.weight
|
459 |
+
399: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.24.ffn_up_shexp.weight
|
460 |
+
400: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.25.attn_kv_a_mqa.weight
|
461 |
+
401: 512 | 512, 1, 1, 1 | F32 | blk.25.attn_kv_a_norm.weight
|
462 |
+
402: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.25.attn_kv_b.weight
|
463 |
+
403: 5120 | 5120, 1, 1, 1 | F32 | blk.25.attn_norm.weight
|
464 |
+
404: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.25.attn_output.weight
|
465 |
+
405: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.25.attn_q_a.weight
|
466 |
+
406: 1536 | 1536, 1, 1, 1 | F32 | blk.25.attn_q_a_norm.weight
|
467 |
+
407: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.25.attn_q_b.weight
|
468 |
+
408: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.25.ffn_down_exps.weight
|
469 |
+
409: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.25.ffn_down_shexp.weight
|
470 |
+
410: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.25.ffn_gate_exps.weight
|
471 |
+
411: 819200 | 5120, 160, 1, 1 | F32 | blk.25.ffn_gate_inp.weight
|
472 |
+
412: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.25.ffn_gate_shexp.weight
|
473 |
+
413: 5120 | 5120, 1, 1, 1 | F32 | blk.25.ffn_norm.weight
|
474 |
+
414: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.25.ffn_up_exps.weight
|
475 |
+
415: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.25.ffn_up_shexp.weight
|
476 |
+
416: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.26.attn_kv_a_mqa.weight
|
477 |
+
417: 512 | 512, 1, 1, 1 | F32 | blk.26.attn_kv_a_norm.weight
|
478 |
+
418: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.26.attn_kv_b.weight
|
479 |
+
419: 5120 | 5120, 1, 1, 1 | F32 | blk.26.attn_norm.weight
|
480 |
+
420: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.26.attn_output.weight
|
481 |
+
421: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.26.attn_q_a.weight
|
482 |
+
422: 1536 | 1536, 1, 1, 1 | F32 | blk.26.attn_q_a_norm.weight
|
483 |
+
423: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.26.attn_q_b.weight
|
484 |
+
424: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.26.ffn_down_exps.weight
|
485 |
+
425: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.26.ffn_down_shexp.weight
|
486 |
+
426: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.26.ffn_gate_exps.weight
|
487 |
+
427: 819200 | 5120, 160, 1, 1 | F32 | blk.26.ffn_gate_inp.weight
|
488 |
+
428: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.26.ffn_gate_shexp.weight
|
489 |
+
429: 5120 | 5120, 1, 1, 1 | F32 | blk.26.ffn_norm.weight
|
490 |
+
430: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.26.ffn_up_exps.weight
|
491 |
+
431: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.26.ffn_up_shexp.weight
|
492 |
+
432: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.27.attn_kv_a_mqa.weight
|
493 |
+
433: 512 | 512, 1, 1, 1 | F32 | blk.27.attn_kv_a_norm.weight
|
494 |
+
434: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.27.attn_kv_b.weight
|
495 |
+
435: 5120 | 5120, 1, 1, 1 | F32 | blk.27.attn_norm.weight
|
496 |
+
436: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.27.attn_output.weight
|
497 |
+
437: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.27.attn_q_a.weight
|
498 |
+
438: 1536 | 1536, 1, 1, 1 | F32 | blk.27.attn_q_a_norm.weight
|
499 |
+
439: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.27.attn_q_b.weight
|
500 |
+
440: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.27.ffn_down_exps.weight
|
501 |
+
441: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.27.ffn_down_shexp.weight
|
502 |
+
442: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.27.ffn_gate_exps.weight
|
503 |
+
443: 819200 | 5120, 160, 1, 1 | F32 | blk.27.ffn_gate_inp.weight
|
504 |
+
444: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.27.ffn_gate_shexp.weight
|
505 |
+
445: 5120 | 5120, 1, 1, 1 | F32 | blk.27.ffn_norm.weight
|
506 |
+
446: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.27.ffn_up_exps.weight
|
507 |
+
447: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.27.ffn_up_shexp.weight
|
508 |
+
448: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.28.attn_kv_a_mqa.weight
|
509 |
+
449: 512 | 512, 1, 1, 1 | F32 | blk.28.attn_kv_a_norm.weight
|
510 |
+
450: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.28.attn_kv_b.weight
|
511 |
+
451: 5120 | 5120, 1, 1, 1 | F32 | blk.28.attn_norm.weight
|
512 |
+
452: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.28.attn_output.weight
|
513 |
+
453: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.28.attn_q_a.weight
|
514 |
+
454: 1536 | 1536, 1, 1, 1 | F32 | blk.28.attn_q_a_norm.weight
|
515 |
+
455: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.28.attn_q_b.weight
|
516 |
+
456: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.28.ffn_down_exps.weight
|
517 |
+
457: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.28.ffn_down_shexp.weight
|
518 |
+
458: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.28.ffn_gate_exps.weight
|
519 |
+
459: 819200 | 5120, 160, 1, 1 | F32 | blk.28.ffn_gate_inp.weight
|
520 |
+
460: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.28.ffn_gate_shexp.weight
|
521 |
+
461: 5120 | 5120, 1, 1, 1 | F32 | blk.28.ffn_norm.weight
|
522 |
+
462: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.28.ffn_up_exps.weight
|
523 |
+
463: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.28.ffn_up_shexp.weight
|
524 |
+
464: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.29.attn_kv_a_mqa.weight
|
525 |
+
465: 512 | 512, 1, 1, 1 | F32 | blk.29.attn_kv_a_norm.weight
|
526 |
+
466: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.29.attn_kv_b.weight
|
527 |
+
467: 5120 | 5120, 1, 1, 1 | F32 | blk.29.attn_norm.weight
|
528 |
+
468: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.29.attn_output.weight
|
529 |
+
469: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.29.attn_q_a.weight
|
530 |
+
470: 1536 | 1536, 1, 1, 1 | F32 | blk.29.attn_q_a_norm.weight
|
531 |
+
471: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.29.attn_q_b.weight
|
532 |
+
472: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.29.ffn_down_exps.weight
|
533 |
+
473: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.29.ffn_down_shexp.weight
|
534 |
+
474: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.29.ffn_gate_exps.weight
|
535 |
+
475: 819200 | 5120, 160, 1, 1 | F32 | blk.29.ffn_gate_inp.weight
|
536 |
+
476: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.29.ffn_gate_shexp.weight
|
537 |
+
477: 5120 | 5120, 1, 1, 1 | F32 | blk.29.ffn_norm.weight
|
538 |
+
478: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.29.ffn_up_exps.weight
|
539 |
+
479: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.29.ffn_up_shexp.weight
|
540 |
+
480: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.30.attn_kv_a_mqa.weight
|
DeepSeek-v2.5-1210-UD-iq1_m-00002-of-00002.gguf.tensors.txt
ADDED
@@ -0,0 +1,489 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
INFO:gguf-dump:* Loading: DeepSeek-v2.5-1210-UD-iq1_m-00002-of-00002.gguf
|
2 |
+
* File is LITTLE endian, script is running on a LITTLE endian host.
|
3 |
+
* Dumping 6 key/value pair(s)
|
4 |
+
1: UINT32 | 1 | GGUF.version = 3
|
5 |
+
2: UINT64 | 1 | GGUF.tensor_count = 479
|
6 |
+
3: UINT64 | 1 | GGUF.kv_count = 3
|
7 |
+
4: UINT16 | 1 | split.no = 1
|
8 |
+
5: INT32 | 1 | split.tensors.count = 959
|
9 |
+
6: UINT16 | 1 | split.count = 2
|
10 |
+
* Dumping 479 tensor(s)
|
11 |
+
1: 512 | 512, 1, 1, 1 | F32 | blk.30.attn_kv_a_norm.weight
|
12 |
+
2: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.30.attn_kv_b.weight
|
13 |
+
3: 5120 | 5120, 1, 1, 1 | F32 | blk.30.attn_norm.weight
|
14 |
+
4: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.30.attn_output.weight
|
15 |
+
5: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.30.attn_q_a.weight
|
16 |
+
6: 1536 | 1536, 1, 1, 1 | F32 | blk.30.attn_q_a_norm.weight
|
17 |
+
7: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.30.attn_q_b.weight
|
18 |
+
8: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.30.ffn_down_exps.weight
|
19 |
+
9: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.30.ffn_down_shexp.weight
|
20 |
+
10: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.30.ffn_gate_exps.weight
|
21 |
+
11: 819200 | 5120, 160, 1, 1 | F32 | blk.30.ffn_gate_inp.weight
|
22 |
+
12: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.30.ffn_gate_shexp.weight
|
23 |
+
13: 5120 | 5120, 1, 1, 1 | F32 | blk.30.ffn_norm.weight
|
24 |
+
14: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.30.ffn_up_exps.weight
|
25 |
+
15: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.30.ffn_up_shexp.weight
|
26 |
+
16: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.31.attn_kv_a_mqa.weight
|
27 |
+
17: 512 | 512, 1, 1, 1 | F32 | blk.31.attn_kv_a_norm.weight
|
28 |
+
18: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.31.attn_kv_b.weight
|
29 |
+
19: 5120 | 5120, 1, 1, 1 | F32 | blk.31.attn_norm.weight
|
30 |
+
20: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.31.attn_output.weight
|
31 |
+
21: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.31.attn_q_a.weight
|
32 |
+
22: 1536 | 1536, 1, 1, 1 | F32 | blk.31.attn_q_a_norm.weight
|
33 |
+
23: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.31.attn_q_b.weight
|
34 |
+
24: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.31.ffn_down_exps.weight
|
35 |
+
25: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.31.ffn_down_shexp.weight
|
36 |
+
26: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.31.ffn_gate_exps.weight
|
37 |
+
27: 819200 | 5120, 160, 1, 1 | F32 | blk.31.ffn_gate_inp.weight
|
38 |
+
28: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.31.ffn_gate_shexp.weight
|
39 |
+
29: 5120 | 5120, 1, 1, 1 | F32 | blk.31.ffn_norm.weight
|
40 |
+
30: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.31.ffn_up_exps.weight
|
41 |
+
31: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.31.ffn_up_shexp.weight
|
42 |
+
32: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.32.attn_kv_a_mqa.weight
|
43 |
+
33: 512 | 512, 1, 1, 1 | F32 | blk.32.attn_kv_a_norm.weight
|
44 |
+
34: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.32.attn_kv_b.weight
|
45 |
+
35: 5120 | 5120, 1, 1, 1 | F32 | blk.32.attn_norm.weight
|
46 |
+
36: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.32.attn_output.weight
|
47 |
+
37: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.32.attn_q_a.weight
|
48 |
+
38: 1536 | 1536, 1, 1, 1 | F32 | blk.32.attn_q_a_norm.weight
|
49 |
+
39: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.32.attn_q_b.weight
|
50 |
+
40: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.32.ffn_down_exps.weight
|
51 |
+
41: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.32.ffn_down_shexp.weight
|
52 |
+
42: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.32.ffn_gate_exps.weight
|
53 |
+
43: 819200 | 5120, 160, 1, 1 | F32 | blk.32.ffn_gate_inp.weight
|
54 |
+
44: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.32.ffn_gate_shexp.weight
|
55 |
+
45: 5120 | 5120, 1, 1, 1 | F32 | blk.32.ffn_norm.weight
|
56 |
+
46: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.32.ffn_up_exps.weight
|
57 |
+
47: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.32.ffn_up_shexp.weight
|
58 |
+
48: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.33.attn_kv_a_mqa.weight
|
59 |
+
49: 512 | 512, 1, 1, 1 | F32 | blk.33.attn_kv_a_norm.weight
|
60 |
+
50: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.33.attn_kv_b.weight
|
61 |
+
51: 5120 | 5120, 1, 1, 1 | F32 | blk.33.attn_norm.weight
|
62 |
+
52: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.33.attn_output.weight
|
63 |
+
53: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.33.attn_q_a.weight
|
64 |
+
54: 1536 | 1536, 1, 1, 1 | F32 | blk.33.attn_q_a_norm.weight
|
65 |
+
55: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.33.attn_q_b.weight
|
66 |
+
56: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.33.ffn_down_exps.weight
|
67 |
+
57: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.33.ffn_down_shexp.weight
|
68 |
+
58: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.33.ffn_gate_exps.weight
|
69 |
+
59: 819200 | 5120, 160, 1, 1 | F32 | blk.33.ffn_gate_inp.weight
|
70 |
+
60: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.33.ffn_gate_shexp.weight
|
71 |
+
61: 5120 | 5120, 1, 1, 1 | F32 | blk.33.ffn_norm.weight
|
72 |
+
62: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.33.ffn_up_exps.weight
|
73 |
+
63: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.33.ffn_up_shexp.weight
|
74 |
+
64: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.34.attn_kv_a_mqa.weight
|
75 |
+
65: 512 | 512, 1, 1, 1 | F32 | blk.34.attn_kv_a_norm.weight
|
76 |
+
66: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.34.attn_kv_b.weight
|
77 |
+
67: 5120 | 5120, 1, 1, 1 | F32 | blk.34.attn_norm.weight
|
78 |
+
68: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.34.attn_output.weight
|
79 |
+
69: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.34.attn_q_a.weight
|
80 |
+
70: 1536 | 1536, 1, 1, 1 | F32 | blk.34.attn_q_a_norm.weight
|
81 |
+
71: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.34.attn_q_b.weight
|
82 |
+
72: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.34.ffn_down_exps.weight
|
83 |
+
73: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.34.ffn_down_shexp.weight
|
84 |
+
74: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.34.ffn_gate_exps.weight
|
85 |
+
75: 819200 | 5120, 160, 1, 1 | F32 | blk.34.ffn_gate_inp.weight
|
86 |
+
76: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.34.ffn_gate_shexp.weight
|
87 |
+
77: 5120 | 5120, 1, 1, 1 | F32 | blk.34.ffn_norm.weight
|
88 |
+
78: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.34.ffn_up_exps.weight
|
89 |
+
79: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.34.ffn_up_shexp.weight
|
90 |
+
80: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.35.attn_kv_a_mqa.weight
|
91 |
+
81: 512 | 512, 1, 1, 1 | F32 | blk.35.attn_kv_a_norm.weight
|
92 |
+
82: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.35.attn_kv_b.weight
|
93 |
+
83: 5120 | 5120, 1, 1, 1 | F32 | blk.35.attn_norm.weight
|
94 |
+
84: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.35.attn_output.weight
|
95 |
+
85: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.35.attn_q_a.weight
|
96 |
+
86: 1536 | 1536, 1, 1, 1 | F32 | blk.35.attn_q_a_norm.weight
|
97 |
+
87: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.35.attn_q_b.weight
|
98 |
+
88: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.35.ffn_down_exps.weight
|
99 |
+
89: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.35.ffn_down_shexp.weight
|
100 |
+
90: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.35.ffn_gate_exps.weight
|
101 |
+
91: 819200 | 5120, 160, 1, 1 | F32 | blk.35.ffn_gate_inp.weight
|
102 |
+
92: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.35.ffn_gate_shexp.weight
|
103 |
+
93: 5120 | 5120, 1, 1, 1 | F32 | blk.35.ffn_norm.weight
|
104 |
+
94: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.35.ffn_up_exps.weight
|
105 |
+
95: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.35.ffn_up_shexp.weight
|
106 |
+
96: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.36.attn_kv_a_mqa.weight
|
107 |
+
97: 512 | 512, 1, 1, 1 | F32 | blk.36.attn_kv_a_norm.weight
|
108 |
+
98: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.36.attn_kv_b.weight
|
109 |
+
99: 5120 | 5120, 1, 1, 1 | F32 | blk.36.attn_norm.weight
|
110 |
+
100: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.36.attn_output.weight
|
111 |
+
101: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.36.attn_q_a.weight
|
112 |
+
102: 1536 | 1536, 1, 1, 1 | F32 | blk.36.attn_q_a_norm.weight
|
113 |
+
103: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.36.attn_q_b.weight
|
114 |
+
104: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.36.ffn_down_exps.weight
|
115 |
+
105: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.36.ffn_down_shexp.weight
|
116 |
+
106: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.36.ffn_gate_exps.weight
|
117 |
+
107: 819200 | 5120, 160, 1, 1 | F32 | blk.36.ffn_gate_inp.weight
|
118 |
+
108: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.36.ffn_gate_shexp.weight
|
119 |
+
109: 5120 | 5120, 1, 1, 1 | F32 | blk.36.ffn_norm.weight
|
120 |
+
110: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.36.ffn_up_exps.weight
|
121 |
+
111: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.36.ffn_up_shexp.weight
|
122 |
+
112: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.37.attn_kv_a_mqa.weight
|
123 |
+
113: 512 | 512, 1, 1, 1 | F32 | blk.37.attn_kv_a_norm.weight
|
124 |
+
114: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.37.attn_kv_b.weight
|
125 |
+
115: 5120 | 5120, 1, 1, 1 | F32 | blk.37.attn_norm.weight
|
126 |
+
116: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.37.attn_output.weight
|
127 |
+
117: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.37.attn_q_a.weight
|
128 |
+
118: 1536 | 1536, 1, 1, 1 | F32 | blk.37.attn_q_a_norm.weight
|
129 |
+
119: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.37.attn_q_b.weight
|
130 |
+
120: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.37.ffn_down_exps.weight
|
131 |
+
121: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.37.ffn_down_shexp.weight
|
132 |
+
122: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.37.ffn_gate_exps.weight
|
133 |
+
123: 819200 | 5120, 160, 1, 1 | F32 | blk.37.ffn_gate_inp.weight
|
134 |
+
124: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.37.ffn_gate_shexp.weight
|
135 |
+
125: 5120 | 5120, 1, 1, 1 | F32 | blk.37.ffn_norm.weight
|
136 |
+
126: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.37.ffn_up_exps.weight
|
137 |
+
127: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.37.ffn_up_shexp.weight
|
138 |
+
128: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.38.attn_kv_a_mqa.weight
|
139 |
+
129: 512 | 512, 1, 1, 1 | F32 | blk.38.attn_kv_a_norm.weight
|
140 |
+
130: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.38.attn_kv_b.weight
|
141 |
+
131: 5120 | 5120, 1, 1, 1 | F32 | blk.38.attn_norm.weight
|
142 |
+
132: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.38.attn_output.weight
|
143 |
+
133: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.38.attn_q_a.weight
|
144 |
+
134: 1536 | 1536, 1, 1, 1 | F32 | blk.38.attn_q_a_norm.weight
|
145 |
+
135: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.38.attn_q_b.weight
|
146 |
+
136: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.38.ffn_down_exps.weight
|
147 |
+
137: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.38.ffn_down_shexp.weight
|
148 |
+
138: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.38.ffn_gate_exps.weight
|
149 |
+
139: 819200 | 5120, 160, 1, 1 | F32 | blk.38.ffn_gate_inp.weight
|
150 |
+
140: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.38.ffn_gate_shexp.weight
|
151 |
+
141: 5120 | 5120, 1, 1, 1 | F32 | blk.38.ffn_norm.weight
|
152 |
+
142: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.38.ffn_up_exps.weight
|
153 |
+
143: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.38.ffn_up_shexp.weight
|
154 |
+
144: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.39.attn_kv_a_mqa.weight
|
155 |
+
145: 512 | 512, 1, 1, 1 | F32 | blk.39.attn_kv_a_norm.weight
|
156 |
+
146: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.39.attn_kv_b.weight
|
157 |
+
147: 5120 | 5120, 1, 1, 1 | F32 | blk.39.attn_norm.weight
|
158 |
+
148: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.39.attn_output.weight
|
159 |
+
149: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.39.attn_q_a.weight
|
160 |
+
150: 1536 | 1536, 1, 1, 1 | F32 | blk.39.attn_q_a_norm.weight
|
161 |
+
151: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.39.attn_q_b.weight
|
162 |
+
152: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.39.ffn_down_exps.weight
|
163 |
+
153: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.39.ffn_down_shexp.weight
|
164 |
+
154: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.39.ffn_gate_exps.weight
|
165 |
+
155: 819200 | 5120, 160, 1, 1 | F32 | blk.39.ffn_gate_inp.weight
|
166 |
+
156: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.39.ffn_gate_shexp.weight
|
167 |
+
157: 5120 | 5120, 1, 1, 1 | F32 | blk.39.ffn_norm.weight
|
168 |
+
158: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.39.ffn_up_exps.weight
|
169 |
+
159: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.39.ffn_up_shexp.weight
|
170 |
+
160: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.40.attn_kv_a_mqa.weight
|
171 |
+
161: 512 | 512, 1, 1, 1 | F32 | blk.40.attn_kv_a_norm.weight
|
172 |
+
162: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.40.attn_kv_b.weight
|
173 |
+
163: 5120 | 5120, 1, 1, 1 | F32 | blk.40.attn_norm.weight
|
174 |
+
164: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.40.attn_output.weight
|
175 |
+
165: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.40.attn_q_a.weight
|
176 |
+
166: 1536 | 1536, 1, 1, 1 | F32 | blk.40.attn_q_a_norm.weight
|
177 |
+
167: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.40.attn_q_b.weight
|
178 |
+
168: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.40.ffn_down_exps.weight
|
179 |
+
169: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.40.ffn_down_shexp.weight
|
180 |
+
170: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.40.ffn_gate_exps.weight
|
181 |
+
171: 819200 | 5120, 160, 1, 1 | F32 | blk.40.ffn_gate_inp.weight
|
182 |
+
172: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.40.ffn_gate_shexp.weight
|
183 |
+
173: 5120 | 5120, 1, 1, 1 | F32 | blk.40.ffn_norm.weight
|
184 |
+
174: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.40.ffn_up_exps.weight
|
185 |
+
175: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.40.ffn_up_shexp.weight
|
186 |
+
176: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.41.attn_kv_a_mqa.weight
|
187 |
+
177: 512 | 512, 1, 1, 1 | F32 | blk.41.attn_kv_a_norm.weight
|
188 |
+
178: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.41.attn_kv_b.weight
|
189 |
+
179: 5120 | 5120, 1, 1, 1 | F32 | blk.41.attn_norm.weight
|
190 |
+
180: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.41.attn_output.weight
|
191 |
+
181: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.41.attn_q_a.weight
|
192 |
+
182: 1536 | 1536, 1, 1, 1 | F32 | blk.41.attn_q_a_norm.weight
|
193 |
+
183: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.41.attn_q_b.weight
|
194 |
+
184: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.41.ffn_down_exps.weight
|
195 |
+
185: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.41.ffn_down_shexp.weight
|
196 |
+
186: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.41.ffn_gate_exps.weight
|
197 |
+
187: 819200 | 5120, 160, 1, 1 | F32 | blk.41.ffn_gate_inp.weight
|
198 |
+
188: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.41.ffn_gate_shexp.weight
|
199 |
+
189: 5120 | 5120, 1, 1, 1 | F32 | blk.41.ffn_norm.weight
|
200 |
+
190: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.41.ffn_up_exps.weight
|
201 |
+
191: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.41.ffn_up_shexp.weight
|
202 |
+
192: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.42.attn_kv_a_mqa.weight
|
203 |
+
193: 512 | 512, 1, 1, 1 | F32 | blk.42.attn_kv_a_norm.weight
|
204 |
+
194: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.42.attn_kv_b.weight
|
205 |
+
195: 5120 | 5120, 1, 1, 1 | F32 | blk.42.attn_norm.weight
|
206 |
+
196: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.42.attn_output.weight
|
207 |
+
197: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.42.attn_q_a.weight
|
208 |
+
198: 1536 | 1536, 1, 1, 1 | F32 | blk.42.attn_q_a_norm.weight
|
209 |
+
199: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.42.attn_q_b.weight
|
210 |
+
200: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.42.ffn_down_exps.weight
|
211 |
+
201: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.42.ffn_down_shexp.weight
|
212 |
+
202: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.42.ffn_gate_exps.weight
|
213 |
+
203: 819200 | 5120, 160, 1, 1 | F32 | blk.42.ffn_gate_inp.weight
|
214 |
+
204: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.42.ffn_gate_shexp.weight
|
215 |
+
205: 5120 | 5120, 1, 1, 1 | F32 | blk.42.ffn_norm.weight
|
216 |
+
206: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.42.ffn_up_exps.weight
|
217 |
+
207: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.42.ffn_up_shexp.weight
|
218 |
+
208: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.43.attn_kv_a_mqa.weight
|
219 |
+
209: 512 | 512, 1, 1, 1 | F32 | blk.43.attn_kv_a_norm.weight
|
220 |
+
210: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.43.attn_kv_b.weight
|
221 |
+
211: 5120 | 5120, 1, 1, 1 | F32 | blk.43.attn_norm.weight
|
222 |
+
212: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.43.attn_output.weight
|
223 |
+
213: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.43.attn_q_a.weight
|
224 |
+
214: 1536 | 1536, 1, 1, 1 | F32 | blk.43.attn_q_a_norm.weight
|
225 |
+
215: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.43.attn_q_b.weight
|
226 |
+
216: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.43.ffn_down_exps.weight
|
227 |
+
217: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.43.ffn_down_shexp.weight
|
228 |
+
218: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.43.ffn_gate_exps.weight
|
229 |
+
219: 819200 | 5120, 160, 1, 1 | F32 | blk.43.ffn_gate_inp.weight
|
230 |
+
220: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.43.ffn_gate_shexp.weight
|
231 |
+
221: 5120 | 5120, 1, 1, 1 | F32 | blk.43.ffn_norm.weight
|
232 |
+
222: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.43.ffn_up_exps.weight
|
233 |
+
223: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.43.ffn_up_shexp.weight
|
234 |
+
224: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.44.attn_kv_a_mqa.weight
|
235 |
+
225: 512 | 512, 1, 1, 1 | F32 | blk.44.attn_kv_a_norm.weight
|
236 |
+
226: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.44.attn_kv_b.weight
|
237 |
+
227: 5120 | 5120, 1, 1, 1 | F32 | blk.44.attn_norm.weight
|
238 |
+
228: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.44.attn_output.weight
|
239 |
+
229: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.44.attn_q_a.weight
|
240 |
+
230: 1536 | 1536, 1, 1, 1 | F32 | blk.44.attn_q_a_norm.weight
|
241 |
+
231: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.44.attn_q_b.weight
|
242 |
+
232: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.44.ffn_down_exps.weight
|
243 |
+
233: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.44.ffn_down_shexp.weight
|
244 |
+
234: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.44.ffn_gate_exps.weight
|
245 |
+
235: 819200 | 5120, 160, 1, 1 | F32 | blk.44.ffn_gate_inp.weight
|
246 |
+
236: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.44.ffn_gate_shexp.weight
|
247 |
+
237: 5120 | 5120, 1, 1, 1 | F32 | blk.44.ffn_norm.weight
|
248 |
+
238: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.44.ffn_up_exps.weight
|
249 |
+
239: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.44.ffn_up_shexp.weight
|
250 |
+
240: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.45.attn_kv_a_mqa.weight
|
251 |
+
241: 512 | 512, 1, 1, 1 | F32 | blk.45.attn_kv_a_norm.weight
|
252 |
+
242: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.45.attn_kv_b.weight
|
253 |
+
243: 5120 | 5120, 1, 1, 1 | F32 | blk.45.attn_norm.weight
|
254 |
+
244: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.45.attn_output.weight
|
255 |
+
245: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.45.attn_q_a.weight
|
256 |
+
246: 1536 | 1536, 1, 1, 1 | F32 | blk.45.attn_q_a_norm.weight
|
257 |
+
247: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.45.attn_q_b.weight
|
258 |
+
248: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.45.ffn_down_exps.weight
|
259 |
+
249: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.45.ffn_down_shexp.weight
|
260 |
+
250: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.45.ffn_gate_exps.weight
|
261 |
+
251: 819200 | 5120, 160, 1, 1 | F32 | blk.45.ffn_gate_inp.weight
|
262 |
+
252: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.45.ffn_gate_shexp.weight
|
263 |
+
253: 5120 | 5120, 1, 1, 1 | F32 | blk.45.ffn_norm.weight
|
264 |
+
254: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.45.ffn_up_exps.weight
|
265 |
+
255: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.45.ffn_up_shexp.weight
|
266 |
+
256: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.46.attn_kv_a_mqa.weight
|
267 |
+
257: 512 | 512, 1, 1, 1 | F32 | blk.46.attn_kv_a_norm.weight
|
268 |
+
258: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.46.attn_kv_b.weight
|
269 |
+
259: 5120 | 5120, 1, 1, 1 | F32 | blk.46.attn_norm.weight
|
270 |
+
260: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.46.attn_output.weight
|
271 |
+
261: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.46.attn_q_a.weight
|
272 |
+
262: 1536 | 1536, 1, 1, 1 | F32 | blk.46.attn_q_a_norm.weight
|
273 |
+
263: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.46.attn_q_b.weight
|
274 |
+
264: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.46.ffn_down_exps.weight
|
275 |
+
265: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.46.ffn_down_shexp.weight
|
276 |
+
266: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.46.ffn_gate_exps.weight
|
277 |
+
267: 819200 | 5120, 160, 1, 1 | F32 | blk.46.ffn_gate_inp.weight
|
278 |
+
268: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.46.ffn_gate_shexp.weight
|
279 |
+
269: 5120 | 5120, 1, 1, 1 | F32 | blk.46.ffn_norm.weight
|
280 |
+
270: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.46.ffn_up_exps.weight
|
281 |
+
271: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.46.ffn_up_shexp.weight
|
282 |
+
272: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.47.attn_kv_a_mqa.weight
|
283 |
+
273: 512 | 512, 1, 1, 1 | F32 | blk.47.attn_kv_a_norm.weight
|
284 |
+
274: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.47.attn_kv_b.weight
|
285 |
+
275: 5120 | 5120, 1, 1, 1 | F32 | blk.47.attn_norm.weight
|
286 |
+
276: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.47.attn_output.weight
|
287 |
+
277: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.47.attn_q_a.weight
|
288 |
+
278: 1536 | 1536, 1, 1, 1 | F32 | blk.47.attn_q_a_norm.weight
|
289 |
+
279: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.47.attn_q_b.weight
|
290 |
+
280: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.47.ffn_down_exps.weight
|
291 |
+
281: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.47.ffn_down_shexp.weight
|
292 |
+
282: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.47.ffn_gate_exps.weight
|
293 |
+
283: 819200 | 5120, 160, 1, 1 | F32 | blk.47.ffn_gate_inp.weight
|
294 |
+
284: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.47.ffn_gate_shexp.weight
|
295 |
+
285: 5120 | 5120, 1, 1, 1 | F32 | blk.47.ffn_norm.weight
|
296 |
+
286: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.47.ffn_up_exps.weight
|
297 |
+
287: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.47.ffn_up_shexp.weight
|
298 |
+
288: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.48.attn_kv_a_mqa.weight
|
299 |
+
289: 512 | 512, 1, 1, 1 | F32 | blk.48.attn_kv_a_norm.weight
|
300 |
+
290: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.48.attn_kv_b.weight
|
301 |
+
291: 5120 | 5120, 1, 1, 1 | F32 | blk.48.attn_norm.weight
|
302 |
+
292: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.48.attn_output.weight
|
303 |
+
293: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.48.attn_q_a.weight
|
304 |
+
294: 1536 | 1536, 1, 1, 1 | F32 | blk.48.attn_q_a_norm.weight
|
305 |
+
295: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.48.attn_q_b.weight
|
306 |
+
296: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.48.ffn_down_exps.weight
|
307 |
+
297: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.48.ffn_down_shexp.weight
|
308 |
+
298: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.48.ffn_gate_exps.weight
|
309 |
+
299: 819200 | 5120, 160, 1, 1 | F32 | blk.48.ffn_gate_inp.weight
|
310 |
+
300: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.48.ffn_gate_shexp.weight
|
311 |
+
301: 5120 | 5120, 1, 1, 1 | F32 | blk.48.ffn_norm.weight
|
312 |
+
302: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.48.ffn_up_exps.weight
|
313 |
+
303: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.48.ffn_up_shexp.weight
|
314 |
+
304: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.49.attn_kv_a_mqa.weight
|
315 |
+
305: 512 | 512, 1, 1, 1 | F32 | blk.49.attn_kv_a_norm.weight
|
316 |
+
306: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.49.attn_kv_b.weight
|
317 |
+
307: 5120 | 5120, 1, 1, 1 | F32 | blk.49.attn_norm.weight
|
318 |
+
308: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.49.attn_output.weight
|
319 |
+
309: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.49.attn_q_a.weight
|
320 |
+
310: 1536 | 1536, 1, 1, 1 | F32 | blk.49.attn_q_a_norm.weight
|
321 |
+
311: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.49.attn_q_b.weight
|
322 |
+
312: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.49.ffn_down_exps.weight
|
323 |
+
313: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.49.ffn_down_shexp.weight
|
324 |
+
314: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.49.ffn_gate_exps.weight
|
325 |
+
315: 819200 | 5120, 160, 1, 1 | F32 | blk.49.ffn_gate_inp.weight
|
326 |
+
316: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.49.ffn_gate_shexp.weight
|
327 |
+
317: 5120 | 5120, 1, 1, 1 | F32 | blk.49.ffn_norm.weight
|
328 |
+
318: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.49.ffn_up_exps.weight
|
329 |
+
319: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.49.ffn_up_shexp.weight
|
330 |
+
320: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.50.attn_kv_a_mqa.weight
|
331 |
+
321: 512 | 512, 1, 1, 1 | F32 | blk.50.attn_kv_a_norm.weight
|
332 |
+
322: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.50.attn_kv_b.weight
|
333 |
+
323: 5120 | 5120, 1, 1, 1 | F32 | blk.50.attn_norm.weight
|
334 |
+
324: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.50.attn_output.weight
|
335 |
+
325: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.50.attn_q_a.weight
|
336 |
+
326: 1536 | 1536, 1, 1, 1 | F32 | blk.50.attn_q_a_norm.weight
|
337 |
+
327: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.50.attn_q_b.weight
|
338 |
+
328: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.50.ffn_down_exps.weight
|
339 |
+
329: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.50.ffn_down_shexp.weight
|
340 |
+
330: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.50.ffn_gate_exps.weight
|
341 |
+
331: 819200 | 5120, 160, 1, 1 | F32 | blk.50.ffn_gate_inp.weight
|
342 |
+
332: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.50.ffn_gate_shexp.weight
|
343 |
+
333: 5120 | 5120, 1, 1, 1 | F32 | blk.50.ffn_norm.weight
|
344 |
+
334: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.50.ffn_up_exps.weight
|
345 |
+
335: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.50.ffn_up_shexp.weight
|
346 |
+
336: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.51.attn_kv_a_mqa.weight
|
347 |
+
337: 512 | 512, 1, 1, 1 | F32 | blk.51.attn_kv_a_norm.weight
|
348 |
+
338: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.51.attn_kv_b.weight
|
349 |
+
339: 5120 | 5120, 1, 1, 1 | F32 | blk.51.attn_norm.weight
|
350 |
+
340: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.51.attn_output.weight
|
351 |
+
341: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.51.attn_q_a.weight
|
352 |
+
342: 1536 | 1536, 1, 1, 1 | F32 | blk.51.attn_q_a_norm.weight
|
353 |
+
343: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.51.attn_q_b.weight
|
354 |
+
344: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.51.ffn_down_exps.weight
|
355 |
+
345: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.51.ffn_down_shexp.weight
|
356 |
+
346: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.51.ffn_gate_exps.weight
|
357 |
+
347: 819200 | 5120, 160, 1, 1 | F32 | blk.51.ffn_gate_inp.weight
|
358 |
+
348: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.51.ffn_gate_shexp.weight
|
359 |
+
349: 5120 | 5120, 1, 1, 1 | F32 | blk.51.ffn_norm.weight
|
360 |
+
350: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.51.ffn_up_exps.weight
|
361 |
+
351: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.51.ffn_up_shexp.weight
|
362 |
+
352: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.52.attn_kv_a_mqa.weight
|
363 |
+
353: 512 | 512, 1, 1, 1 | F32 | blk.52.attn_kv_a_norm.weight
|
364 |
+
354: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.52.attn_kv_b.weight
|
365 |
+
355: 5120 | 5120, 1, 1, 1 | F32 | blk.52.attn_norm.weight
|
366 |
+
356: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.52.attn_output.weight
|
367 |
+
357: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.52.attn_q_a.weight
|
368 |
+
358: 1536 | 1536, 1, 1, 1 | F32 | blk.52.attn_q_a_norm.weight
|
369 |
+
359: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.52.attn_q_b.weight
|
370 |
+
360: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.52.ffn_down_exps.weight
|
371 |
+
361: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.52.ffn_down_shexp.weight
|
372 |
+
362: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.52.ffn_gate_exps.weight
|
373 |
+
363: 819200 | 5120, 160, 1, 1 | F32 | blk.52.ffn_gate_inp.weight
|
374 |
+
364: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.52.ffn_gate_shexp.weight
|
375 |
+
365: 5120 | 5120, 1, 1, 1 | F32 | blk.52.ffn_norm.weight
|
376 |
+
366: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.52.ffn_up_exps.weight
|
377 |
+
367: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.52.ffn_up_shexp.weight
|
378 |
+
368: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.53.attn_kv_a_mqa.weight
|
379 |
+
369: 512 | 512, 1, 1, 1 | F32 | blk.53.attn_kv_a_norm.weight
|
380 |
+
370: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.53.attn_kv_b.weight
|
381 |
+
371: 5120 | 5120, 1, 1, 1 | F32 | blk.53.attn_norm.weight
|
382 |
+
372: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.53.attn_output.weight
|
383 |
+
373: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.53.attn_q_a.weight
|
384 |
+
374: 1536 | 1536, 1, 1, 1 | F32 | blk.53.attn_q_a_norm.weight
|
385 |
+
375: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.53.attn_q_b.weight
|
386 |
+
376: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.53.ffn_down_exps.weight
|
387 |
+
377: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.53.ffn_down_shexp.weight
|
388 |
+
378: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.53.ffn_gate_exps.weight
|
389 |
+
379: 819200 | 5120, 160, 1, 1 | F32 | blk.53.ffn_gate_inp.weight
|
390 |
+
380: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.53.ffn_gate_shexp.weight
|
391 |
+
381: 5120 | 5120, 1, 1, 1 | F32 | blk.53.ffn_norm.weight
|
392 |
+
382: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.53.ffn_up_exps.weight
|
393 |
+
383: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.53.ffn_up_shexp.weight
|
394 |
+
384: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.54.attn_kv_a_mqa.weight
|
395 |
+
385: 512 | 512, 1, 1, 1 | F32 | blk.54.attn_kv_a_norm.weight
|
396 |
+
386: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.54.attn_kv_b.weight
|
397 |
+
387: 5120 | 5120, 1, 1, 1 | F32 | blk.54.attn_norm.weight
|
398 |
+
388: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.54.attn_output.weight
|
399 |
+
389: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.54.attn_q_a.weight
|
400 |
+
390: 1536 | 1536, 1, 1, 1 | F32 | blk.54.attn_q_a_norm.weight
|
401 |
+
391: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.54.attn_q_b.weight
|
402 |
+
392: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.54.ffn_down_exps.weight
|
403 |
+
393: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.54.ffn_down_shexp.weight
|
404 |
+
394: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.54.ffn_gate_exps.weight
|
405 |
+
395: 819200 | 5120, 160, 1, 1 | F32 | blk.54.ffn_gate_inp.weight
|
406 |
+
396: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.54.ffn_gate_shexp.weight
|
407 |
+
397: 5120 | 5120, 1, 1, 1 | F32 | blk.54.ffn_norm.weight
|
408 |
+
398: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.54.ffn_up_exps.weight
|
409 |
+
399: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.54.ffn_up_shexp.weight
|
410 |
+
400: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.55.attn_kv_a_mqa.weight
|
411 |
+
401: 512 | 512, 1, 1, 1 | F32 | blk.55.attn_kv_a_norm.weight
|
412 |
+
402: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.55.attn_kv_b.weight
|
413 |
+
403: 5120 | 5120, 1, 1, 1 | F32 | blk.55.attn_norm.weight
|
414 |
+
404: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.55.attn_output.weight
|
415 |
+
405: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.55.attn_q_a.weight
|
416 |
+
406: 1536 | 1536, 1, 1, 1 | F32 | blk.55.attn_q_a_norm.weight
|
417 |
+
407: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.55.attn_q_b.weight
|
418 |
+
408: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.55.ffn_down_exps.weight
|
419 |
+
409: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.55.ffn_down_shexp.weight
|
420 |
+
410: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.55.ffn_gate_exps.weight
|
421 |
+
411: 819200 | 5120, 160, 1, 1 | F32 | blk.55.ffn_gate_inp.weight
|
422 |
+
412: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.55.ffn_gate_shexp.weight
|
423 |
+
413: 5120 | 5120, 1, 1, 1 | F32 | blk.55.ffn_norm.weight
|
424 |
+
414: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.55.ffn_up_exps.weight
|
425 |
+
415: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.55.ffn_up_shexp.weight
|
426 |
+
416: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.56.attn_kv_a_mqa.weight
|
427 |
+
417: 512 | 512, 1, 1, 1 | F32 | blk.56.attn_kv_a_norm.weight
|
428 |
+
418: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.56.attn_kv_b.weight
|
429 |
+
419: 5120 | 5120, 1, 1, 1 | F32 | blk.56.attn_norm.weight
|
430 |
+
420: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.56.attn_output.weight
|
431 |
+
421: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.56.attn_q_a.weight
|
432 |
+
422: 1536 | 1536, 1, 1, 1 | F32 | blk.56.attn_q_a_norm.weight
|
433 |
+
423: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.56.attn_q_b.weight
|
434 |
+
424: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.56.ffn_down_exps.weight
|
435 |
+
425: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.56.ffn_down_shexp.weight
|
436 |
+
426: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.56.ffn_gate_exps.weight
|
437 |
+
427: 819200 | 5120, 160, 1, 1 | F32 | blk.56.ffn_gate_inp.weight
|
438 |
+
428: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.56.ffn_gate_shexp.weight
|
439 |
+
429: 5120 | 5120, 1, 1, 1 | F32 | blk.56.ffn_norm.weight
|
440 |
+
430: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.56.ffn_up_exps.weight
|
441 |
+
431: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.56.ffn_up_shexp.weight
|
442 |
+
432: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.57.attn_kv_a_mqa.weight
|
443 |
+
433: 512 | 512, 1, 1, 1 | F32 | blk.57.attn_kv_a_norm.weight
|
444 |
+
434: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.57.attn_kv_b.weight
|
445 |
+
435: 5120 | 5120, 1, 1, 1 | F32 | blk.57.attn_norm.weight
|
446 |
+
436: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.57.attn_output.weight
|
447 |
+
437: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.57.attn_q_a.weight
|
448 |
+
438: 1536 | 1536, 1, 1, 1 | F32 | blk.57.attn_q_a_norm.weight
|
449 |
+
439: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.57.attn_q_b.weight
|
450 |
+
440: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.57.ffn_down_exps.weight
|
451 |
+
441: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.57.ffn_down_shexp.weight
|
452 |
+
442: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.57.ffn_gate_exps.weight
|
453 |
+
443: 819200 | 5120, 160, 1, 1 | F32 | blk.57.ffn_gate_inp.weight
|
454 |
+
444: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.57.ffn_gate_shexp.weight
|
455 |
+
445: 5120 | 5120, 1, 1, 1 | F32 | blk.57.ffn_norm.weight
|
456 |
+
446: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.57.ffn_up_exps.weight
|
457 |
+
447: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.57.ffn_up_shexp.weight
|
458 |
+
448: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.58.attn_kv_a_mqa.weight
|
459 |
+
449: 512 | 512, 1, 1, 1 | F32 | blk.58.attn_kv_a_norm.weight
|
460 |
+
450: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.58.attn_kv_b.weight
|
461 |
+
451: 5120 | 5120, 1, 1, 1 | F32 | blk.58.attn_norm.weight
|
462 |
+
452: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.58.attn_output.weight
|
463 |
+
453: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.58.attn_q_a.weight
|
464 |
+
454: 1536 | 1536, 1, 1, 1 | F32 | blk.58.attn_q_a_norm.weight
|
465 |
+
455: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.58.attn_q_b.weight
|
466 |
+
456: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.58.ffn_down_exps.weight
|
467 |
+
457: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.58.ffn_down_shexp.weight
|
468 |
+
458: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.58.ffn_gate_exps.weight
|
469 |
+
459: 819200 | 5120, 160, 1, 1 | F32 | blk.58.ffn_gate_inp.weight
|
470 |
+
460: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.58.ffn_gate_shexp.weight
|
471 |
+
461: 5120 | 5120, 1, 1, 1 | F32 | blk.58.ffn_norm.weight
|
472 |
+
462: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.58.ffn_up_exps.weight
|
473 |
+
463: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.58.ffn_up_shexp.weight
|
474 |
+
464: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.59.attn_kv_a_mqa.weight
|
475 |
+
465: 512 | 512, 1, 1, 1 | F32 | blk.59.attn_kv_a_norm.weight
|
476 |
+
466: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.59.attn_kv_b.weight
|
477 |
+
467: 5120 | 5120, 1, 1, 1 | F32 | blk.59.attn_norm.weight
|
478 |
+
468: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.59.attn_output.weight
|
479 |
+
469: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.59.attn_q_a.weight
|
480 |
+
470: 1536 | 1536, 1, 1, 1 | F32 | blk.59.attn_q_a_norm.weight
|
481 |
+
471: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.59.attn_q_b.weight
|
482 |
+
472: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.59.ffn_down_exps.weight
|
483 |
+
473: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.59.ffn_down_shexp.weight
|
484 |
+
474: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.59.ffn_gate_exps.weight
|
485 |
+
475: 819200 | 5120, 160, 1, 1 | F32 | blk.59.ffn_gate_inp.weight
|
486 |
+
476: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.59.ffn_gate_shexp.weight
|
487 |
+
477: 5120 | 5120, 1, 1, 1 | F32 | blk.59.ffn_norm.weight
|
488 |
+
478: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.59.ffn_up_exps.weight
|
489 |
+
479: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.59.ffn_up_shexp.weight
|
DeepSeek-v2.5-1210-UD-iq1_s-00001-of-00002.gguf.tensors.txt
ADDED
@@ -0,0 +1,540 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
INFO:gguf-dump:* Loading: DeepSeek-v2.5-1210-UD-iq1_s-00001-of-00002.gguf
|
2 |
+
* File is LITTLE endian, script is running on a LITTLE endian host.
|
3 |
+
* Dumping 56 key/value pair(s)
|
4 |
+
1: UINT32 | 1 | GGUF.version = 3
|
5 |
+
2: UINT64 | 1 | GGUF.tensor_count = 480
|
6 |
+
3: UINT64 | 1 | GGUF.kv_count = 53
|
7 |
+
4: STRING | 1 | general.architecture = 'deepseek2'
|
8 |
+
5: STRING | 1 | general.type = 'model'
|
9 |
+
6: STRING | 1 | general.name = 'Dsv25'
|
10 |
+
7: STRING | 1 | general.size_label = '160x14B'
|
11 |
+
8: STRING | 1 | general.license = 'other'
|
12 |
+
9: STRING | 1 | general.license.name = 'deepseek'
|
13 |
+
10: STRING | 1 | general.license.link = 'https://github.com/deepseek-ai/DeepSeek-V2/blob/main/LICENSE'
|
14 |
+
11: UINT32 | 1 | deepseek2.block_count = 60
|
15 |
+
12: UINT32 | 1 | deepseek2.context_length = 163840
|
16 |
+
13: UINT32 | 1 | deepseek2.embedding_length = 5120
|
17 |
+
14: UINT32 | 1 | deepseek2.feed_forward_length = 12288
|
18 |
+
15: UINT32 | 1 | deepseek2.attention.head_count = 128
|
19 |
+
16: UINT32 | 1 | deepseek2.attention.head_count_kv = 128
|
20 |
+
17: FLOAT32 | 1 | deepseek2.rope.freq_base = 10000.0
|
21 |
+
18: FLOAT32 | 1 | deepseek2.attention.layer_norm_rms_epsilon = 9.999999974752427e-07
|
22 |
+
19: UINT32 | 1 | deepseek2.expert_used_count = 6
|
23 |
+
20: UINT32 | 1 | deepseek2.leading_dense_block_count = 1
|
24 |
+
21: UINT32 | 1 | deepseek2.vocab_size = 102400
|
25 |
+
22: UINT32 | 1 | deepseek2.attention.q_lora_rank = 1536
|
26 |
+
23: UINT32 | 1 | deepseek2.attention.kv_lora_rank = 512
|
27 |
+
24: UINT32 | 1 | deepseek2.attention.key_length = 192
|
28 |
+
25: UINT32 | 1 | deepseek2.attention.value_length = 128
|
29 |
+
26: UINT32 | 1 | deepseek2.expert_feed_forward_length = 1536
|
30 |
+
27: UINT32 | 1 | deepseek2.expert_count = 160
|
31 |
+
28: UINT32 | 1 | deepseek2.expert_shared_count = 2
|
32 |
+
29: FLOAT32 | 1 | deepseek2.expert_weights_scale = 16.0
|
33 |
+
30: BOOL | 1 | deepseek2.expert_weights_norm = False
|
34 |
+
31: UINT32 | 1 | deepseek2.expert_gating_func = 1
|
35 |
+
32: UINT32 | 1 | deepseek2.rope.dimension_count = 64
|
36 |
+
33: STRING | 1 | deepseek2.rope.scaling.type = 'yarn'
|
37 |
+
34: FLOAT32 | 1 | deepseek2.rope.scaling.factor = 40.0
|
38 |
+
35: UINT32 | 1 | deepseek2.rope.scaling.original_context_length = 4096
|
39 |
+
36: FLOAT32 | 1 | deepseek2.rope.scaling.yarn_log_multiplier = 0.10000000149011612
|
40 |
+
37: STRING | 1 | tokenizer.ggml.model = 'gpt2'
|
41 |
+
38: STRING | 1 | tokenizer.ggml.pre = 'deepseek-llm'
|
42 |
+
39: [STRING] | 102400 | tokenizer.ggml.tokens
|
43 |
+
40: [INT32] | 102400 | tokenizer.ggml.token_type
|
44 |
+
41: [STRING] | 99757 | tokenizer.ggml.merges
|
45 |
+
42: UINT32 | 1 | tokenizer.ggml.bos_token_id = 100000
|
46 |
+
43: UINT32 | 1 | tokenizer.ggml.eos_token_id = 100001
|
47 |
+
44: UINT32 | 1 | tokenizer.ggml.padding_token_id = 100001
|
48 |
+
45: BOOL | 1 | tokenizer.ggml.add_bos_token = True
|
49 |
+
46: BOOL | 1 | tokenizer.ggml.add_eos_token = False
|
50 |
+
47: STRING | 1 | tokenizer.chat_template = '{% if not add_generation_prompt is defined %}{% set add_gene'
|
51 |
+
48: UINT32 | 1 | general.quantization_version = 2
|
52 |
+
49: UINT32 | 1 | general.file_type = 24
|
53 |
+
50: STRING | 1 | quantize.imatrix.file = '/archive/nuc/LLM/raw/imatrix-DeepSeek-V2.5-1210-bartowski.da'
|
54 |
+
51: STRING | 1 | quantize.imatrix.dataset = '/training_dir/calibration_datav3.txt'
|
55 |
+
52: INT32 | 1 | quantize.imatrix.entries_count = 716
|
56 |
+
53: INT32 | 1 | quantize.imatrix.chunks_count = 139
|
57 |
+
54: UINT16 | 1 | split.no = 0
|
58 |
+
55: INT32 | 1 | split.tensors.count = 959
|
59 |
+
56: UINT16 | 1 | split.count = 2
|
60 |
+
* Dumping 480 tensor(s)
|
61 |
+
1: 524288000 | 5120, 102400, 1, 1 | Q6_K | output.weight
|
62 |
+
2: 5120 | 5120, 1, 1, 1 | F32 | output_norm.weight
|
63 |
+
3: 524288000 | 5120, 102400, 1, 1 | Q6_K | token_embd.weight
|
64 |
+
4: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.0.attn_kv_a_mqa.weight
|
65 |
+
5: 512 | 512, 1, 1, 1 | F32 | blk.0.attn_kv_a_norm.weight
|
66 |
+
6: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.0.attn_kv_b.weight
|
67 |
+
7: 5120 | 5120, 1, 1, 1 | F32 | blk.0.attn_norm.weight
|
68 |
+
8: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.0.attn_output.weight
|
69 |
+
9: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.0.attn_q_a.weight
|
70 |
+
10: 1536 | 1536, 1, 1, 1 | F32 | blk.0.attn_q_a_norm.weight
|
71 |
+
11: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.0.attn_q_b.weight
|
72 |
+
12: 62914560 | 12288, 5120, 1, 1 | Q6_K | blk.0.ffn_down.weight
|
73 |
+
13: 62914560 | 5120, 12288, 1, 1 | Q4_K | blk.0.ffn_gate.weight
|
74 |
+
14: 5120 | 5120, 1, 1, 1 | F32 | blk.0.ffn_norm.weight
|
75 |
+
15: 62914560 | 5120, 12288, 1, 1 | Q4_K | blk.0.ffn_up.weight
|
76 |
+
16: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.1.attn_kv_a_mqa.weight
|
77 |
+
17: 512 | 512, 1, 1, 1 | F32 | blk.1.attn_kv_a_norm.weight
|
78 |
+
18: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.1.attn_kv_b.weight
|
79 |
+
19: 5120 | 5120, 1, 1, 1 | F32 | blk.1.attn_norm.weight
|
80 |
+
20: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.1.attn_output.weight
|
81 |
+
21: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.1.attn_q_a.weight
|
82 |
+
22: 1536 | 1536, 1, 1, 1 | F32 | blk.1.attn_q_a_norm.weight
|
83 |
+
23: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.1.attn_q_b.weight
|
84 |
+
24: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.1.ffn_down_exps.weight
|
85 |
+
25: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.1.ffn_down_shexp.weight
|
86 |
+
26: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.1.ffn_gate_exps.weight
|
87 |
+
27: 819200 | 5120, 160, 1, 1 | F32 | blk.1.ffn_gate_inp.weight
|
88 |
+
28: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.1.ffn_gate_shexp.weight
|
89 |
+
29: 5120 | 5120, 1, 1, 1 | F32 | blk.1.ffn_norm.weight
|
90 |
+
30: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.1.ffn_up_exps.weight
|
91 |
+
31: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.1.ffn_up_shexp.weight
|
92 |
+
32: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.2.attn_kv_a_mqa.weight
|
93 |
+
33: 512 | 512, 1, 1, 1 | F32 | blk.2.attn_kv_a_norm.weight
|
94 |
+
34: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.2.attn_kv_b.weight
|
95 |
+
35: 5120 | 5120, 1, 1, 1 | F32 | blk.2.attn_norm.weight
|
96 |
+
36: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.2.attn_output.weight
|
97 |
+
37: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.2.attn_q_a.weight
|
98 |
+
38: 1536 | 1536, 1, 1, 1 | F32 | blk.2.attn_q_a_norm.weight
|
99 |
+
39: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.2.attn_q_b.weight
|
100 |
+
40: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.2.ffn_down_exps.weight
|
101 |
+
41: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.2.ffn_down_shexp.weight
|
102 |
+
42: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.2.ffn_gate_exps.weight
|
103 |
+
43: 819200 | 5120, 160, 1, 1 | F32 | blk.2.ffn_gate_inp.weight
|
104 |
+
44: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.2.ffn_gate_shexp.weight
|
105 |
+
45: 5120 | 5120, 1, 1, 1 | F32 | blk.2.ffn_norm.weight
|
106 |
+
46: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.2.ffn_up_exps.weight
|
107 |
+
47: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.2.ffn_up_shexp.weight
|
108 |
+
48: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.3.attn_kv_a_mqa.weight
|
109 |
+
49: 512 | 512, 1, 1, 1 | F32 | blk.3.attn_kv_a_norm.weight
|
110 |
+
50: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.3.attn_kv_b.weight
|
111 |
+
51: 5120 | 5120, 1, 1, 1 | F32 | blk.3.attn_norm.weight
|
112 |
+
52: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.3.attn_output.weight
|
113 |
+
53: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.3.attn_q_a.weight
|
114 |
+
54: 1536 | 1536, 1, 1, 1 | F32 | blk.3.attn_q_a_norm.weight
|
115 |
+
55: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.3.attn_q_b.weight
|
116 |
+
56: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.3.ffn_down_exps.weight
|
117 |
+
57: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.3.ffn_down_shexp.weight
|
118 |
+
58: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.3.ffn_gate_exps.weight
|
119 |
+
59: 819200 | 5120, 160, 1, 1 | F32 | blk.3.ffn_gate_inp.weight
|
120 |
+
60: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.3.ffn_gate_shexp.weight
|
121 |
+
61: 5120 | 5120, 1, 1, 1 | F32 | blk.3.ffn_norm.weight
|
122 |
+
62: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.3.ffn_up_exps.weight
|
123 |
+
63: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.3.ffn_up_shexp.weight
|
124 |
+
64: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.4.attn_kv_a_mqa.weight
|
125 |
+
65: 512 | 512, 1, 1, 1 | F32 | blk.4.attn_kv_a_norm.weight
|
126 |
+
66: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.4.attn_kv_b.weight
|
127 |
+
67: 5120 | 5120, 1, 1, 1 | F32 | blk.4.attn_norm.weight
|
128 |
+
68: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.4.attn_output.weight
|
129 |
+
69: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.4.attn_q_a.weight
|
130 |
+
70: 1536 | 1536, 1, 1, 1 | F32 | blk.4.attn_q_a_norm.weight
|
131 |
+
71: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.4.attn_q_b.weight
|
132 |
+
72: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.4.ffn_down_exps.weight
|
133 |
+
73: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.4.ffn_down_shexp.weight
|
134 |
+
74: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.4.ffn_gate_exps.weight
|
135 |
+
75: 819200 | 5120, 160, 1, 1 | F32 | blk.4.ffn_gate_inp.weight
|
136 |
+
76: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.4.ffn_gate_shexp.weight
|
137 |
+
77: 5120 | 5120, 1, 1, 1 | F32 | blk.4.ffn_norm.weight
|
138 |
+
78: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.4.ffn_up_exps.weight
|
139 |
+
79: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.4.ffn_up_shexp.weight
|
140 |
+
80: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.5.attn_kv_a_mqa.weight
|
141 |
+
81: 512 | 512, 1, 1, 1 | F32 | blk.5.attn_kv_a_norm.weight
|
142 |
+
82: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.5.attn_kv_b.weight
|
143 |
+
83: 5120 | 5120, 1, 1, 1 | F32 | blk.5.attn_norm.weight
|
144 |
+
84: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.5.attn_output.weight
|
145 |
+
85: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.5.attn_q_a.weight
|
146 |
+
86: 1536 | 1536, 1, 1, 1 | F32 | blk.5.attn_q_a_norm.weight
|
147 |
+
87: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.5.attn_q_b.weight
|
148 |
+
88: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.5.ffn_down_exps.weight
|
149 |
+
89: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.5.ffn_down_shexp.weight
|
150 |
+
90: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.5.ffn_gate_exps.weight
|
151 |
+
91: 819200 | 5120, 160, 1, 1 | F32 | blk.5.ffn_gate_inp.weight
|
152 |
+
92: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.5.ffn_gate_shexp.weight
|
153 |
+
93: 5120 | 5120, 1, 1, 1 | F32 | blk.5.ffn_norm.weight
|
154 |
+
94: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.5.ffn_up_exps.weight
|
155 |
+
95: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.5.ffn_up_shexp.weight
|
156 |
+
96: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.6.attn_kv_a_mqa.weight
|
157 |
+
97: 512 | 512, 1, 1, 1 | F32 | blk.6.attn_kv_a_norm.weight
|
158 |
+
98: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.6.attn_kv_b.weight
|
159 |
+
99: 5120 | 5120, 1, 1, 1 | F32 | blk.6.attn_norm.weight
|
160 |
+
100: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.6.attn_output.weight
|
161 |
+
101: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.6.attn_q_a.weight
|
162 |
+
102: 1536 | 1536, 1, 1, 1 | F32 | blk.6.attn_q_a_norm.weight
|
163 |
+
103: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.6.attn_q_b.weight
|
164 |
+
104: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.6.ffn_down_exps.weight
|
165 |
+
105: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.6.ffn_down_shexp.weight
|
166 |
+
106: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.6.ffn_gate_exps.weight
|
167 |
+
107: 819200 | 5120, 160, 1, 1 | F32 | blk.6.ffn_gate_inp.weight
|
168 |
+
108: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.6.ffn_gate_shexp.weight
|
169 |
+
109: 5120 | 5120, 1, 1, 1 | F32 | blk.6.ffn_norm.weight
|
170 |
+
110: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.6.ffn_up_exps.weight
|
171 |
+
111: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.6.ffn_up_shexp.weight
|
172 |
+
112: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.7.attn_kv_a_mqa.weight
|
173 |
+
113: 512 | 512, 1, 1, 1 | F32 | blk.7.attn_kv_a_norm.weight
|
174 |
+
114: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.7.attn_kv_b.weight
|
175 |
+
115: 5120 | 5120, 1, 1, 1 | F32 | blk.7.attn_norm.weight
|
176 |
+
116: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.7.attn_output.weight
|
177 |
+
117: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.7.attn_q_a.weight
|
178 |
+
118: 1536 | 1536, 1, 1, 1 | F32 | blk.7.attn_q_a_norm.weight
|
179 |
+
119: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.7.attn_q_b.weight
|
180 |
+
120: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.7.ffn_down_exps.weight
|
181 |
+
121: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.7.ffn_down_shexp.weight
|
182 |
+
122: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.7.ffn_gate_exps.weight
|
183 |
+
123: 819200 | 5120, 160, 1, 1 | F32 | blk.7.ffn_gate_inp.weight
|
184 |
+
124: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.7.ffn_gate_shexp.weight
|
185 |
+
125: 5120 | 5120, 1, 1, 1 | F32 | blk.7.ffn_norm.weight
|
186 |
+
126: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.7.ffn_up_exps.weight
|
187 |
+
127: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.7.ffn_up_shexp.weight
|
188 |
+
128: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.8.attn_kv_a_mqa.weight
|
189 |
+
129: 512 | 512, 1, 1, 1 | F32 | blk.8.attn_kv_a_norm.weight
|
190 |
+
130: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.8.attn_kv_b.weight
|
191 |
+
131: 5120 | 5120, 1, 1, 1 | F32 | blk.8.attn_norm.weight
|
192 |
+
132: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.8.attn_output.weight
|
193 |
+
133: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.8.attn_q_a.weight
|
194 |
+
134: 1536 | 1536, 1, 1, 1 | F32 | blk.8.attn_q_a_norm.weight
|
195 |
+
135: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.8.attn_q_b.weight
|
196 |
+
136: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.8.ffn_down_exps.weight
|
197 |
+
137: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.8.ffn_down_shexp.weight
|
198 |
+
138: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.8.ffn_gate_exps.weight
|
199 |
+
139: 819200 | 5120, 160, 1, 1 | F32 | blk.8.ffn_gate_inp.weight
|
200 |
+
140: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.8.ffn_gate_shexp.weight
|
201 |
+
141: 5120 | 5120, 1, 1, 1 | F32 | blk.8.ffn_norm.weight
|
202 |
+
142: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.8.ffn_up_exps.weight
|
203 |
+
143: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.8.ffn_up_shexp.weight
|
204 |
+
144: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.9.attn_kv_a_mqa.weight
|
205 |
+
145: 512 | 512, 1, 1, 1 | F32 | blk.9.attn_kv_a_norm.weight
|
206 |
+
146: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.9.attn_kv_b.weight
|
207 |
+
147: 5120 | 5120, 1, 1, 1 | F32 | blk.9.attn_norm.weight
|
208 |
+
148: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.9.attn_output.weight
|
209 |
+
149: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.9.attn_q_a.weight
|
210 |
+
150: 1536 | 1536, 1, 1, 1 | F32 | blk.9.attn_q_a_norm.weight
|
211 |
+
151: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.9.attn_q_b.weight
|
212 |
+
152: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.9.ffn_down_exps.weight
|
213 |
+
153: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.9.ffn_down_shexp.weight
|
214 |
+
154: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.9.ffn_gate_exps.weight
|
215 |
+
155: 819200 | 5120, 160, 1, 1 | F32 | blk.9.ffn_gate_inp.weight
|
216 |
+
156: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.9.ffn_gate_shexp.weight
|
217 |
+
157: 5120 | 5120, 1, 1, 1 | F32 | blk.9.ffn_norm.weight
|
218 |
+
158: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.9.ffn_up_exps.weight
|
219 |
+
159: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.9.ffn_up_shexp.weight
|
220 |
+
160: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.10.attn_kv_a_mqa.weight
|
221 |
+
161: 512 | 512, 1, 1, 1 | F32 | blk.10.attn_kv_a_norm.weight
|
222 |
+
162: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.10.attn_kv_b.weight
|
223 |
+
163: 5120 | 5120, 1, 1, 1 | F32 | blk.10.attn_norm.weight
|
224 |
+
164: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.10.attn_output.weight
|
225 |
+
165: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.10.attn_q_a.weight
|
226 |
+
166: 1536 | 1536, 1, 1, 1 | F32 | blk.10.attn_q_a_norm.weight
|
227 |
+
167: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.10.attn_q_b.weight
|
228 |
+
168: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.10.ffn_down_exps.weight
|
229 |
+
169: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.10.ffn_down_shexp.weight
|
230 |
+
170: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.10.ffn_gate_exps.weight
|
231 |
+
171: 819200 | 5120, 160, 1, 1 | F32 | blk.10.ffn_gate_inp.weight
|
232 |
+
172: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.10.ffn_gate_shexp.weight
|
233 |
+
173: 5120 | 5120, 1, 1, 1 | F32 | blk.10.ffn_norm.weight
|
234 |
+
174: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.10.ffn_up_exps.weight
|
235 |
+
175: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.10.ffn_up_shexp.weight
|
236 |
+
176: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.11.attn_kv_a_mqa.weight
|
237 |
+
177: 512 | 512, 1, 1, 1 | F32 | blk.11.attn_kv_a_norm.weight
|
238 |
+
178: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.11.attn_kv_b.weight
|
239 |
+
179: 5120 | 5120, 1, 1, 1 | F32 | blk.11.attn_norm.weight
|
240 |
+
180: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.11.attn_output.weight
|
241 |
+
181: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.11.attn_q_a.weight
|
242 |
+
182: 1536 | 1536, 1, 1, 1 | F32 | blk.11.attn_q_a_norm.weight
|
243 |
+
183: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.11.attn_q_b.weight
|
244 |
+
184: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.11.ffn_down_exps.weight
|
245 |
+
185: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.11.ffn_down_shexp.weight
|
246 |
+
186: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.11.ffn_gate_exps.weight
|
247 |
+
187: 819200 | 5120, 160, 1, 1 | F32 | blk.11.ffn_gate_inp.weight
|
248 |
+
188: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.11.ffn_gate_shexp.weight
|
249 |
+
189: 5120 | 5120, 1, 1, 1 | F32 | blk.11.ffn_norm.weight
|
250 |
+
190: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.11.ffn_up_exps.weight
|
251 |
+
191: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.11.ffn_up_shexp.weight
|
252 |
+
192: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.12.attn_kv_a_mqa.weight
|
253 |
+
193: 512 | 512, 1, 1, 1 | F32 | blk.12.attn_kv_a_norm.weight
|
254 |
+
194: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.12.attn_kv_b.weight
|
255 |
+
195: 5120 | 5120, 1, 1, 1 | F32 | blk.12.attn_norm.weight
|
256 |
+
196: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.12.attn_output.weight
|
257 |
+
197: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.12.attn_q_a.weight
|
258 |
+
198: 1536 | 1536, 1, 1, 1 | F32 | blk.12.attn_q_a_norm.weight
|
259 |
+
199: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.12.attn_q_b.weight
|
260 |
+
200: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.12.ffn_down_exps.weight
|
261 |
+
201: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.12.ffn_down_shexp.weight
|
262 |
+
202: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.12.ffn_gate_exps.weight
|
263 |
+
203: 819200 | 5120, 160, 1, 1 | F32 | blk.12.ffn_gate_inp.weight
|
264 |
+
204: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.12.ffn_gate_shexp.weight
|
265 |
+
205: 5120 | 5120, 1, 1, 1 | F32 | blk.12.ffn_norm.weight
|
266 |
+
206: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.12.ffn_up_exps.weight
|
267 |
+
207: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.12.ffn_up_shexp.weight
|
268 |
+
208: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.13.attn_kv_a_mqa.weight
|
269 |
+
209: 512 | 512, 1, 1, 1 | F32 | blk.13.attn_kv_a_norm.weight
|
270 |
+
210: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.13.attn_kv_b.weight
|
271 |
+
211: 5120 | 5120, 1, 1, 1 | F32 | blk.13.attn_norm.weight
|
272 |
+
212: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.13.attn_output.weight
|
273 |
+
213: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.13.attn_q_a.weight
|
274 |
+
214: 1536 | 1536, 1, 1, 1 | F32 | blk.13.attn_q_a_norm.weight
|
275 |
+
215: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.13.attn_q_b.weight
|
276 |
+
216: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.13.ffn_down_exps.weight
|
277 |
+
217: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.13.ffn_down_shexp.weight
|
278 |
+
218: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.13.ffn_gate_exps.weight
|
279 |
+
219: 819200 | 5120, 160, 1, 1 | F32 | blk.13.ffn_gate_inp.weight
|
280 |
+
220: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.13.ffn_gate_shexp.weight
|
281 |
+
221: 5120 | 5120, 1, 1, 1 | F32 | blk.13.ffn_norm.weight
|
282 |
+
222: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.13.ffn_up_exps.weight
|
283 |
+
223: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.13.ffn_up_shexp.weight
|
284 |
+
224: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.14.attn_kv_a_mqa.weight
|
285 |
+
225: 512 | 512, 1, 1, 1 | F32 | blk.14.attn_kv_a_norm.weight
|
286 |
+
226: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.14.attn_kv_b.weight
|
287 |
+
227: 5120 | 5120, 1, 1, 1 | F32 | blk.14.attn_norm.weight
|
288 |
+
228: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.14.attn_output.weight
|
289 |
+
229: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.14.attn_q_a.weight
|
290 |
+
230: 1536 | 1536, 1, 1, 1 | F32 | blk.14.attn_q_a_norm.weight
|
291 |
+
231: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.14.attn_q_b.weight
|
292 |
+
232: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.14.ffn_down_exps.weight
|
293 |
+
233: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.14.ffn_down_shexp.weight
|
294 |
+
234: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.14.ffn_gate_exps.weight
|
295 |
+
235: 819200 | 5120, 160, 1, 1 | F32 | blk.14.ffn_gate_inp.weight
|
296 |
+
236: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.14.ffn_gate_shexp.weight
|
297 |
+
237: 5120 | 5120, 1, 1, 1 | F32 | blk.14.ffn_norm.weight
|
298 |
+
238: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.14.ffn_up_exps.weight
|
299 |
+
239: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.14.ffn_up_shexp.weight
|
300 |
+
240: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.15.attn_kv_a_mqa.weight
|
301 |
+
241: 512 | 512, 1, 1, 1 | F32 | blk.15.attn_kv_a_norm.weight
|
302 |
+
242: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.15.attn_kv_b.weight
|
303 |
+
243: 5120 | 5120, 1, 1, 1 | F32 | blk.15.attn_norm.weight
|
304 |
+
244: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.15.attn_output.weight
|
305 |
+
245: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.15.attn_q_a.weight
|
306 |
+
246: 1536 | 1536, 1, 1, 1 | F32 | blk.15.attn_q_a_norm.weight
|
307 |
+
247: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.15.attn_q_b.weight
|
308 |
+
248: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.15.ffn_down_exps.weight
|
309 |
+
249: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.15.ffn_down_shexp.weight
|
310 |
+
250: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.15.ffn_gate_exps.weight
|
311 |
+
251: 819200 | 5120, 160, 1, 1 | F32 | blk.15.ffn_gate_inp.weight
|
312 |
+
252: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.15.ffn_gate_shexp.weight
|
313 |
+
253: 5120 | 5120, 1, 1, 1 | F32 | blk.15.ffn_norm.weight
|
314 |
+
254: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.15.ffn_up_exps.weight
|
315 |
+
255: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.15.ffn_up_shexp.weight
|
316 |
+
256: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.16.attn_kv_a_mqa.weight
|
317 |
+
257: 512 | 512, 1, 1, 1 | F32 | blk.16.attn_kv_a_norm.weight
|
318 |
+
258: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.16.attn_kv_b.weight
|
319 |
+
259: 5120 | 5120, 1, 1, 1 | F32 | blk.16.attn_norm.weight
|
320 |
+
260: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.16.attn_output.weight
|
321 |
+
261: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.16.attn_q_a.weight
|
322 |
+
262: 1536 | 1536, 1, 1, 1 | F32 | blk.16.attn_q_a_norm.weight
|
323 |
+
263: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.16.attn_q_b.weight
|
324 |
+
264: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.16.ffn_down_exps.weight
|
325 |
+
265: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.16.ffn_down_shexp.weight
|
326 |
+
266: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.16.ffn_gate_exps.weight
|
327 |
+
267: 819200 | 5120, 160, 1, 1 | F32 | blk.16.ffn_gate_inp.weight
|
328 |
+
268: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.16.ffn_gate_shexp.weight
|
329 |
+
269: 5120 | 5120, 1, 1, 1 | F32 | blk.16.ffn_norm.weight
|
330 |
+
270: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.16.ffn_up_exps.weight
|
331 |
+
271: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.16.ffn_up_shexp.weight
|
332 |
+
272: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.17.attn_kv_a_mqa.weight
|
333 |
+
273: 512 | 512, 1, 1, 1 | F32 | blk.17.attn_kv_a_norm.weight
|
334 |
+
274: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.17.attn_kv_b.weight
|
335 |
+
275: 5120 | 5120, 1, 1, 1 | F32 | blk.17.attn_norm.weight
|
336 |
+
276: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.17.attn_output.weight
|
337 |
+
277: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.17.attn_q_a.weight
|
338 |
+
278: 1536 | 1536, 1, 1, 1 | F32 | blk.17.attn_q_a_norm.weight
|
339 |
+
279: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.17.attn_q_b.weight
|
340 |
+
280: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.17.ffn_down_exps.weight
|
341 |
+
281: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.17.ffn_down_shexp.weight
|
342 |
+
282: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.17.ffn_gate_exps.weight
|
343 |
+
283: 819200 | 5120, 160, 1, 1 | F32 | blk.17.ffn_gate_inp.weight
|
344 |
+
284: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.17.ffn_gate_shexp.weight
|
345 |
+
285: 5120 | 5120, 1, 1, 1 | F32 | blk.17.ffn_norm.weight
|
346 |
+
286: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.17.ffn_up_exps.weight
|
347 |
+
287: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.17.ffn_up_shexp.weight
|
348 |
+
288: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.18.attn_kv_a_mqa.weight
|
349 |
+
289: 512 | 512, 1, 1, 1 | F32 | blk.18.attn_kv_a_norm.weight
|
350 |
+
290: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.18.attn_kv_b.weight
|
351 |
+
291: 5120 | 5120, 1, 1, 1 | F32 | blk.18.attn_norm.weight
|
352 |
+
292: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.18.attn_output.weight
|
353 |
+
293: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.18.attn_q_a.weight
|
354 |
+
294: 1536 | 1536, 1, 1, 1 | F32 | blk.18.attn_q_a_norm.weight
|
355 |
+
295: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.18.attn_q_b.weight
|
356 |
+
296: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.18.ffn_down_exps.weight
|
357 |
+
297: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.18.ffn_down_shexp.weight
|
358 |
+
298: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.18.ffn_gate_exps.weight
|
359 |
+
299: 819200 | 5120, 160, 1, 1 | F32 | blk.18.ffn_gate_inp.weight
|
360 |
+
300: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.18.ffn_gate_shexp.weight
|
361 |
+
301: 5120 | 5120, 1, 1, 1 | F32 | blk.18.ffn_norm.weight
|
362 |
+
302: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.18.ffn_up_exps.weight
|
363 |
+
303: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.18.ffn_up_shexp.weight
|
364 |
+
304: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.19.attn_kv_a_mqa.weight
|
365 |
+
305: 512 | 512, 1, 1, 1 | F32 | blk.19.attn_kv_a_norm.weight
|
366 |
+
306: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.19.attn_kv_b.weight
|
367 |
+
307: 5120 | 5120, 1, 1, 1 | F32 | blk.19.attn_norm.weight
|
368 |
+
308: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.19.attn_output.weight
|
369 |
+
309: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.19.attn_q_a.weight
|
370 |
+
310: 1536 | 1536, 1, 1, 1 | F32 | blk.19.attn_q_a_norm.weight
|
371 |
+
311: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.19.attn_q_b.weight
|
372 |
+
312: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.19.ffn_down_exps.weight
|
373 |
+
313: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.19.ffn_down_shexp.weight
|
374 |
+
314: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.19.ffn_gate_exps.weight
|
375 |
+
315: 819200 | 5120, 160, 1, 1 | F32 | blk.19.ffn_gate_inp.weight
|
376 |
+
316: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.19.ffn_gate_shexp.weight
|
377 |
+
317: 5120 | 5120, 1, 1, 1 | F32 | blk.19.ffn_norm.weight
|
378 |
+
318: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.19.ffn_up_exps.weight
|
379 |
+
319: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.19.ffn_up_shexp.weight
|
380 |
+
320: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.20.attn_kv_a_mqa.weight
|
381 |
+
321: 512 | 512, 1, 1, 1 | F32 | blk.20.attn_kv_a_norm.weight
|
382 |
+
322: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.20.attn_kv_b.weight
|
383 |
+
323: 5120 | 5120, 1, 1, 1 | F32 | blk.20.attn_norm.weight
|
384 |
+
324: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.20.attn_output.weight
|
385 |
+
325: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.20.attn_q_a.weight
|
386 |
+
326: 1536 | 1536, 1, 1, 1 | F32 | blk.20.attn_q_a_norm.weight
|
387 |
+
327: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.20.attn_q_b.weight
|
388 |
+
328: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.20.ffn_down_exps.weight
|
389 |
+
329: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.20.ffn_down_shexp.weight
|
390 |
+
330: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.20.ffn_gate_exps.weight
|
391 |
+
331: 819200 | 5120, 160, 1, 1 | F32 | blk.20.ffn_gate_inp.weight
|
392 |
+
332: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.20.ffn_gate_shexp.weight
|
393 |
+
333: 5120 | 5120, 1, 1, 1 | F32 | blk.20.ffn_norm.weight
|
394 |
+
334: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.20.ffn_up_exps.weight
|
395 |
+
335: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.20.ffn_up_shexp.weight
|
396 |
+
336: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.21.attn_kv_a_mqa.weight
|
397 |
+
337: 512 | 512, 1, 1, 1 | F32 | blk.21.attn_kv_a_norm.weight
|
398 |
+
338: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.21.attn_kv_b.weight
|
399 |
+
339: 5120 | 5120, 1, 1, 1 | F32 | blk.21.attn_norm.weight
|
400 |
+
340: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.21.attn_output.weight
|
401 |
+
341: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.21.attn_q_a.weight
|
402 |
+
342: 1536 | 1536, 1, 1, 1 | F32 | blk.21.attn_q_a_norm.weight
|
403 |
+
343: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.21.attn_q_b.weight
|
404 |
+
344: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.21.ffn_down_exps.weight
|
405 |
+
345: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.21.ffn_down_shexp.weight
|
406 |
+
346: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.21.ffn_gate_exps.weight
|
407 |
+
347: 819200 | 5120, 160, 1, 1 | F32 | blk.21.ffn_gate_inp.weight
|
408 |
+
348: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.21.ffn_gate_shexp.weight
|
409 |
+
349: 5120 | 5120, 1, 1, 1 | F32 | blk.21.ffn_norm.weight
|
410 |
+
350: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.21.ffn_up_exps.weight
|
411 |
+
351: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.21.ffn_up_shexp.weight
|
412 |
+
352: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.22.attn_kv_a_mqa.weight
|
413 |
+
353: 512 | 512, 1, 1, 1 | F32 | blk.22.attn_kv_a_norm.weight
|
414 |
+
354: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.22.attn_kv_b.weight
|
415 |
+
355: 5120 | 5120, 1, 1, 1 | F32 | blk.22.attn_norm.weight
|
416 |
+
356: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.22.attn_output.weight
|
417 |
+
357: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.22.attn_q_a.weight
|
418 |
+
358: 1536 | 1536, 1, 1, 1 | F32 | blk.22.attn_q_a_norm.weight
|
419 |
+
359: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.22.attn_q_b.weight
|
420 |
+
360: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.22.ffn_down_exps.weight
|
421 |
+
361: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.22.ffn_down_shexp.weight
|
422 |
+
362: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.22.ffn_gate_exps.weight
|
423 |
+
363: 819200 | 5120, 160, 1, 1 | F32 | blk.22.ffn_gate_inp.weight
|
424 |
+
364: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.22.ffn_gate_shexp.weight
|
425 |
+
365: 5120 | 5120, 1, 1, 1 | F32 | blk.22.ffn_norm.weight
|
426 |
+
366: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.22.ffn_up_exps.weight
|
427 |
+
367: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.22.ffn_up_shexp.weight
|
428 |
+
368: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.23.attn_kv_a_mqa.weight
|
429 |
+
369: 512 | 512, 1, 1, 1 | F32 | blk.23.attn_kv_a_norm.weight
|
430 |
+
370: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.23.attn_kv_b.weight
|
431 |
+
371: 5120 | 5120, 1, 1, 1 | F32 | blk.23.attn_norm.weight
|
432 |
+
372: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.23.attn_output.weight
|
433 |
+
373: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.23.attn_q_a.weight
|
434 |
+
374: 1536 | 1536, 1, 1, 1 | F32 | blk.23.attn_q_a_norm.weight
|
435 |
+
375: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.23.attn_q_b.weight
|
436 |
+
376: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.23.ffn_down_exps.weight
|
437 |
+
377: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.23.ffn_down_shexp.weight
|
438 |
+
378: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.23.ffn_gate_exps.weight
|
439 |
+
379: 819200 | 5120, 160, 1, 1 | F32 | blk.23.ffn_gate_inp.weight
|
440 |
+
380: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.23.ffn_gate_shexp.weight
|
441 |
+
381: 5120 | 5120, 1, 1, 1 | F32 | blk.23.ffn_norm.weight
|
442 |
+
382: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.23.ffn_up_exps.weight
|
443 |
+
383: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.23.ffn_up_shexp.weight
|
444 |
+
384: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.24.attn_kv_a_mqa.weight
|
445 |
+
385: 512 | 512, 1, 1, 1 | F32 | blk.24.attn_kv_a_norm.weight
|
446 |
+
386: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.24.attn_kv_b.weight
|
447 |
+
387: 5120 | 5120, 1, 1, 1 | F32 | blk.24.attn_norm.weight
|
448 |
+
388: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.24.attn_output.weight
|
449 |
+
389: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.24.attn_q_a.weight
|
450 |
+
390: 1536 | 1536, 1, 1, 1 | F32 | blk.24.attn_q_a_norm.weight
|
451 |
+
391: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.24.attn_q_b.weight
|
452 |
+
392: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.24.ffn_down_exps.weight
|
453 |
+
393: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.24.ffn_down_shexp.weight
|
454 |
+
394: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.24.ffn_gate_exps.weight
|
455 |
+
395: 819200 | 5120, 160, 1, 1 | F32 | blk.24.ffn_gate_inp.weight
|
456 |
+
396: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.24.ffn_gate_shexp.weight
|
457 |
+
397: 5120 | 5120, 1, 1, 1 | F32 | blk.24.ffn_norm.weight
|
458 |
+
398: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.24.ffn_up_exps.weight
|
459 |
+
399: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.24.ffn_up_shexp.weight
|
460 |
+
400: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.25.attn_kv_a_mqa.weight
|
461 |
+
401: 512 | 512, 1, 1, 1 | F32 | blk.25.attn_kv_a_norm.weight
|
462 |
+
402: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.25.attn_kv_b.weight
|
463 |
+
403: 5120 | 5120, 1, 1, 1 | F32 | blk.25.attn_norm.weight
|
464 |
+
404: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.25.attn_output.weight
|
465 |
+
405: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.25.attn_q_a.weight
|
466 |
+
406: 1536 | 1536, 1, 1, 1 | F32 | blk.25.attn_q_a_norm.weight
|
467 |
+
407: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.25.attn_q_b.weight
|
468 |
+
408: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.25.ffn_down_exps.weight
|
469 |
+
409: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.25.ffn_down_shexp.weight
|
470 |
+
410: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.25.ffn_gate_exps.weight
|
471 |
+
411: 819200 | 5120, 160, 1, 1 | F32 | blk.25.ffn_gate_inp.weight
|
472 |
+
412: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.25.ffn_gate_shexp.weight
|
473 |
+
413: 5120 | 5120, 1, 1, 1 | F32 | blk.25.ffn_norm.weight
|
474 |
+
414: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.25.ffn_up_exps.weight
|
475 |
+
415: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.25.ffn_up_shexp.weight
|
476 |
+
416: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.26.attn_kv_a_mqa.weight
|
477 |
+
417: 512 | 512, 1, 1, 1 | F32 | blk.26.attn_kv_a_norm.weight
|
478 |
+
418: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.26.attn_kv_b.weight
|
479 |
+
419: 5120 | 5120, 1, 1, 1 | F32 | blk.26.attn_norm.weight
|
480 |
+
420: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.26.attn_output.weight
|
481 |
+
421: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.26.attn_q_a.weight
|
482 |
+
422: 1536 | 1536, 1, 1, 1 | F32 | blk.26.attn_q_a_norm.weight
|
483 |
+
423: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.26.attn_q_b.weight
|
484 |
+
424: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.26.ffn_down_exps.weight
|
485 |
+
425: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.26.ffn_down_shexp.weight
|
486 |
+
426: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.26.ffn_gate_exps.weight
|
487 |
+
427: 819200 | 5120, 160, 1, 1 | F32 | blk.26.ffn_gate_inp.weight
|
488 |
+
428: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.26.ffn_gate_shexp.weight
|
489 |
+
429: 5120 | 5120, 1, 1, 1 | F32 | blk.26.ffn_norm.weight
|
490 |
+
430: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.26.ffn_up_exps.weight
|
491 |
+
431: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.26.ffn_up_shexp.weight
|
492 |
+
432: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.27.attn_kv_a_mqa.weight
|
493 |
+
433: 512 | 512, 1, 1, 1 | F32 | blk.27.attn_kv_a_norm.weight
|
494 |
+
434: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.27.attn_kv_b.weight
|
495 |
+
435: 5120 | 5120, 1, 1, 1 | F32 | blk.27.attn_norm.weight
|
496 |
+
436: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.27.attn_output.weight
|
497 |
+
437: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.27.attn_q_a.weight
|
498 |
+
438: 1536 | 1536, 1, 1, 1 | F32 | blk.27.attn_q_a_norm.weight
|
499 |
+
439: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.27.attn_q_b.weight
|
500 |
+
440: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.27.ffn_down_exps.weight
|
501 |
+
441: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.27.ffn_down_shexp.weight
|
502 |
+
442: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.27.ffn_gate_exps.weight
|
503 |
+
443: 819200 | 5120, 160, 1, 1 | F32 | blk.27.ffn_gate_inp.weight
|
504 |
+
444: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.27.ffn_gate_shexp.weight
|
505 |
+
445: 5120 | 5120, 1, 1, 1 | F32 | blk.27.ffn_norm.weight
|
506 |
+
446: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.27.ffn_up_exps.weight
|
507 |
+
447: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.27.ffn_up_shexp.weight
|
508 |
+
448: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.28.attn_kv_a_mqa.weight
|
509 |
+
449: 512 | 512, 1, 1, 1 | F32 | blk.28.attn_kv_a_norm.weight
|
510 |
+
450: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.28.attn_kv_b.weight
|
511 |
+
451: 5120 | 5120, 1, 1, 1 | F32 | blk.28.attn_norm.weight
|
512 |
+
452: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.28.attn_output.weight
|
513 |
+
453: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.28.attn_q_a.weight
|
514 |
+
454: 1536 | 1536, 1, 1, 1 | F32 | blk.28.attn_q_a_norm.weight
|
515 |
+
455: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.28.attn_q_b.weight
|
516 |
+
456: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.28.ffn_down_exps.weight
|
517 |
+
457: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.28.ffn_down_shexp.weight
|
518 |
+
458: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.28.ffn_gate_exps.weight
|
519 |
+
459: 819200 | 5120, 160, 1, 1 | F32 | blk.28.ffn_gate_inp.weight
|
520 |
+
460: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.28.ffn_gate_shexp.weight
|
521 |
+
461: 5120 | 5120, 1, 1, 1 | F32 | blk.28.ffn_norm.weight
|
522 |
+
462: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.28.ffn_up_exps.weight
|
523 |
+
463: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.28.ffn_up_shexp.weight
|
524 |
+
464: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.29.attn_kv_a_mqa.weight
|
525 |
+
465: 512 | 512, 1, 1, 1 | F32 | blk.29.attn_kv_a_norm.weight
|
526 |
+
466: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.29.attn_kv_b.weight
|
527 |
+
467: 5120 | 5120, 1, 1, 1 | F32 | blk.29.attn_norm.weight
|
528 |
+
468: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.29.attn_output.weight
|
529 |
+
469: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.29.attn_q_a.weight
|
530 |
+
470: 1536 | 1536, 1, 1, 1 | F32 | blk.29.attn_q_a_norm.weight
|
531 |
+
471: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.29.attn_q_b.weight
|
532 |
+
472: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.29.ffn_down_exps.weight
|
533 |
+
473: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.29.ffn_down_shexp.weight
|
534 |
+
474: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.29.ffn_gate_exps.weight
|
535 |
+
475: 819200 | 5120, 160, 1, 1 | F32 | blk.29.ffn_gate_inp.weight
|
536 |
+
476: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.29.ffn_gate_shexp.weight
|
537 |
+
477: 5120 | 5120, 1, 1, 1 | F32 | blk.29.ffn_norm.weight
|
538 |
+
478: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.29.ffn_up_exps.weight
|
539 |
+
479: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.29.ffn_up_shexp.weight
|
540 |
+
480: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.30.attn_kv_a_mqa.weight
|
DeepSeek-v2.5-1210-UD-iq1_s-00002-of-00002.gguf.tensors.txt
ADDED
@@ -0,0 +1,489 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
INFO:gguf-dump:* Loading: DeepSeek-v2.5-1210-UD-iq1_s-00002-of-00002.gguf
|
2 |
+
* File is LITTLE endian, script is running on a LITTLE endian host.
|
3 |
+
* Dumping 6 key/value pair(s)
|
4 |
+
1: UINT32 | 1 | GGUF.version = 3
|
5 |
+
2: UINT64 | 1 | GGUF.tensor_count = 479
|
6 |
+
3: UINT64 | 1 | GGUF.kv_count = 3
|
7 |
+
4: UINT16 | 1 | split.no = 1
|
8 |
+
5: INT32 | 1 | split.tensors.count = 959
|
9 |
+
6: UINT16 | 1 | split.count = 2
|
10 |
+
* Dumping 479 tensor(s)
|
11 |
+
1: 512 | 512, 1, 1, 1 | F32 | blk.30.attn_kv_a_norm.weight
|
12 |
+
2: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.30.attn_kv_b.weight
|
13 |
+
3: 5120 | 5120, 1, 1, 1 | F32 | blk.30.attn_norm.weight
|
14 |
+
4: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.30.attn_output.weight
|
15 |
+
5: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.30.attn_q_a.weight
|
16 |
+
6: 1536 | 1536, 1, 1, 1 | F32 | blk.30.attn_q_a_norm.weight
|
17 |
+
7: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.30.attn_q_b.weight
|
18 |
+
8: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.30.ffn_down_exps.weight
|
19 |
+
9: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.30.ffn_down_shexp.weight
|
20 |
+
10: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.30.ffn_gate_exps.weight
|
21 |
+
11: 819200 | 5120, 160, 1, 1 | F32 | blk.30.ffn_gate_inp.weight
|
22 |
+
12: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.30.ffn_gate_shexp.weight
|
23 |
+
13: 5120 | 5120, 1, 1, 1 | F32 | blk.30.ffn_norm.weight
|
24 |
+
14: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.30.ffn_up_exps.weight
|
25 |
+
15: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.30.ffn_up_shexp.weight
|
26 |
+
16: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.31.attn_kv_a_mqa.weight
|
27 |
+
17: 512 | 512, 1, 1, 1 | F32 | blk.31.attn_kv_a_norm.weight
|
28 |
+
18: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.31.attn_kv_b.weight
|
29 |
+
19: 5120 | 5120, 1, 1, 1 | F32 | blk.31.attn_norm.weight
|
30 |
+
20: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.31.attn_output.weight
|
31 |
+
21: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.31.attn_q_a.weight
|
32 |
+
22: 1536 | 1536, 1, 1, 1 | F32 | blk.31.attn_q_a_norm.weight
|
33 |
+
23: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.31.attn_q_b.weight
|
34 |
+
24: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.31.ffn_down_exps.weight
|
35 |
+
25: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.31.ffn_down_shexp.weight
|
36 |
+
26: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.31.ffn_gate_exps.weight
|
37 |
+
27: 819200 | 5120, 160, 1, 1 | F32 | blk.31.ffn_gate_inp.weight
|
38 |
+
28: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.31.ffn_gate_shexp.weight
|
39 |
+
29: 5120 | 5120, 1, 1, 1 | F32 | blk.31.ffn_norm.weight
|
40 |
+
30: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.31.ffn_up_exps.weight
|
41 |
+
31: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.31.ffn_up_shexp.weight
|
42 |
+
32: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.32.attn_kv_a_mqa.weight
|
43 |
+
33: 512 | 512, 1, 1, 1 | F32 | blk.32.attn_kv_a_norm.weight
|
44 |
+
34: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.32.attn_kv_b.weight
|
45 |
+
35: 5120 | 5120, 1, 1, 1 | F32 | blk.32.attn_norm.weight
|
46 |
+
36: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.32.attn_output.weight
|
47 |
+
37: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.32.attn_q_a.weight
|
48 |
+
38: 1536 | 1536, 1, 1, 1 | F32 | blk.32.attn_q_a_norm.weight
|
49 |
+
39: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.32.attn_q_b.weight
|
50 |
+
40: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.32.ffn_down_exps.weight
|
51 |
+
41: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.32.ffn_down_shexp.weight
|
52 |
+
42: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.32.ffn_gate_exps.weight
|
53 |
+
43: 819200 | 5120, 160, 1, 1 | F32 | blk.32.ffn_gate_inp.weight
|
54 |
+
44: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.32.ffn_gate_shexp.weight
|
55 |
+
45: 5120 | 5120, 1, 1, 1 | F32 | blk.32.ffn_norm.weight
|
56 |
+
46: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.32.ffn_up_exps.weight
|
57 |
+
47: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.32.ffn_up_shexp.weight
|
58 |
+
48: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.33.attn_kv_a_mqa.weight
|
59 |
+
49: 512 | 512, 1, 1, 1 | F32 | blk.33.attn_kv_a_norm.weight
|
60 |
+
50: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.33.attn_kv_b.weight
|
61 |
+
51: 5120 | 5120, 1, 1, 1 | F32 | blk.33.attn_norm.weight
|
62 |
+
52: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.33.attn_output.weight
|
63 |
+
53: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.33.attn_q_a.weight
|
64 |
+
54: 1536 | 1536, 1, 1, 1 | F32 | blk.33.attn_q_a_norm.weight
|
65 |
+
55: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.33.attn_q_b.weight
|
66 |
+
56: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.33.ffn_down_exps.weight
|
67 |
+
57: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.33.ffn_down_shexp.weight
|
68 |
+
58: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.33.ffn_gate_exps.weight
|
69 |
+
59: 819200 | 5120, 160, 1, 1 | F32 | blk.33.ffn_gate_inp.weight
|
70 |
+
60: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.33.ffn_gate_shexp.weight
|
71 |
+
61: 5120 | 5120, 1, 1, 1 | F32 | blk.33.ffn_norm.weight
|
72 |
+
62: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.33.ffn_up_exps.weight
|
73 |
+
63: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.33.ffn_up_shexp.weight
|
74 |
+
64: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.34.attn_kv_a_mqa.weight
|
75 |
+
65: 512 | 512, 1, 1, 1 | F32 | blk.34.attn_kv_a_norm.weight
|
76 |
+
66: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.34.attn_kv_b.weight
|
77 |
+
67: 5120 | 5120, 1, 1, 1 | F32 | blk.34.attn_norm.weight
|
78 |
+
68: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.34.attn_output.weight
|
79 |
+
69: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.34.attn_q_a.weight
|
80 |
+
70: 1536 | 1536, 1, 1, 1 | F32 | blk.34.attn_q_a_norm.weight
|
81 |
+
71: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.34.attn_q_b.weight
|
82 |
+
72: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.34.ffn_down_exps.weight
|
83 |
+
73: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.34.ffn_down_shexp.weight
|
84 |
+
74: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.34.ffn_gate_exps.weight
|
85 |
+
75: 819200 | 5120, 160, 1, 1 | F32 | blk.34.ffn_gate_inp.weight
|
86 |
+
76: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.34.ffn_gate_shexp.weight
|
87 |
+
77: 5120 | 5120, 1, 1, 1 | F32 | blk.34.ffn_norm.weight
|
88 |
+
78: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.34.ffn_up_exps.weight
|
89 |
+
79: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.34.ffn_up_shexp.weight
|
90 |
+
80: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.35.attn_kv_a_mqa.weight
|
91 |
+
81: 512 | 512, 1, 1, 1 | F32 | blk.35.attn_kv_a_norm.weight
|
92 |
+
82: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.35.attn_kv_b.weight
|
93 |
+
83: 5120 | 5120, 1, 1, 1 | F32 | blk.35.attn_norm.weight
|
94 |
+
84: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.35.attn_output.weight
|
95 |
+
85: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.35.attn_q_a.weight
|
96 |
+
86: 1536 | 1536, 1, 1, 1 | F32 | blk.35.attn_q_a_norm.weight
|
97 |
+
87: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.35.attn_q_b.weight
|
98 |
+
88: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.35.ffn_down_exps.weight
|
99 |
+
89: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.35.ffn_down_shexp.weight
|
100 |
+
90: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.35.ffn_gate_exps.weight
|
101 |
+
91: 819200 | 5120, 160, 1, 1 | F32 | blk.35.ffn_gate_inp.weight
|
102 |
+
92: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.35.ffn_gate_shexp.weight
|
103 |
+
93: 5120 | 5120, 1, 1, 1 | F32 | blk.35.ffn_norm.weight
|
104 |
+
94: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.35.ffn_up_exps.weight
|
105 |
+
95: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.35.ffn_up_shexp.weight
|
106 |
+
96: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.36.attn_kv_a_mqa.weight
|
107 |
+
97: 512 | 512, 1, 1, 1 | F32 | blk.36.attn_kv_a_norm.weight
|
108 |
+
98: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.36.attn_kv_b.weight
|
109 |
+
99: 5120 | 5120, 1, 1, 1 | F32 | blk.36.attn_norm.weight
|
110 |
+
100: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.36.attn_output.weight
|
111 |
+
101: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.36.attn_q_a.weight
|
112 |
+
102: 1536 | 1536, 1, 1, 1 | F32 | blk.36.attn_q_a_norm.weight
|
113 |
+
103: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.36.attn_q_b.weight
|
114 |
+
104: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.36.ffn_down_exps.weight
|
115 |
+
105: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.36.ffn_down_shexp.weight
|
116 |
+
106: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.36.ffn_gate_exps.weight
|
117 |
+
107: 819200 | 5120, 160, 1, 1 | F32 | blk.36.ffn_gate_inp.weight
|
118 |
+
108: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.36.ffn_gate_shexp.weight
|
119 |
+
109: 5120 | 5120, 1, 1, 1 | F32 | blk.36.ffn_norm.weight
|
120 |
+
110: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.36.ffn_up_exps.weight
|
121 |
+
111: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.36.ffn_up_shexp.weight
|
122 |
+
112: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.37.attn_kv_a_mqa.weight
|
123 |
+
113: 512 | 512, 1, 1, 1 | F32 | blk.37.attn_kv_a_norm.weight
|
124 |
+
114: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.37.attn_kv_b.weight
|
125 |
+
115: 5120 | 5120, 1, 1, 1 | F32 | blk.37.attn_norm.weight
|
126 |
+
116: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.37.attn_output.weight
|
127 |
+
117: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.37.attn_q_a.weight
|
128 |
+
118: 1536 | 1536, 1, 1, 1 | F32 | blk.37.attn_q_a_norm.weight
|
129 |
+
119: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.37.attn_q_b.weight
|
130 |
+
120: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.37.ffn_down_exps.weight
|
131 |
+
121: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.37.ffn_down_shexp.weight
|
132 |
+
122: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.37.ffn_gate_exps.weight
|
133 |
+
123: 819200 | 5120, 160, 1, 1 | F32 | blk.37.ffn_gate_inp.weight
|
134 |
+
124: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.37.ffn_gate_shexp.weight
|
135 |
+
125: 5120 | 5120, 1, 1, 1 | F32 | blk.37.ffn_norm.weight
|
136 |
+
126: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.37.ffn_up_exps.weight
|
137 |
+
127: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.37.ffn_up_shexp.weight
|
138 |
+
128: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.38.attn_kv_a_mqa.weight
|
139 |
+
129: 512 | 512, 1, 1, 1 | F32 | blk.38.attn_kv_a_norm.weight
|
140 |
+
130: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.38.attn_kv_b.weight
|
141 |
+
131: 5120 | 5120, 1, 1, 1 | F32 | blk.38.attn_norm.weight
|
142 |
+
132: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.38.attn_output.weight
|
143 |
+
133: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.38.attn_q_a.weight
|
144 |
+
134: 1536 | 1536, 1, 1, 1 | F32 | blk.38.attn_q_a_norm.weight
|
145 |
+
135: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.38.attn_q_b.weight
|
146 |
+
136: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.38.ffn_down_exps.weight
|
147 |
+
137: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.38.ffn_down_shexp.weight
|
148 |
+
138: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.38.ffn_gate_exps.weight
|
149 |
+
139: 819200 | 5120, 160, 1, 1 | F32 | blk.38.ffn_gate_inp.weight
|
150 |
+
140: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.38.ffn_gate_shexp.weight
|
151 |
+
141: 5120 | 5120, 1, 1, 1 | F32 | blk.38.ffn_norm.weight
|
152 |
+
142: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.38.ffn_up_exps.weight
|
153 |
+
143: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.38.ffn_up_shexp.weight
|
154 |
+
144: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.39.attn_kv_a_mqa.weight
|
155 |
+
145: 512 | 512, 1, 1, 1 | F32 | blk.39.attn_kv_a_norm.weight
|
156 |
+
146: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.39.attn_kv_b.weight
|
157 |
+
147: 5120 | 5120, 1, 1, 1 | F32 | blk.39.attn_norm.weight
|
158 |
+
148: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.39.attn_output.weight
|
159 |
+
149: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.39.attn_q_a.weight
|
160 |
+
150: 1536 | 1536, 1, 1, 1 | F32 | blk.39.attn_q_a_norm.weight
|
161 |
+
151: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.39.attn_q_b.weight
|
162 |
+
152: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.39.ffn_down_exps.weight
|
163 |
+
153: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.39.ffn_down_shexp.weight
|
164 |
+
154: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.39.ffn_gate_exps.weight
|
165 |
+
155: 819200 | 5120, 160, 1, 1 | F32 | blk.39.ffn_gate_inp.weight
|
166 |
+
156: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.39.ffn_gate_shexp.weight
|
167 |
+
157: 5120 | 5120, 1, 1, 1 | F32 | blk.39.ffn_norm.weight
|
168 |
+
158: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.39.ffn_up_exps.weight
|
169 |
+
159: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.39.ffn_up_shexp.weight
|
170 |
+
160: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.40.attn_kv_a_mqa.weight
|
171 |
+
161: 512 | 512, 1, 1, 1 | F32 | blk.40.attn_kv_a_norm.weight
|
172 |
+
162: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.40.attn_kv_b.weight
|
173 |
+
163: 5120 | 5120, 1, 1, 1 | F32 | blk.40.attn_norm.weight
|
174 |
+
164: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.40.attn_output.weight
|
175 |
+
165: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.40.attn_q_a.weight
|
176 |
+
166: 1536 | 1536, 1, 1, 1 | F32 | blk.40.attn_q_a_norm.weight
|
177 |
+
167: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.40.attn_q_b.weight
|
178 |
+
168: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.40.ffn_down_exps.weight
|
179 |
+
169: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.40.ffn_down_shexp.weight
|
180 |
+
170: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.40.ffn_gate_exps.weight
|
181 |
+
171: 819200 | 5120, 160, 1, 1 | F32 | blk.40.ffn_gate_inp.weight
|
182 |
+
172: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.40.ffn_gate_shexp.weight
|
183 |
+
173: 5120 | 5120, 1, 1, 1 | F32 | blk.40.ffn_norm.weight
|
184 |
+
174: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.40.ffn_up_exps.weight
|
185 |
+
175: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.40.ffn_up_shexp.weight
|
186 |
+
176: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.41.attn_kv_a_mqa.weight
|
187 |
+
177: 512 | 512, 1, 1, 1 | F32 | blk.41.attn_kv_a_norm.weight
|
188 |
+
178: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.41.attn_kv_b.weight
|
189 |
+
179: 5120 | 5120, 1, 1, 1 | F32 | blk.41.attn_norm.weight
|
190 |
+
180: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.41.attn_output.weight
|
191 |
+
181: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.41.attn_q_a.weight
|
192 |
+
182: 1536 | 1536, 1, 1, 1 | F32 | blk.41.attn_q_a_norm.weight
|
193 |
+
183: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.41.attn_q_b.weight
|
194 |
+
184: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.41.ffn_down_exps.weight
|
195 |
+
185: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.41.ffn_down_shexp.weight
|
196 |
+
186: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.41.ffn_gate_exps.weight
|
197 |
+
187: 819200 | 5120, 160, 1, 1 | F32 | blk.41.ffn_gate_inp.weight
|
198 |
+
188: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.41.ffn_gate_shexp.weight
|
199 |
+
189: 5120 | 5120, 1, 1, 1 | F32 | blk.41.ffn_norm.weight
|
200 |
+
190: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.41.ffn_up_exps.weight
|
201 |
+
191: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.41.ffn_up_shexp.weight
|
202 |
+
192: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.42.attn_kv_a_mqa.weight
|
203 |
+
193: 512 | 512, 1, 1, 1 | F32 | blk.42.attn_kv_a_norm.weight
|
204 |
+
194: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.42.attn_kv_b.weight
|
205 |
+
195: 5120 | 5120, 1, 1, 1 | F32 | blk.42.attn_norm.weight
|
206 |
+
196: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.42.attn_output.weight
|
207 |
+
197: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.42.attn_q_a.weight
|
208 |
+
198: 1536 | 1536, 1, 1, 1 | F32 | blk.42.attn_q_a_norm.weight
|
209 |
+
199: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.42.attn_q_b.weight
|
210 |
+
200: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.42.ffn_down_exps.weight
|
211 |
+
201: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.42.ffn_down_shexp.weight
|
212 |
+
202: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.42.ffn_gate_exps.weight
|
213 |
+
203: 819200 | 5120, 160, 1, 1 | F32 | blk.42.ffn_gate_inp.weight
|
214 |
+
204: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.42.ffn_gate_shexp.weight
|
215 |
+
205: 5120 | 5120, 1, 1, 1 | F32 | blk.42.ffn_norm.weight
|
216 |
+
206: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.42.ffn_up_exps.weight
|
217 |
+
207: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.42.ffn_up_shexp.weight
|
218 |
+
208: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.43.attn_kv_a_mqa.weight
|
219 |
+
209: 512 | 512, 1, 1, 1 | F32 | blk.43.attn_kv_a_norm.weight
|
220 |
+
210: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.43.attn_kv_b.weight
|
221 |
+
211: 5120 | 5120, 1, 1, 1 | F32 | blk.43.attn_norm.weight
|
222 |
+
212: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.43.attn_output.weight
|
223 |
+
213: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.43.attn_q_a.weight
|
224 |
+
214: 1536 | 1536, 1, 1, 1 | F32 | blk.43.attn_q_a_norm.weight
|
225 |
+
215: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.43.attn_q_b.weight
|
226 |
+
216: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.43.ffn_down_exps.weight
|
227 |
+
217: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.43.ffn_down_shexp.weight
|
228 |
+
218: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.43.ffn_gate_exps.weight
|
229 |
+
219: 819200 | 5120, 160, 1, 1 | F32 | blk.43.ffn_gate_inp.weight
|
230 |
+
220: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.43.ffn_gate_shexp.weight
|
231 |
+
221: 5120 | 5120, 1, 1, 1 | F32 | blk.43.ffn_norm.weight
|
232 |
+
222: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.43.ffn_up_exps.weight
|
233 |
+
223: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.43.ffn_up_shexp.weight
|
234 |
+
224: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.44.attn_kv_a_mqa.weight
|
235 |
+
225: 512 | 512, 1, 1, 1 | F32 | blk.44.attn_kv_a_norm.weight
|
236 |
+
226: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.44.attn_kv_b.weight
|
237 |
+
227: 5120 | 5120, 1, 1, 1 | F32 | blk.44.attn_norm.weight
|
238 |
+
228: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.44.attn_output.weight
|
239 |
+
229: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.44.attn_q_a.weight
|
240 |
+
230: 1536 | 1536, 1, 1, 1 | F32 | blk.44.attn_q_a_norm.weight
|
241 |
+
231: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.44.attn_q_b.weight
|
242 |
+
232: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.44.ffn_down_exps.weight
|
243 |
+
233: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.44.ffn_down_shexp.weight
|
244 |
+
234: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.44.ffn_gate_exps.weight
|
245 |
+
235: 819200 | 5120, 160, 1, 1 | F32 | blk.44.ffn_gate_inp.weight
|
246 |
+
236: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.44.ffn_gate_shexp.weight
|
247 |
+
237: 5120 | 5120, 1, 1, 1 | F32 | blk.44.ffn_norm.weight
|
248 |
+
238: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.44.ffn_up_exps.weight
|
249 |
+
239: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.44.ffn_up_shexp.weight
|
250 |
+
240: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.45.attn_kv_a_mqa.weight
|
251 |
+
241: 512 | 512, 1, 1, 1 | F32 | blk.45.attn_kv_a_norm.weight
|
252 |
+
242: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.45.attn_kv_b.weight
|
253 |
+
243: 5120 | 5120, 1, 1, 1 | F32 | blk.45.attn_norm.weight
|
254 |
+
244: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.45.attn_output.weight
|
255 |
+
245: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.45.attn_q_a.weight
|
256 |
+
246: 1536 | 1536, 1, 1, 1 | F32 | blk.45.attn_q_a_norm.weight
|
257 |
+
247: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.45.attn_q_b.weight
|
258 |
+
248: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.45.ffn_down_exps.weight
|
259 |
+
249: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.45.ffn_down_shexp.weight
|
260 |
+
250: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.45.ffn_gate_exps.weight
|
261 |
+
251: 819200 | 5120, 160, 1, 1 | F32 | blk.45.ffn_gate_inp.weight
|
262 |
+
252: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.45.ffn_gate_shexp.weight
|
263 |
+
253: 5120 | 5120, 1, 1, 1 | F32 | blk.45.ffn_norm.weight
|
264 |
+
254: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.45.ffn_up_exps.weight
|
265 |
+
255: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.45.ffn_up_shexp.weight
|
266 |
+
256: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.46.attn_kv_a_mqa.weight
|
267 |
+
257: 512 | 512, 1, 1, 1 | F32 | blk.46.attn_kv_a_norm.weight
|
268 |
+
258: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.46.attn_kv_b.weight
|
269 |
+
259: 5120 | 5120, 1, 1, 1 | F32 | blk.46.attn_norm.weight
|
270 |
+
260: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.46.attn_output.weight
|
271 |
+
261: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.46.attn_q_a.weight
|
272 |
+
262: 1536 | 1536, 1, 1, 1 | F32 | blk.46.attn_q_a_norm.weight
|
273 |
+
263: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.46.attn_q_b.weight
|
274 |
+
264: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.46.ffn_down_exps.weight
|
275 |
+
265: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.46.ffn_down_shexp.weight
|
276 |
+
266: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.46.ffn_gate_exps.weight
|
277 |
+
267: 819200 | 5120, 160, 1, 1 | F32 | blk.46.ffn_gate_inp.weight
|
278 |
+
268: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.46.ffn_gate_shexp.weight
|
279 |
+
269: 5120 | 5120, 1, 1, 1 | F32 | blk.46.ffn_norm.weight
|
280 |
+
270: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.46.ffn_up_exps.weight
|
281 |
+
271: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.46.ffn_up_shexp.weight
|
282 |
+
272: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.47.attn_kv_a_mqa.weight
|
283 |
+
273: 512 | 512, 1, 1, 1 | F32 | blk.47.attn_kv_a_norm.weight
|
284 |
+
274: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.47.attn_kv_b.weight
|
285 |
+
275: 5120 | 5120, 1, 1, 1 | F32 | blk.47.attn_norm.weight
|
286 |
+
276: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.47.attn_output.weight
|
287 |
+
277: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.47.attn_q_a.weight
|
288 |
+
278: 1536 | 1536, 1, 1, 1 | F32 | blk.47.attn_q_a_norm.weight
|
289 |
+
279: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.47.attn_q_b.weight
|
290 |
+
280: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.47.ffn_down_exps.weight
|
291 |
+
281: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.47.ffn_down_shexp.weight
|
292 |
+
282: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.47.ffn_gate_exps.weight
|
293 |
+
283: 819200 | 5120, 160, 1, 1 | F32 | blk.47.ffn_gate_inp.weight
|
294 |
+
284: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.47.ffn_gate_shexp.weight
|
295 |
+
285: 5120 | 5120, 1, 1, 1 | F32 | blk.47.ffn_norm.weight
|
296 |
+
286: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.47.ffn_up_exps.weight
|
297 |
+
287: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.47.ffn_up_shexp.weight
|
298 |
+
288: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.48.attn_kv_a_mqa.weight
|
299 |
+
289: 512 | 512, 1, 1, 1 | F32 | blk.48.attn_kv_a_norm.weight
|
300 |
+
290: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.48.attn_kv_b.weight
|
301 |
+
291: 5120 | 5120, 1, 1, 1 | F32 | blk.48.attn_norm.weight
|
302 |
+
292: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.48.attn_output.weight
|
303 |
+
293: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.48.attn_q_a.weight
|
304 |
+
294: 1536 | 1536, 1, 1, 1 | F32 | blk.48.attn_q_a_norm.weight
|
305 |
+
295: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.48.attn_q_b.weight
|
306 |
+
296: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.48.ffn_down_exps.weight
|
307 |
+
297: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.48.ffn_down_shexp.weight
|
308 |
+
298: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.48.ffn_gate_exps.weight
|
309 |
+
299: 819200 | 5120, 160, 1, 1 | F32 | blk.48.ffn_gate_inp.weight
|
310 |
+
300: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.48.ffn_gate_shexp.weight
|
311 |
+
301: 5120 | 5120, 1, 1, 1 | F32 | blk.48.ffn_norm.weight
|
312 |
+
302: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.48.ffn_up_exps.weight
|
313 |
+
303: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.48.ffn_up_shexp.weight
|
314 |
+
304: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.49.attn_kv_a_mqa.weight
|
315 |
+
305: 512 | 512, 1, 1, 1 | F32 | blk.49.attn_kv_a_norm.weight
|
316 |
+
306: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.49.attn_kv_b.weight
|
317 |
+
307: 5120 | 5120, 1, 1, 1 | F32 | blk.49.attn_norm.weight
|
318 |
+
308: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.49.attn_output.weight
|
319 |
+
309: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.49.attn_q_a.weight
|
320 |
+
310: 1536 | 1536, 1, 1, 1 | F32 | blk.49.attn_q_a_norm.weight
|
321 |
+
311: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.49.attn_q_b.weight
|
322 |
+
312: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.49.ffn_down_exps.weight
|
323 |
+
313: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.49.ffn_down_shexp.weight
|
324 |
+
314: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.49.ffn_gate_exps.weight
|
325 |
+
315: 819200 | 5120, 160, 1, 1 | F32 | blk.49.ffn_gate_inp.weight
|
326 |
+
316: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.49.ffn_gate_shexp.weight
|
327 |
+
317: 5120 | 5120, 1, 1, 1 | F32 | blk.49.ffn_norm.weight
|
328 |
+
318: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.49.ffn_up_exps.weight
|
329 |
+
319: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.49.ffn_up_shexp.weight
|
330 |
+
320: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.50.attn_kv_a_mqa.weight
|
331 |
+
321: 512 | 512, 1, 1, 1 | F32 | blk.50.attn_kv_a_norm.weight
|
332 |
+
322: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.50.attn_kv_b.weight
|
333 |
+
323: 5120 | 5120, 1, 1, 1 | F32 | blk.50.attn_norm.weight
|
334 |
+
324: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.50.attn_output.weight
|
335 |
+
325: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.50.attn_q_a.weight
|
336 |
+
326: 1536 | 1536, 1, 1, 1 | F32 | blk.50.attn_q_a_norm.weight
|
337 |
+
327: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.50.attn_q_b.weight
|
338 |
+
328: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.50.ffn_down_exps.weight
|
339 |
+
329: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.50.ffn_down_shexp.weight
|
340 |
+
330: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.50.ffn_gate_exps.weight
|
341 |
+
331: 819200 | 5120, 160, 1, 1 | F32 | blk.50.ffn_gate_inp.weight
|
342 |
+
332: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.50.ffn_gate_shexp.weight
|
343 |
+
333: 5120 | 5120, 1, 1, 1 | F32 | blk.50.ffn_norm.weight
|
344 |
+
334: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.50.ffn_up_exps.weight
|
345 |
+
335: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.50.ffn_up_shexp.weight
|
346 |
+
336: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.51.attn_kv_a_mqa.weight
|
347 |
+
337: 512 | 512, 1, 1, 1 | F32 | blk.51.attn_kv_a_norm.weight
|
348 |
+
338: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.51.attn_kv_b.weight
|
349 |
+
339: 5120 | 5120, 1, 1, 1 | F32 | blk.51.attn_norm.weight
|
350 |
+
340: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.51.attn_output.weight
|
351 |
+
341: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.51.attn_q_a.weight
|
352 |
+
342: 1536 | 1536, 1, 1, 1 | F32 | blk.51.attn_q_a_norm.weight
|
353 |
+
343: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.51.attn_q_b.weight
|
354 |
+
344: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.51.ffn_down_exps.weight
|
355 |
+
345: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.51.ffn_down_shexp.weight
|
356 |
+
346: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.51.ffn_gate_exps.weight
|
357 |
+
347: 819200 | 5120, 160, 1, 1 | F32 | blk.51.ffn_gate_inp.weight
|
358 |
+
348: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.51.ffn_gate_shexp.weight
|
359 |
+
349: 5120 | 5120, 1, 1, 1 | F32 | blk.51.ffn_norm.weight
|
360 |
+
350: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.51.ffn_up_exps.weight
|
361 |
+
351: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.51.ffn_up_shexp.weight
|
362 |
+
352: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.52.attn_kv_a_mqa.weight
|
363 |
+
353: 512 | 512, 1, 1, 1 | F32 | blk.52.attn_kv_a_norm.weight
|
364 |
+
354: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.52.attn_kv_b.weight
|
365 |
+
355: 5120 | 5120, 1, 1, 1 | F32 | blk.52.attn_norm.weight
|
366 |
+
356: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.52.attn_output.weight
|
367 |
+
357: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.52.attn_q_a.weight
|
368 |
+
358: 1536 | 1536, 1, 1, 1 | F32 | blk.52.attn_q_a_norm.weight
|
369 |
+
359: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.52.attn_q_b.weight
|
370 |
+
360: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.52.ffn_down_exps.weight
|
371 |
+
361: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.52.ffn_down_shexp.weight
|
372 |
+
362: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.52.ffn_gate_exps.weight
|
373 |
+
363: 819200 | 5120, 160, 1, 1 | F32 | blk.52.ffn_gate_inp.weight
|
374 |
+
364: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.52.ffn_gate_shexp.weight
|
375 |
+
365: 5120 | 5120, 1, 1, 1 | F32 | blk.52.ffn_norm.weight
|
376 |
+
366: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.52.ffn_up_exps.weight
|
377 |
+
367: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.52.ffn_up_shexp.weight
|
378 |
+
368: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.53.attn_kv_a_mqa.weight
|
379 |
+
369: 512 | 512, 1, 1, 1 | F32 | blk.53.attn_kv_a_norm.weight
|
380 |
+
370: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.53.attn_kv_b.weight
|
381 |
+
371: 5120 | 5120, 1, 1, 1 | F32 | blk.53.attn_norm.weight
|
382 |
+
372: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.53.attn_output.weight
|
383 |
+
373: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.53.attn_q_a.weight
|
384 |
+
374: 1536 | 1536, 1, 1, 1 | F32 | blk.53.attn_q_a_norm.weight
|
385 |
+
375: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.53.attn_q_b.weight
|
386 |
+
376: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.53.ffn_down_exps.weight
|
387 |
+
377: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.53.ffn_down_shexp.weight
|
388 |
+
378: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.53.ffn_gate_exps.weight
|
389 |
+
379: 819200 | 5120, 160, 1, 1 | F32 | blk.53.ffn_gate_inp.weight
|
390 |
+
380: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.53.ffn_gate_shexp.weight
|
391 |
+
381: 5120 | 5120, 1, 1, 1 | F32 | blk.53.ffn_norm.weight
|
392 |
+
382: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.53.ffn_up_exps.weight
|
393 |
+
383: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.53.ffn_up_shexp.weight
|
394 |
+
384: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.54.attn_kv_a_mqa.weight
|
395 |
+
385: 512 | 512, 1, 1, 1 | F32 | blk.54.attn_kv_a_norm.weight
|
396 |
+
386: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.54.attn_kv_b.weight
|
397 |
+
387: 5120 | 5120, 1, 1, 1 | F32 | blk.54.attn_norm.weight
|
398 |
+
388: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.54.attn_output.weight
|
399 |
+
389: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.54.attn_q_a.weight
|
400 |
+
390: 1536 | 1536, 1, 1, 1 | F32 | blk.54.attn_q_a_norm.weight
|
401 |
+
391: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.54.attn_q_b.weight
|
402 |
+
392: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.54.ffn_down_exps.weight
|
403 |
+
393: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.54.ffn_down_shexp.weight
|
404 |
+
394: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.54.ffn_gate_exps.weight
|
405 |
+
395: 819200 | 5120, 160, 1, 1 | F32 | blk.54.ffn_gate_inp.weight
|
406 |
+
396: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.54.ffn_gate_shexp.weight
|
407 |
+
397: 5120 | 5120, 1, 1, 1 | F32 | blk.54.ffn_norm.weight
|
408 |
+
398: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.54.ffn_up_exps.weight
|
409 |
+
399: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.54.ffn_up_shexp.weight
|
410 |
+
400: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.55.attn_kv_a_mqa.weight
|
411 |
+
401: 512 | 512, 1, 1, 1 | F32 | blk.55.attn_kv_a_norm.weight
|
412 |
+
402: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.55.attn_kv_b.weight
|
413 |
+
403: 5120 | 5120, 1, 1, 1 | F32 | blk.55.attn_norm.weight
|
414 |
+
404: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.55.attn_output.weight
|
415 |
+
405: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.55.attn_q_a.weight
|
416 |
+
406: 1536 | 1536, 1, 1, 1 | F32 | blk.55.attn_q_a_norm.weight
|
417 |
+
407: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.55.attn_q_b.weight
|
418 |
+
408: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.55.ffn_down_exps.weight
|
419 |
+
409: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.55.ffn_down_shexp.weight
|
420 |
+
410: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.55.ffn_gate_exps.weight
|
421 |
+
411: 819200 | 5120, 160, 1, 1 | F32 | blk.55.ffn_gate_inp.weight
|
422 |
+
412: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.55.ffn_gate_shexp.weight
|
423 |
+
413: 5120 | 5120, 1, 1, 1 | F32 | blk.55.ffn_norm.weight
|
424 |
+
414: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.55.ffn_up_exps.weight
|
425 |
+
415: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.55.ffn_up_shexp.weight
|
426 |
+
416: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.56.attn_kv_a_mqa.weight
|
427 |
+
417: 512 | 512, 1, 1, 1 | F32 | blk.56.attn_kv_a_norm.weight
|
428 |
+
418: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.56.attn_kv_b.weight
|
429 |
+
419: 5120 | 5120, 1, 1, 1 | F32 | blk.56.attn_norm.weight
|
430 |
+
420: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.56.attn_output.weight
|
431 |
+
421: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.56.attn_q_a.weight
|
432 |
+
422: 1536 | 1536, 1, 1, 1 | F32 | blk.56.attn_q_a_norm.weight
|
433 |
+
423: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.56.attn_q_b.weight
|
434 |
+
424: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.56.ffn_down_exps.weight
|
435 |
+
425: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.56.ffn_down_shexp.weight
|
436 |
+
426: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.56.ffn_gate_exps.weight
|
437 |
+
427: 819200 | 5120, 160, 1, 1 | F32 | blk.56.ffn_gate_inp.weight
|
438 |
+
428: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.56.ffn_gate_shexp.weight
|
439 |
+
429: 5120 | 5120, 1, 1, 1 | F32 | blk.56.ffn_norm.weight
|
440 |
+
430: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.56.ffn_up_exps.weight
|
441 |
+
431: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.56.ffn_up_shexp.weight
|
442 |
+
432: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.57.attn_kv_a_mqa.weight
|
443 |
+
433: 512 | 512, 1, 1, 1 | F32 | blk.57.attn_kv_a_norm.weight
|
444 |
+
434: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.57.attn_kv_b.weight
|
445 |
+
435: 5120 | 5120, 1, 1, 1 | F32 | blk.57.attn_norm.weight
|
446 |
+
436: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.57.attn_output.weight
|
447 |
+
437: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.57.attn_q_a.weight
|
448 |
+
438: 1536 | 1536, 1, 1, 1 | F32 | blk.57.attn_q_a_norm.weight
|
449 |
+
439: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.57.attn_q_b.weight
|
450 |
+
440: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.57.ffn_down_exps.weight
|
451 |
+
441: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.57.ffn_down_shexp.weight
|
452 |
+
442: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.57.ffn_gate_exps.weight
|
453 |
+
443: 819200 | 5120, 160, 1, 1 | F32 | blk.57.ffn_gate_inp.weight
|
454 |
+
444: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.57.ffn_gate_shexp.weight
|
455 |
+
445: 5120 | 5120, 1, 1, 1 | F32 | blk.57.ffn_norm.weight
|
456 |
+
446: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.57.ffn_up_exps.weight
|
457 |
+
447: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.57.ffn_up_shexp.weight
|
458 |
+
448: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.58.attn_kv_a_mqa.weight
|
459 |
+
449: 512 | 512, 1, 1, 1 | F32 | blk.58.attn_kv_a_norm.weight
|
460 |
+
450: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.58.attn_kv_b.weight
|
461 |
+
451: 5120 | 5120, 1, 1, 1 | F32 | blk.58.attn_norm.weight
|
462 |
+
452: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.58.attn_output.weight
|
463 |
+
453: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.58.attn_q_a.weight
|
464 |
+
454: 1536 | 1536, 1, 1, 1 | F32 | blk.58.attn_q_a_norm.weight
|
465 |
+
455: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.58.attn_q_b.weight
|
466 |
+
456: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.58.ffn_down_exps.weight
|
467 |
+
457: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.58.ffn_down_shexp.weight
|
468 |
+
458: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.58.ffn_gate_exps.weight
|
469 |
+
459: 819200 | 5120, 160, 1, 1 | F32 | blk.58.ffn_gate_inp.weight
|
470 |
+
460: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.58.ffn_gate_shexp.weight
|
471 |
+
461: 5120 | 5120, 1, 1, 1 | F32 | blk.58.ffn_norm.weight
|
472 |
+
462: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.58.ffn_up_exps.weight
|
473 |
+
463: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.58.ffn_up_shexp.weight
|
474 |
+
464: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.59.attn_kv_a_mqa.weight
|
475 |
+
465: 512 | 512, 1, 1, 1 | F32 | blk.59.attn_kv_a_norm.weight
|
476 |
+
466: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.59.attn_kv_b.weight
|
477 |
+
467: 5120 | 5120, 1, 1, 1 | F32 | blk.59.attn_norm.weight
|
478 |
+
468: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.59.attn_output.weight
|
479 |
+
469: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.59.attn_q_a.weight
|
480 |
+
470: 1536 | 1536, 1, 1, 1 | F32 | blk.59.attn_q_a_norm.weight
|
481 |
+
471: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.59.attn_q_b.weight
|
482 |
+
472: 1258291200 | 1536, 5120, 160, 1 | IQ1_S | blk.59.ffn_down_exps.weight
|
483 |
+
473: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.59.ffn_down_shexp.weight
|
484 |
+
474: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.59.ffn_gate_exps.weight
|
485 |
+
475: 819200 | 5120, 160, 1, 1 | F32 | blk.59.ffn_gate_inp.weight
|
486 |
+
476: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.59.ffn_gate_shexp.weight
|
487 |
+
477: 5120 | 5120, 1, 1, 1 | F32 | blk.59.ffn_norm.weight
|
488 |
+
478: 1258291200 | 5120, 1536, 160, 1 | IQ1_S | blk.59.ffn_up_exps.weight
|
489 |
+
479: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.59.ffn_up_shexp.weight
|
DeepSeek-v2.5-1210-UD-iq2_s-00001-of-00002.gguf.tensors.txt
ADDED
@@ -0,0 +1,540 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
INFO:gguf-dump:* Loading: DeepSeek-v2.5-1210-UD-iq2_s-00001-of-00002.gguf
|
2 |
+
* File is LITTLE endian, script is running on a LITTLE endian host.
|
3 |
+
* Dumping 56 key/value pair(s)
|
4 |
+
1: UINT32 | 1 | GGUF.version = 3
|
5 |
+
2: UINT64 | 1 | GGUF.tensor_count = 480
|
6 |
+
3: UINT64 | 1 | GGUF.kv_count = 53
|
7 |
+
4: STRING | 1 | general.architecture = 'deepseek2'
|
8 |
+
5: STRING | 1 | general.type = 'model'
|
9 |
+
6: STRING | 1 | general.name = 'Dsv25'
|
10 |
+
7: STRING | 1 | general.size_label = '160x14B'
|
11 |
+
8: STRING | 1 | general.license = 'other'
|
12 |
+
9: STRING | 1 | general.license.name = 'deepseek'
|
13 |
+
10: STRING | 1 | general.license.link = 'https://github.com/deepseek-ai/DeepSeek-V2/blob/main/LICENSE'
|
14 |
+
11: UINT32 | 1 | deepseek2.block_count = 60
|
15 |
+
12: UINT32 | 1 | deepseek2.context_length = 163840
|
16 |
+
13: UINT32 | 1 | deepseek2.embedding_length = 5120
|
17 |
+
14: UINT32 | 1 | deepseek2.feed_forward_length = 12288
|
18 |
+
15: UINT32 | 1 | deepseek2.attention.head_count = 128
|
19 |
+
16: UINT32 | 1 | deepseek2.attention.head_count_kv = 128
|
20 |
+
17: FLOAT32 | 1 | deepseek2.rope.freq_base = 10000.0
|
21 |
+
18: FLOAT32 | 1 | deepseek2.attention.layer_norm_rms_epsilon = 9.999999974752427e-07
|
22 |
+
19: UINT32 | 1 | deepseek2.expert_used_count = 6
|
23 |
+
20: UINT32 | 1 | deepseek2.leading_dense_block_count = 1
|
24 |
+
21: UINT32 | 1 | deepseek2.vocab_size = 102400
|
25 |
+
22: UINT32 | 1 | deepseek2.attention.q_lora_rank = 1536
|
26 |
+
23: UINT32 | 1 | deepseek2.attention.kv_lora_rank = 512
|
27 |
+
24: UINT32 | 1 | deepseek2.attention.key_length = 192
|
28 |
+
25: UINT32 | 1 | deepseek2.attention.value_length = 128
|
29 |
+
26: UINT32 | 1 | deepseek2.expert_feed_forward_length = 1536
|
30 |
+
27: UINT32 | 1 | deepseek2.expert_count = 160
|
31 |
+
28: UINT32 | 1 | deepseek2.expert_shared_count = 2
|
32 |
+
29: FLOAT32 | 1 | deepseek2.expert_weights_scale = 16.0
|
33 |
+
30: BOOL | 1 | deepseek2.expert_weights_norm = False
|
34 |
+
31: UINT32 | 1 | deepseek2.expert_gating_func = 1
|
35 |
+
32: UINT32 | 1 | deepseek2.rope.dimension_count = 64
|
36 |
+
33: STRING | 1 | deepseek2.rope.scaling.type = 'yarn'
|
37 |
+
34: FLOAT32 | 1 | deepseek2.rope.scaling.factor = 40.0
|
38 |
+
35: UINT32 | 1 | deepseek2.rope.scaling.original_context_length = 4096
|
39 |
+
36: FLOAT32 | 1 | deepseek2.rope.scaling.yarn_log_multiplier = 0.10000000149011612
|
40 |
+
37: STRING | 1 | tokenizer.ggml.model = 'gpt2'
|
41 |
+
38: STRING | 1 | tokenizer.ggml.pre = 'deepseek-llm'
|
42 |
+
39: [STRING] | 102400 | tokenizer.ggml.tokens
|
43 |
+
40: [INT32] | 102400 | tokenizer.ggml.token_type
|
44 |
+
41: [STRING] | 99757 | tokenizer.ggml.merges
|
45 |
+
42: UINT32 | 1 | tokenizer.ggml.bos_token_id = 100000
|
46 |
+
43: UINT32 | 1 | tokenizer.ggml.eos_token_id = 100001
|
47 |
+
44: UINT32 | 1 | tokenizer.ggml.padding_token_id = 100001
|
48 |
+
45: BOOL | 1 | tokenizer.ggml.add_bos_token = True
|
49 |
+
46: BOOL | 1 | tokenizer.ggml.add_eos_token = False
|
50 |
+
47: STRING | 1 | tokenizer.chat_template = '{% if not add_generation_prompt is defined %}{% set add_gene'
|
51 |
+
48: UINT32 | 1 | general.quantization_version = 2
|
52 |
+
49: UINT32 | 1 | general.file_type = 28
|
53 |
+
50: STRING | 1 | quantize.imatrix.file = '/archive/nuc/LLM/raw/imatrix-DeepSeek-V2.5-1210-bartowski.da'
|
54 |
+
51: STRING | 1 | quantize.imatrix.dataset = '/training_dir/calibration_datav3.txt'
|
55 |
+
52: INT32 | 1 | quantize.imatrix.entries_count = 716
|
56 |
+
53: INT32 | 1 | quantize.imatrix.chunks_count = 139
|
57 |
+
54: UINT16 | 1 | split.no = 0
|
58 |
+
55: INT32 | 1 | split.tensors.count = 959
|
59 |
+
56: UINT16 | 1 | split.count = 2
|
60 |
+
* Dumping 480 tensor(s)
|
61 |
+
1: 524288000 | 5120, 102400, 1, 1 | Q6_K | output.weight
|
62 |
+
2: 5120 | 5120, 1, 1, 1 | F32 | output_norm.weight
|
63 |
+
3: 524288000 | 5120, 102400, 1, 1 | Q6_K | token_embd.weight
|
64 |
+
4: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.0.attn_kv_a_mqa.weight
|
65 |
+
5: 512 | 512, 1, 1, 1 | F32 | blk.0.attn_kv_a_norm.weight
|
66 |
+
6: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.0.attn_kv_b.weight
|
67 |
+
7: 5120 | 5120, 1, 1, 1 | F32 | blk.0.attn_norm.weight
|
68 |
+
8: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.0.attn_output.weight
|
69 |
+
9: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.0.attn_q_a.weight
|
70 |
+
10: 1536 | 1536, 1, 1, 1 | F32 | blk.0.attn_q_a_norm.weight
|
71 |
+
11: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.0.attn_q_b.weight
|
72 |
+
12: 62914560 | 12288, 5120, 1, 1 | Q6_K | blk.0.ffn_down.weight
|
73 |
+
13: 62914560 | 5120, 12288, 1, 1 | Q4_K | blk.0.ffn_gate.weight
|
74 |
+
14: 5120 | 5120, 1, 1, 1 | F32 | blk.0.ffn_norm.weight
|
75 |
+
15: 62914560 | 5120, 12288, 1, 1 | Q4_K | blk.0.ffn_up.weight
|
76 |
+
16: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.1.attn_kv_a_mqa.weight
|
77 |
+
17: 512 | 512, 1, 1, 1 | F32 | blk.1.attn_kv_a_norm.weight
|
78 |
+
18: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.1.attn_kv_b.weight
|
79 |
+
19: 5120 | 5120, 1, 1, 1 | F32 | blk.1.attn_norm.weight
|
80 |
+
20: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.1.attn_output.weight
|
81 |
+
21: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.1.attn_q_a.weight
|
82 |
+
22: 1536 | 1536, 1, 1, 1 | F32 | blk.1.attn_q_a_norm.weight
|
83 |
+
23: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.1.attn_q_b.weight
|
84 |
+
24: 1258291200 | 1536, 5120, 160, 1 | Q3_K | blk.1.ffn_down_exps.weight
|
85 |
+
25: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.1.ffn_down_shexp.weight
|
86 |
+
26: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.1.ffn_gate_exps.weight
|
87 |
+
27: 819200 | 5120, 160, 1, 1 | F32 | blk.1.ffn_gate_inp.weight
|
88 |
+
28: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.1.ffn_gate_shexp.weight
|
89 |
+
29: 5120 | 5120, 1, 1, 1 | F32 | blk.1.ffn_norm.weight
|
90 |
+
30: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.1.ffn_up_exps.weight
|
91 |
+
31: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.1.ffn_up_shexp.weight
|
92 |
+
32: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.2.attn_kv_a_mqa.weight
|
93 |
+
33: 512 | 512, 1, 1, 1 | F32 | blk.2.attn_kv_a_norm.weight
|
94 |
+
34: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.2.attn_kv_b.weight
|
95 |
+
35: 5120 | 5120, 1, 1, 1 | F32 | blk.2.attn_norm.weight
|
96 |
+
36: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.2.attn_output.weight
|
97 |
+
37: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.2.attn_q_a.weight
|
98 |
+
38: 1536 | 1536, 1, 1, 1 | F32 | blk.2.attn_q_a_norm.weight
|
99 |
+
39: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.2.attn_q_b.weight
|
100 |
+
40: 1258291200 | 1536, 5120, 160, 1 | Q3_K | blk.2.ffn_down_exps.weight
|
101 |
+
41: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.2.ffn_down_shexp.weight
|
102 |
+
42: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.2.ffn_gate_exps.weight
|
103 |
+
43: 819200 | 5120, 160, 1, 1 | F32 | blk.2.ffn_gate_inp.weight
|
104 |
+
44: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.2.ffn_gate_shexp.weight
|
105 |
+
45: 5120 | 5120, 1, 1, 1 | F32 | blk.2.ffn_norm.weight
|
106 |
+
46: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.2.ffn_up_exps.weight
|
107 |
+
47: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.2.ffn_up_shexp.weight
|
108 |
+
48: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.3.attn_kv_a_mqa.weight
|
109 |
+
49: 512 | 512, 1, 1, 1 | F32 | blk.3.attn_kv_a_norm.weight
|
110 |
+
50: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.3.attn_kv_b.weight
|
111 |
+
51: 5120 | 5120, 1, 1, 1 | F32 | blk.3.attn_norm.weight
|
112 |
+
52: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.3.attn_output.weight
|
113 |
+
53: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.3.attn_q_a.weight
|
114 |
+
54: 1536 | 1536, 1, 1, 1 | F32 | blk.3.attn_q_a_norm.weight
|
115 |
+
55: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.3.attn_q_b.weight
|
116 |
+
56: 1258291200 | 1536, 5120, 160, 1 | Q3_K | blk.3.ffn_down_exps.weight
|
117 |
+
57: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.3.ffn_down_shexp.weight
|
118 |
+
58: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.3.ffn_gate_exps.weight
|
119 |
+
59: 819200 | 5120, 160, 1, 1 | F32 | blk.3.ffn_gate_inp.weight
|
120 |
+
60: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.3.ffn_gate_shexp.weight
|
121 |
+
61: 5120 | 5120, 1, 1, 1 | F32 | blk.3.ffn_norm.weight
|
122 |
+
62: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.3.ffn_up_exps.weight
|
123 |
+
63: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.3.ffn_up_shexp.weight
|
124 |
+
64: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.4.attn_kv_a_mqa.weight
|
125 |
+
65: 512 | 512, 1, 1, 1 | F32 | blk.4.attn_kv_a_norm.weight
|
126 |
+
66: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.4.attn_kv_b.weight
|
127 |
+
67: 5120 | 5120, 1, 1, 1 | F32 | blk.4.attn_norm.weight
|
128 |
+
68: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.4.attn_output.weight
|
129 |
+
69: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.4.attn_q_a.weight
|
130 |
+
70: 1536 | 1536, 1, 1, 1 | F32 | blk.4.attn_q_a_norm.weight
|
131 |
+
71: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.4.attn_q_b.weight
|
132 |
+
72: 1258291200 | 1536, 5120, 160, 1 | Q3_K | blk.4.ffn_down_exps.weight
|
133 |
+
73: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.4.ffn_down_shexp.weight
|
134 |
+
74: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.4.ffn_gate_exps.weight
|
135 |
+
75: 819200 | 5120, 160, 1, 1 | F32 | blk.4.ffn_gate_inp.weight
|
136 |
+
76: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.4.ffn_gate_shexp.weight
|
137 |
+
77: 5120 | 5120, 1, 1, 1 | F32 | blk.4.ffn_norm.weight
|
138 |
+
78: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.4.ffn_up_exps.weight
|
139 |
+
79: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.4.ffn_up_shexp.weight
|
140 |
+
80: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.5.attn_kv_a_mqa.weight
|
141 |
+
81: 512 | 512, 1, 1, 1 | F32 | blk.5.attn_kv_a_norm.weight
|
142 |
+
82: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.5.attn_kv_b.weight
|
143 |
+
83: 5120 | 5120, 1, 1, 1 | F32 | blk.5.attn_norm.weight
|
144 |
+
84: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.5.attn_output.weight
|
145 |
+
85: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.5.attn_q_a.weight
|
146 |
+
86: 1536 | 1536, 1, 1, 1 | F32 | blk.5.attn_q_a_norm.weight
|
147 |
+
87: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.5.attn_q_b.weight
|
148 |
+
88: 1258291200 | 1536, 5120, 160, 1 | Q3_K | blk.5.ffn_down_exps.weight
|
149 |
+
89: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.5.ffn_down_shexp.weight
|
150 |
+
90: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.5.ffn_gate_exps.weight
|
151 |
+
91: 819200 | 5120, 160, 1, 1 | F32 | blk.5.ffn_gate_inp.weight
|
152 |
+
92: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.5.ffn_gate_shexp.weight
|
153 |
+
93: 5120 | 5120, 1, 1, 1 | F32 | blk.5.ffn_norm.weight
|
154 |
+
94: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.5.ffn_up_exps.weight
|
155 |
+
95: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.5.ffn_up_shexp.weight
|
156 |
+
96: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.6.attn_kv_a_mqa.weight
|
157 |
+
97: 512 | 512, 1, 1, 1 | F32 | blk.6.attn_kv_a_norm.weight
|
158 |
+
98: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.6.attn_kv_b.weight
|
159 |
+
99: 5120 | 5120, 1, 1, 1 | F32 | blk.6.attn_norm.weight
|
160 |
+
100: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.6.attn_output.weight
|
161 |
+
101: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.6.attn_q_a.weight
|
162 |
+
102: 1536 | 1536, 1, 1, 1 | F32 | blk.6.attn_q_a_norm.weight
|
163 |
+
103: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.6.attn_q_b.weight
|
164 |
+
104: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.6.ffn_down_exps.weight
|
165 |
+
105: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.6.ffn_down_shexp.weight
|
166 |
+
106: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.6.ffn_gate_exps.weight
|
167 |
+
107: 819200 | 5120, 160, 1, 1 | F32 | blk.6.ffn_gate_inp.weight
|
168 |
+
108: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.6.ffn_gate_shexp.weight
|
169 |
+
109: 5120 | 5120, 1, 1, 1 | F32 | blk.6.ffn_norm.weight
|
170 |
+
110: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.6.ffn_up_exps.weight
|
171 |
+
111: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.6.ffn_up_shexp.weight
|
172 |
+
112: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.7.attn_kv_a_mqa.weight
|
173 |
+
113: 512 | 512, 1, 1, 1 | F32 | blk.7.attn_kv_a_norm.weight
|
174 |
+
114: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.7.attn_kv_b.weight
|
175 |
+
115: 5120 | 5120, 1, 1, 1 | F32 | blk.7.attn_norm.weight
|
176 |
+
116: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.7.attn_output.weight
|
177 |
+
117: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.7.attn_q_a.weight
|
178 |
+
118: 1536 | 1536, 1, 1, 1 | F32 | blk.7.attn_q_a_norm.weight
|
179 |
+
119: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.7.attn_q_b.weight
|
180 |
+
120: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.7.ffn_down_exps.weight
|
181 |
+
121: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.7.ffn_down_shexp.weight
|
182 |
+
122: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.7.ffn_gate_exps.weight
|
183 |
+
123: 819200 | 5120, 160, 1, 1 | F32 | blk.7.ffn_gate_inp.weight
|
184 |
+
124: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.7.ffn_gate_shexp.weight
|
185 |
+
125: 5120 | 5120, 1, 1, 1 | F32 | blk.7.ffn_norm.weight
|
186 |
+
126: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.7.ffn_up_exps.weight
|
187 |
+
127: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.7.ffn_up_shexp.weight
|
188 |
+
128: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.8.attn_kv_a_mqa.weight
|
189 |
+
129: 512 | 512, 1, 1, 1 | F32 | blk.8.attn_kv_a_norm.weight
|
190 |
+
130: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.8.attn_kv_b.weight
|
191 |
+
131: 5120 | 5120, 1, 1, 1 | F32 | blk.8.attn_norm.weight
|
192 |
+
132: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.8.attn_output.weight
|
193 |
+
133: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.8.attn_q_a.weight
|
194 |
+
134: 1536 | 1536, 1, 1, 1 | F32 | blk.8.attn_q_a_norm.weight
|
195 |
+
135: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.8.attn_q_b.weight
|
196 |
+
136: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.8.ffn_down_exps.weight
|
197 |
+
137: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.8.ffn_down_shexp.weight
|
198 |
+
138: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.8.ffn_gate_exps.weight
|
199 |
+
139: 819200 | 5120, 160, 1, 1 | F32 | blk.8.ffn_gate_inp.weight
|
200 |
+
140: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.8.ffn_gate_shexp.weight
|
201 |
+
141: 5120 | 5120, 1, 1, 1 | F32 | blk.8.ffn_norm.weight
|
202 |
+
142: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.8.ffn_up_exps.weight
|
203 |
+
143: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.8.ffn_up_shexp.weight
|
204 |
+
144: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.9.attn_kv_a_mqa.weight
|
205 |
+
145: 512 | 512, 1, 1, 1 | F32 | blk.9.attn_kv_a_norm.weight
|
206 |
+
146: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.9.attn_kv_b.weight
|
207 |
+
147: 5120 | 5120, 1, 1, 1 | F32 | blk.9.attn_norm.weight
|
208 |
+
148: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.9.attn_output.weight
|
209 |
+
149: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.9.attn_q_a.weight
|
210 |
+
150: 1536 | 1536, 1, 1, 1 | F32 | blk.9.attn_q_a_norm.weight
|
211 |
+
151: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.9.attn_q_b.weight
|
212 |
+
152: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.9.ffn_down_exps.weight
|
213 |
+
153: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.9.ffn_down_shexp.weight
|
214 |
+
154: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.9.ffn_gate_exps.weight
|
215 |
+
155: 819200 | 5120, 160, 1, 1 | F32 | blk.9.ffn_gate_inp.weight
|
216 |
+
156: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.9.ffn_gate_shexp.weight
|
217 |
+
157: 5120 | 5120, 1, 1, 1 | F32 | blk.9.ffn_norm.weight
|
218 |
+
158: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.9.ffn_up_exps.weight
|
219 |
+
159: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.9.ffn_up_shexp.weight
|
220 |
+
160: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.10.attn_kv_a_mqa.weight
|
221 |
+
161: 512 | 512, 1, 1, 1 | F32 | blk.10.attn_kv_a_norm.weight
|
222 |
+
162: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.10.attn_kv_b.weight
|
223 |
+
163: 5120 | 5120, 1, 1, 1 | F32 | blk.10.attn_norm.weight
|
224 |
+
164: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.10.attn_output.weight
|
225 |
+
165: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.10.attn_q_a.weight
|
226 |
+
166: 1536 | 1536, 1, 1, 1 | F32 | blk.10.attn_q_a_norm.weight
|
227 |
+
167: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.10.attn_q_b.weight
|
228 |
+
168: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.10.ffn_down_exps.weight
|
229 |
+
169: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.10.ffn_down_shexp.weight
|
230 |
+
170: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.10.ffn_gate_exps.weight
|
231 |
+
171: 819200 | 5120, 160, 1, 1 | F32 | blk.10.ffn_gate_inp.weight
|
232 |
+
172: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.10.ffn_gate_shexp.weight
|
233 |
+
173: 5120 | 5120, 1, 1, 1 | F32 | blk.10.ffn_norm.weight
|
234 |
+
174: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.10.ffn_up_exps.weight
|
235 |
+
175: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.10.ffn_up_shexp.weight
|
236 |
+
176: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.11.attn_kv_a_mqa.weight
|
237 |
+
177: 512 | 512, 1, 1, 1 | F32 | blk.11.attn_kv_a_norm.weight
|
238 |
+
178: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.11.attn_kv_b.weight
|
239 |
+
179: 5120 | 5120, 1, 1, 1 | F32 | blk.11.attn_norm.weight
|
240 |
+
180: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.11.attn_output.weight
|
241 |
+
181: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.11.attn_q_a.weight
|
242 |
+
182: 1536 | 1536, 1, 1, 1 | F32 | blk.11.attn_q_a_norm.weight
|
243 |
+
183: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.11.attn_q_b.weight
|
244 |
+
184: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.11.ffn_down_exps.weight
|
245 |
+
185: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.11.ffn_down_shexp.weight
|
246 |
+
186: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.11.ffn_gate_exps.weight
|
247 |
+
187: 819200 | 5120, 160, 1, 1 | F32 | blk.11.ffn_gate_inp.weight
|
248 |
+
188: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.11.ffn_gate_shexp.weight
|
249 |
+
189: 5120 | 5120, 1, 1, 1 | F32 | blk.11.ffn_norm.weight
|
250 |
+
190: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.11.ffn_up_exps.weight
|
251 |
+
191: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.11.ffn_up_shexp.weight
|
252 |
+
192: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.12.attn_kv_a_mqa.weight
|
253 |
+
193: 512 | 512, 1, 1, 1 | F32 | blk.12.attn_kv_a_norm.weight
|
254 |
+
194: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.12.attn_kv_b.weight
|
255 |
+
195: 5120 | 5120, 1, 1, 1 | F32 | blk.12.attn_norm.weight
|
256 |
+
196: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.12.attn_output.weight
|
257 |
+
197: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.12.attn_q_a.weight
|
258 |
+
198: 1536 | 1536, 1, 1, 1 | F32 | blk.12.attn_q_a_norm.weight
|
259 |
+
199: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.12.attn_q_b.weight
|
260 |
+
200: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.12.ffn_down_exps.weight
|
261 |
+
201: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.12.ffn_down_shexp.weight
|
262 |
+
202: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.12.ffn_gate_exps.weight
|
263 |
+
203: 819200 | 5120, 160, 1, 1 | F32 | blk.12.ffn_gate_inp.weight
|
264 |
+
204: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.12.ffn_gate_shexp.weight
|
265 |
+
205: 5120 | 5120, 1, 1, 1 | F32 | blk.12.ffn_norm.weight
|
266 |
+
206: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.12.ffn_up_exps.weight
|
267 |
+
207: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.12.ffn_up_shexp.weight
|
268 |
+
208: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.13.attn_kv_a_mqa.weight
|
269 |
+
209: 512 | 512, 1, 1, 1 | F32 | blk.13.attn_kv_a_norm.weight
|
270 |
+
210: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.13.attn_kv_b.weight
|
271 |
+
211: 5120 | 5120, 1, 1, 1 | F32 | blk.13.attn_norm.weight
|
272 |
+
212: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.13.attn_output.weight
|
273 |
+
213: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.13.attn_q_a.weight
|
274 |
+
214: 1536 | 1536, 1, 1, 1 | F32 | blk.13.attn_q_a_norm.weight
|
275 |
+
215: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.13.attn_q_b.weight
|
276 |
+
216: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.13.ffn_down_exps.weight
|
277 |
+
217: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.13.ffn_down_shexp.weight
|
278 |
+
218: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.13.ffn_gate_exps.weight
|
279 |
+
219: 819200 | 5120, 160, 1, 1 | F32 | blk.13.ffn_gate_inp.weight
|
280 |
+
220: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.13.ffn_gate_shexp.weight
|
281 |
+
221: 5120 | 5120, 1, 1, 1 | F32 | blk.13.ffn_norm.weight
|
282 |
+
222: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.13.ffn_up_exps.weight
|
283 |
+
223: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.13.ffn_up_shexp.weight
|
284 |
+
224: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.14.attn_kv_a_mqa.weight
|
285 |
+
225: 512 | 512, 1, 1, 1 | F32 | blk.14.attn_kv_a_norm.weight
|
286 |
+
226: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.14.attn_kv_b.weight
|
287 |
+
227: 5120 | 5120, 1, 1, 1 | F32 | blk.14.attn_norm.weight
|
288 |
+
228: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.14.attn_output.weight
|
289 |
+
229: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.14.attn_q_a.weight
|
290 |
+
230: 1536 | 1536, 1, 1, 1 | F32 | blk.14.attn_q_a_norm.weight
|
291 |
+
231: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.14.attn_q_b.weight
|
292 |
+
232: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.14.ffn_down_exps.weight
|
293 |
+
233: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.14.ffn_down_shexp.weight
|
294 |
+
234: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.14.ffn_gate_exps.weight
|
295 |
+
235: 819200 | 5120, 160, 1, 1 | F32 | blk.14.ffn_gate_inp.weight
|
296 |
+
236: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.14.ffn_gate_shexp.weight
|
297 |
+
237: 5120 | 5120, 1, 1, 1 | F32 | blk.14.ffn_norm.weight
|
298 |
+
238: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.14.ffn_up_exps.weight
|
299 |
+
239: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.14.ffn_up_shexp.weight
|
300 |
+
240: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.15.attn_kv_a_mqa.weight
|
301 |
+
241: 512 | 512, 1, 1, 1 | F32 | blk.15.attn_kv_a_norm.weight
|
302 |
+
242: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.15.attn_kv_b.weight
|
303 |
+
243: 5120 | 5120, 1, 1, 1 | F32 | blk.15.attn_norm.weight
|
304 |
+
244: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.15.attn_output.weight
|
305 |
+
245: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.15.attn_q_a.weight
|
306 |
+
246: 1536 | 1536, 1, 1, 1 | F32 | blk.15.attn_q_a_norm.weight
|
307 |
+
247: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.15.attn_q_b.weight
|
308 |
+
248: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.15.ffn_down_exps.weight
|
309 |
+
249: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.15.ffn_down_shexp.weight
|
310 |
+
250: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.15.ffn_gate_exps.weight
|
311 |
+
251: 819200 | 5120, 160, 1, 1 | F32 | blk.15.ffn_gate_inp.weight
|
312 |
+
252: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.15.ffn_gate_shexp.weight
|
313 |
+
253: 5120 | 5120, 1, 1, 1 | F32 | blk.15.ffn_norm.weight
|
314 |
+
254: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.15.ffn_up_exps.weight
|
315 |
+
255: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.15.ffn_up_shexp.weight
|
316 |
+
256: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.16.attn_kv_a_mqa.weight
|
317 |
+
257: 512 | 512, 1, 1, 1 | F32 | blk.16.attn_kv_a_norm.weight
|
318 |
+
258: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.16.attn_kv_b.weight
|
319 |
+
259: 5120 | 5120, 1, 1, 1 | F32 | blk.16.attn_norm.weight
|
320 |
+
260: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.16.attn_output.weight
|
321 |
+
261: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.16.attn_q_a.weight
|
322 |
+
262: 1536 | 1536, 1, 1, 1 | F32 | blk.16.attn_q_a_norm.weight
|
323 |
+
263: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.16.attn_q_b.weight
|
324 |
+
264: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.16.ffn_down_exps.weight
|
325 |
+
265: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.16.ffn_down_shexp.weight
|
326 |
+
266: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.16.ffn_gate_exps.weight
|
327 |
+
267: 819200 | 5120, 160, 1, 1 | F32 | blk.16.ffn_gate_inp.weight
|
328 |
+
268: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.16.ffn_gate_shexp.weight
|
329 |
+
269: 5120 | 5120, 1, 1, 1 | F32 | blk.16.ffn_norm.weight
|
330 |
+
270: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.16.ffn_up_exps.weight
|
331 |
+
271: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.16.ffn_up_shexp.weight
|
332 |
+
272: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.17.attn_kv_a_mqa.weight
|
333 |
+
273: 512 | 512, 1, 1, 1 | F32 | blk.17.attn_kv_a_norm.weight
|
334 |
+
274: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.17.attn_kv_b.weight
|
335 |
+
275: 5120 | 5120, 1, 1, 1 | F32 | blk.17.attn_norm.weight
|
336 |
+
276: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.17.attn_output.weight
|
337 |
+
277: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.17.attn_q_a.weight
|
338 |
+
278: 1536 | 1536, 1, 1, 1 | F32 | blk.17.attn_q_a_norm.weight
|
339 |
+
279: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.17.attn_q_b.weight
|
340 |
+
280: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.17.ffn_down_exps.weight
|
341 |
+
281: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.17.ffn_down_shexp.weight
|
342 |
+
282: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.17.ffn_gate_exps.weight
|
343 |
+
283: 819200 | 5120, 160, 1, 1 | F32 | blk.17.ffn_gate_inp.weight
|
344 |
+
284: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.17.ffn_gate_shexp.weight
|
345 |
+
285: 5120 | 5120, 1, 1, 1 | F32 | blk.17.ffn_norm.weight
|
346 |
+
286: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.17.ffn_up_exps.weight
|
347 |
+
287: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.17.ffn_up_shexp.weight
|
348 |
+
288: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.18.attn_kv_a_mqa.weight
|
349 |
+
289: 512 | 512, 1, 1, 1 | F32 | blk.18.attn_kv_a_norm.weight
|
350 |
+
290: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.18.attn_kv_b.weight
|
351 |
+
291: 5120 | 5120, 1, 1, 1 | F32 | blk.18.attn_norm.weight
|
352 |
+
292: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.18.attn_output.weight
|
353 |
+
293: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.18.attn_q_a.weight
|
354 |
+
294: 1536 | 1536, 1, 1, 1 | F32 | blk.18.attn_q_a_norm.weight
|
355 |
+
295: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.18.attn_q_b.weight
|
356 |
+
296: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.18.ffn_down_exps.weight
|
357 |
+
297: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.18.ffn_down_shexp.weight
|
358 |
+
298: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.18.ffn_gate_exps.weight
|
359 |
+
299: 819200 | 5120, 160, 1, 1 | F32 | blk.18.ffn_gate_inp.weight
|
360 |
+
300: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.18.ffn_gate_shexp.weight
|
361 |
+
301: 5120 | 5120, 1, 1, 1 | F32 | blk.18.ffn_norm.weight
|
362 |
+
302: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.18.ffn_up_exps.weight
|
363 |
+
303: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.18.ffn_up_shexp.weight
|
364 |
+
304: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.19.attn_kv_a_mqa.weight
|
365 |
+
305: 512 | 512, 1, 1, 1 | F32 | blk.19.attn_kv_a_norm.weight
|
366 |
+
306: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.19.attn_kv_b.weight
|
367 |
+
307: 5120 | 5120, 1, 1, 1 | F32 | blk.19.attn_norm.weight
|
368 |
+
308: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.19.attn_output.weight
|
369 |
+
309: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.19.attn_q_a.weight
|
370 |
+
310: 1536 | 1536, 1, 1, 1 | F32 | blk.19.attn_q_a_norm.weight
|
371 |
+
311: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.19.attn_q_b.weight
|
372 |
+
312: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.19.ffn_down_exps.weight
|
373 |
+
313: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.19.ffn_down_shexp.weight
|
374 |
+
314: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.19.ffn_gate_exps.weight
|
375 |
+
315: 819200 | 5120, 160, 1, 1 | F32 | blk.19.ffn_gate_inp.weight
|
376 |
+
316: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.19.ffn_gate_shexp.weight
|
377 |
+
317: 5120 | 5120, 1, 1, 1 | F32 | blk.19.ffn_norm.weight
|
378 |
+
318: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.19.ffn_up_exps.weight
|
379 |
+
319: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.19.ffn_up_shexp.weight
|
380 |
+
320: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.20.attn_kv_a_mqa.weight
|
381 |
+
321: 512 | 512, 1, 1, 1 | F32 | blk.20.attn_kv_a_norm.weight
|
382 |
+
322: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.20.attn_kv_b.weight
|
383 |
+
323: 5120 | 5120, 1, 1, 1 | F32 | blk.20.attn_norm.weight
|
384 |
+
324: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.20.attn_output.weight
|
385 |
+
325: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.20.attn_q_a.weight
|
386 |
+
326: 1536 | 1536, 1, 1, 1 | F32 | blk.20.attn_q_a_norm.weight
|
387 |
+
327: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.20.attn_q_b.weight
|
388 |
+
328: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.20.ffn_down_exps.weight
|
389 |
+
329: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.20.ffn_down_shexp.weight
|
390 |
+
330: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.20.ffn_gate_exps.weight
|
391 |
+
331: 819200 | 5120, 160, 1, 1 | F32 | blk.20.ffn_gate_inp.weight
|
392 |
+
332: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.20.ffn_gate_shexp.weight
|
393 |
+
333: 5120 | 5120, 1, 1, 1 | F32 | blk.20.ffn_norm.weight
|
394 |
+
334: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.20.ffn_up_exps.weight
|
395 |
+
335: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.20.ffn_up_shexp.weight
|
396 |
+
336: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.21.attn_kv_a_mqa.weight
|
397 |
+
337: 512 | 512, 1, 1, 1 | F32 | blk.21.attn_kv_a_norm.weight
|
398 |
+
338: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.21.attn_kv_b.weight
|
399 |
+
339: 5120 | 5120, 1, 1, 1 | F32 | blk.21.attn_norm.weight
|
400 |
+
340: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.21.attn_output.weight
|
401 |
+
341: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.21.attn_q_a.weight
|
402 |
+
342: 1536 | 1536, 1, 1, 1 | F32 | blk.21.attn_q_a_norm.weight
|
403 |
+
343: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.21.attn_q_b.weight
|
404 |
+
344: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.21.ffn_down_exps.weight
|
405 |
+
345: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.21.ffn_down_shexp.weight
|
406 |
+
346: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.21.ffn_gate_exps.weight
|
407 |
+
347: 819200 | 5120, 160, 1, 1 | F32 | blk.21.ffn_gate_inp.weight
|
408 |
+
348: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.21.ffn_gate_shexp.weight
|
409 |
+
349: 5120 | 5120, 1, 1, 1 | F32 | blk.21.ffn_norm.weight
|
410 |
+
350: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.21.ffn_up_exps.weight
|
411 |
+
351: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.21.ffn_up_shexp.weight
|
412 |
+
352: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.22.attn_kv_a_mqa.weight
|
413 |
+
353: 512 | 512, 1, 1, 1 | F32 | blk.22.attn_kv_a_norm.weight
|
414 |
+
354: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.22.attn_kv_b.weight
|
415 |
+
355: 5120 | 5120, 1, 1, 1 | F32 | blk.22.attn_norm.weight
|
416 |
+
356: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.22.attn_output.weight
|
417 |
+
357: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.22.attn_q_a.weight
|
418 |
+
358: 1536 | 1536, 1, 1, 1 | F32 | blk.22.attn_q_a_norm.weight
|
419 |
+
359: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.22.attn_q_b.weight
|
420 |
+
360: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.22.ffn_down_exps.weight
|
421 |
+
361: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.22.ffn_down_shexp.weight
|
422 |
+
362: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.22.ffn_gate_exps.weight
|
423 |
+
363: 819200 | 5120, 160, 1, 1 | F32 | blk.22.ffn_gate_inp.weight
|
424 |
+
364: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.22.ffn_gate_shexp.weight
|
425 |
+
365: 5120 | 5120, 1, 1, 1 | F32 | blk.22.ffn_norm.weight
|
426 |
+
366: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.22.ffn_up_exps.weight
|
427 |
+
367: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.22.ffn_up_shexp.weight
|
428 |
+
368: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.23.attn_kv_a_mqa.weight
|
429 |
+
369: 512 | 512, 1, 1, 1 | F32 | blk.23.attn_kv_a_norm.weight
|
430 |
+
370: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.23.attn_kv_b.weight
|
431 |
+
371: 5120 | 5120, 1, 1, 1 | F32 | blk.23.attn_norm.weight
|
432 |
+
372: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.23.attn_output.weight
|
433 |
+
373: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.23.attn_q_a.weight
|
434 |
+
374: 1536 | 1536, 1, 1, 1 | F32 | blk.23.attn_q_a_norm.weight
|
435 |
+
375: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.23.attn_q_b.weight
|
436 |
+
376: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.23.ffn_down_exps.weight
|
437 |
+
377: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.23.ffn_down_shexp.weight
|
438 |
+
378: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.23.ffn_gate_exps.weight
|
439 |
+
379: 819200 | 5120, 160, 1, 1 | F32 | blk.23.ffn_gate_inp.weight
|
440 |
+
380: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.23.ffn_gate_shexp.weight
|
441 |
+
381: 5120 | 5120, 1, 1, 1 | F32 | blk.23.ffn_norm.weight
|
442 |
+
382: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.23.ffn_up_exps.weight
|
443 |
+
383: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.23.ffn_up_shexp.weight
|
444 |
+
384: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.24.attn_kv_a_mqa.weight
|
445 |
+
385: 512 | 512, 1, 1, 1 | F32 | blk.24.attn_kv_a_norm.weight
|
446 |
+
386: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.24.attn_kv_b.weight
|
447 |
+
387: 5120 | 5120, 1, 1, 1 | F32 | blk.24.attn_norm.weight
|
448 |
+
388: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.24.attn_output.weight
|
449 |
+
389: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.24.attn_q_a.weight
|
450 |
+
390: 1536 | 1536, 1, 1, 1 | F32 | blk.24.attn_q_a_norm.weight
|
451 |
+
391: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.24.attn_q_b.weight
|
452 |
+
392: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.24.ffn_down_exps.weight
|
453 |
+
393: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.24.ffn_down_shexp.weight
|
454 |
+
394: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.24.ffn_gate_exps.weight
|
455 |
+
395: 819200 | 5120, 160, 1, 1 | F32 | blk.24.ffn_gate_inp.weight
|
456 |
+
396: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.24.ffn_gate_shexp.weight
|
457 |
+
397: 5120 | 5120, 1, 1, 1 | F32 | blk.24.ffn_norm.weight
|
458 |
+
398: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.24.ffn_up_exps.weight
|
459 |
+
399: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.24.ffn_up_shexp.weight
|
460 |
+
400: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.25.attn_kv_a_mqa.weight
|
461 |
+
401: 512 | 512, 1, 1, 1 | F32 | blk.25.attn_kv_a_norm.weight
|
462 |
+
402: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.25.attn_kv_b.weight
|
463 |
+
403: 5120 | 5120, 1, 1, 1 | F32 | blk.25.attn_norm.weight
|
464 |
+
404: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.25.attn_output.weight
|
465 |
+
405: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.25.attn_q_a.weight
|
466 |
+
406: 1536 | 1536, 1, 1, 1 | F32 | blk.25.attn_q_a_norm.weight
|
467 |
+
407: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.25.attn_q_b.weight
|
468 |
+
408: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.25.ffn_down_exps.weight
|
469 |
+
409: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.25.ffn_down_shexp.weight
|
470 |
+
410: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.25.ffn_gate_exps.weight
|
471 |
+
411: 819200 | 5120, 160, 1, 1 | F32 | blk.25.ffn_gate_inp.weight
|
472 |
+
412: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.25.ffn_gate_shexp.weight
|
473 |
+
413: 5120 | 5120, 1, 1, 1 | F32 | blk.25.ffn_norm.weight
|
474 |
+
414: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.25.ffn_up_exps.weight
|
475 |
+
415: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.25.ffn_up_shexp.weight
|
476 |
+
416: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.26.attn_kv_a_mqa.weight
|
477 |
+
417: 512 | 512, 1, 1, 1 | F32 | blk.26.attn_kv_a_norm.weight
|
478 |
+
418: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.26.attn_kv_b.weight
|
479 |
+
419: 5120 | 5120, 1, 1, 1 | F32 | blk.26.attn_norm.weight
|
480 |
+
420: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.26.attn_output.weight
|
481 |
+
421: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.26.attn_q_a.weight
|
482 |
+
422: 1536 | 1536, 1, 1, 1 | F32 | blk.26.attn_q_a_norm.weight
|
483 |
+
423: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.26.attn_q_b.weight
|
484 |
+
424: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.26.ffn_down_exps.weight
|
485 |
+
425: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.26.ffn_down_shexp.weight
|
486 |
+
426: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.26.ffn_gate_exps.weight
|
487 |
+
427: 819200 | 5120, 160, 1, 1 | F32 | blk.26.ffn_gate_inp.weight
|
488 |
+
428: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.26.ffn_gate_shexp.weight
|
489 |
+
429: 5120 | 5120, 1, 1, 1 | F32 | blk.26.ffn_norm.weight
|
490 |
+
430: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.26.ffn_up_exps.weight
|
491 |
+
431: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.26.ffn_up_shexp.weight
|
492 |
+
432: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.27.attn_kv_a_mqa.weight
|
493 |
+
433: 512 | 512, 1, 1, 1 | F32 | blk.27.attn_kv_a_norm.weight
|
494 |
+
434: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.27.attn_kv_b.weight
|
495 |
+
435: 5120 | 5120, 1, 1, 1 | F32 | blk.27.attn_norm.weight
|
496 |
+
436: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.27.attn_output.weight
|
497 |
+
437: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.27.attn_q_a.weight
|
498 |
+
438: 1536 | 1536, 1, 1, 1 | F32 | blk.27.attn_q_a_norm.weight
|
499 |
+
439: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.27.attn_q_b.weight
|
500 |
+
440: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.27.ffn_down_exps.weight
|
501 |
+
441: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.27.ffn_down_shexp.weight
|
502 |
+
442: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.27.ffn_gate_exps.weight
|
503 |
+
443: 819200 | 5120, 160, 1, 1 | F32 | blk.27.ffn_gate_inp.weight
|
504 |
+
444: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.27.ffn_gate_shexp.weight
|
505 |
+
445: 5120 | 5120, 1, 1, 1 | F32 | blk.27.ffn_norm.weight
|
506 |
+
446: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.27.ffn_up_exps.weight
|
507 |
+
447: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.27.ffn_up_shexp.weight
|
508 |
+
448: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.28.attn_kv_a_mqa.weight
|
509 |
+
449: 512 | 512, 1, 1, 1 | F32 | blk.28.attn_kv_a_norm.weight
|
510 |
+
450: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.28.attn_kv_b.weight
|
511 |
+
451: 5120 | 5120, 1, 1, 1 | F32 | blk.28.attn_norm.weight
|
512 |
+
452: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.28.attn_output.weight
|
513 |
+
453: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.28.attn_q_a.weight
|
514 |
+
454: 1536 | 1536, 1, 1, 1 | F32 | blk.28.attn_q_a_norm.weight
|
515 |
+
455: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.28.attn_q_b.weight
|
516 |
+
456: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.28.ffn_down_exps.weight
|
517 |
+
457: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.28.ffn_down_shexp.weight
|
518 |
+
458: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.28.ffn_gate_exps.weight
|
519 |
+
459: 819200 | 5120, 160, 1, 1 | F32 | blk.28.ffn_gate_inp.weight
|
520 |
+
460: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.28.ffn_gate_shexp.weight
|
521 |
+
461: 5120 | 5120, 1, 1, 1 | F32 | blk.28.ffn_norm.weight
|
522 |
+
462: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.28.ffn_up_exps.weight
|
523 |
+
463: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.28.ffn_up_shexp.weight
|
524 |
+
464: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.29.attn_kv_a_mqa.weight
|
525 |
+
465: 512 | 512, 1, 1, 1 | F32 | blk.29.attn_kv_a_norm.weight
|
526 |
+
466: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.29.attn_kv_b.weight
|
527 |
+
467: 5120 | 5120, 1, 1, 1 | F32 | blk.29.attn_norm.weight
|
528 |
+
468: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.29.attn_output.weight
|
529 |
+
469: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.29.attn_q_a.weight
|
530 |
+
470: 1536 | 1536, 1, 1, 1 | F32 | blk.29.attn_q_a_norm.weight
|
531 |
+
471: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.29.attn_q_b.weight
|
532 |
+
472: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.29.ffn_down_exps.weight
|
533 |
+
473: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.29.ffn_down_shexp.weight
|
534 |
+
474: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.29.ffn_gate_exps.weight
|
535 |
+
475: 819200 | 5120, 160, 1, 1 | F32 | blk.29.ffn_gate_inp.weight
|
536 |
+
476: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.29.ffn_gate_shexp.weight
|
537 |
+
477: 5120 | 5120, 1, 1, 1 | F32 | blk.29.ffn_norm.weight
|
538 |
+
478: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.29.ffn_up_exps.weight
|
539 |
+
479: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.29.ffn_up_shexp.weight
|
540 |
+
480: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.30.attn_kv_a_mqa.weight
|
DeepSeek-v2.5-1210-UD-iq2_s-00002-of-00002.gguf.tensors.txt
ADDED
@@ -0,0 +1,489 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
INFO:gguf-dump:* Loading: DeepSeek-v2.5-1210-UD-iq2_s-00002-of-00002.gguf
|
2 |
+
* File is LITTLE endian, script is running on a LITTLE endian host.
|
3 |
+
* Dumping 6 key/value pair(s)
|
4 |
+
1: UINT32 | 1 | GGUF.version = 3
|
5 |
+
2: UINT64 | 1 | GGUF.tensor_count = 479
|
6 |
+
3: UINT64 | 1 | GGUF.kv_count = 3
|
7 |
+
4: UINT16 | 1 | split.no = 1
|
8 |
+
5: INT32 | 1 | split.tensors.count = 959
|
9 |
+
6: UINT16 | 1 | split.count = 2
|
10 |
+
* Dumping 479 tensor(s)
|
11 |
+
1: 512 | 512, 1, 1, 1 | F32 | blk.30.attn_kv_a_norm.weight
|
12 |
+
2: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.30.attn_kv_b.weight
|
13 |
+
3: 5120 | 5120, 1, 1, 1 | F32 | blk.30.attn_norm.weight
|
14 |
+
4: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.30.attn_output.weight
|
15 |
+
5: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.30.attn_q_a.weight
|
16 |
+
6: 1536 | 1536, 1, 1, 1 | F32 | blk.30.attn_q_a_norm.weight
|
17 |
+
7: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.30.attn_q_b.weight
|
18 |
+
8: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.30.ffn_down_exps.weight
|
19 |
+
9: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.30.ffn_down_shexp.weight
|
20 |
+
10: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.30.ffn_gate_exps.weight
|
21 |
+
11: 819200 | 5120, 160, 1, 1 | F32 | blk.30.ffn_gate_inp.weight
|
22 |
+
12: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.30.ffn_gate_shexp.weight
|
23 |
+
13: 5120 | 5120, 1, 1, 1 | F32 | blk.30.ffn_norm.weight
|
24 |
+
14: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.30.ffn_up_exps.weight
|
25 |
+
15: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.30.ffn_up_shexp.weight
|
26 |
+
16: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.31.attn_kv_a_mqa.weight
|
27 |
+
17: 512 | 512, 1, 1, 1 | F32 | blk.31.attn_kv_a_norm.weight
|
28 |
+
18: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.31.attn_kv_b.weight
|
29 |
+
19: 5120 | 5120, 1, 1, 1 | F32 | blk.31.attn_norm.weight
|
30 |
+
20: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.31.attn_output.weight
|
31 |
+
21: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.31.attn_q_a.weight
|
32 |
+
22: 1536 | 1536, 1, 1, 1 | F32 | blk.31.attn_q_a_norm.weight
|
33 |
+
23: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.31.attn_q_b.weight
|
34 |
+
24: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.31.ffn_down_exps.weight
|
35 |
+
25: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.31.ffn_down_shexp.weight
|
36 |
+
26: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.31.ffn_gate_exps.weight
|
37 |
+
27: 819200 | 5120, 160, 1, 1 | F32 | blk.31.ffn_gate_inp.weight
|
38 |
+
28: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.31.ffn_gate_shexp.weight
|
39 |
+
29: 5120 | 5120, 1, 1, 1 | F32 | blk.31.ffn_norm.weight
|
40 |
+
30: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.31.ffn_up_exps.weight
|
41 |
+
31: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.31.ffn_up_shexp.weight
|
42 |
+
32: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.32.attn_kv_a_mqa.weight
|
43 |
+
33: 512 | 512, 1, 1, 1 | F32 | blk.32.attn_kv_a_norm.weight
|
44 |
+
34: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.32.attn_kv_b.weight
|
45 |
+
35: 5120 | 5120, 1, 1, 1 | F32 | blk.32.attn_norm.weight
|
46 |
+
36: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.32.attn_output.weight
|
47 |
+
37: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.32.attn_q_a.weight
|
48 |
+
38: 1536 | 1536, 1, 1, 1 | F32 | blk.32.attn_q_a_norm.weight
|
49 |
+
39: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.32.attn_q_b.weight
|
50 |
+
40: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.32.ffn_down_exps.weight
|
51 |
+
41: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.32.ffn_down_shexp.weight
|
52 |
+
42: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.32.ffn_gate_exps.weight
|
53 |
+
43: 819200 | 5120, 160, 1, 1 | F32 | blk.32.ffn_gate_inp.weight
|
54 |
+
44: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.32.ffn_gate_shexp.weight
|
55 |
+
45: 5120 | 5120, 1, 1, 1 | F32 | blk.32.ffn_norm.weight
|
56 |
+
46: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.32.ffn_up_exps.weight
|
57 |
+
47: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.32.ffn_up_shexp.weight
|
58 |
+
48: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.33.attn_kv_a_mqa.weight
|
59 |
+
49: 512 | 512, 1, 1, 1 | F32 | blk.33.attn_kv_a_norm.weight
|
60 |
+
50: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.33.attn_kv_b.weight
|
61 |
+
51: 5120 | 5120, 1, 1, 1 | F32 | blk.33.attn_norm.weight
|
62 |
+
52: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.33.attn_output.weight
|
63 |
+
53: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.33.attn_q_a.weight
|
64 |
+
54: 1536 | 1536, 1, 1, 1 | F32 | blk.33.attn_q_a_norm.weight
|
65 |
+
55: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.33.attn_q_b.weight
|
66 |
+
56: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.33.ffn_down_exps.weight
|
67 |
+
57: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.33.ffn_down_shexp.weight
|
68 |
+
58: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.33.ffn_gate_exps.weight
|
69 |
+
59: 819200 | 5120, 160, 1, 1 | F32 | blk.33.ffn_gate_inp.weight
|
70 |
+
60: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.33.ffn_gate_shexp.weight
|
71 |
+
61: 5120 | 5120, 1, 1, 1 | F32 | blk.33.ffn_norm.weight
|
72 |
+
62: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.33.ffn_up_exps.weight
|
73 |
+
63: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.33.ffn_up_shexp.weight
|
74 |
+
64: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.34.attn_kv_a_mqa.weight
|
75 |
+
65: 512 | 512, 1, 1, 1 | F32 | blk.34.attn_kv_a_norm.weight
|
76 |
+
66: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.34.attn_kv_b.weight
|
77 |
+
67: 5120 | 5120, 1, 1, 1 | F32 | blk.34.attn_norm.weight
|
78 |
+
68: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.34.attn_output.weight
|
79 |
+
69: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.34.attn_q_a.weight
|
80 |
+
70: 1536 | 1536, 1, 1, 1 | F32 | blk.34.attn_q_a_norm.weight
|
81 |
+
71: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.34.attn_q_b.weight
|
82 |
+
72: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.34.ffn_down_exps.weight
|
83 |
+
73: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.34.ffn_down_shexp.weight
|
84 |
+
74: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.34.ffn_gate_exps.weight
|
85 |
+
75: 819200 | 5120, 160, 1, 1 | F32 | blk.34.ffn_gate_inp.weight
|
86 |
+
76: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.34.ffn_gate_shexp.weight
|
87 |
+
77: 5120 | 5120, 1, 1, 1 | F32 | blk.34.ffn_norm.weight
|
88 |
+
78: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.34.ffn_up_exps.weight
|
89 |
+
79: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.34.ffn_up_shexp.weight
|
90 |
+
80: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.35.attn_kv_a_mqa.weight
|
91 |
+
81: 512 | 512, 1, 1, 1 | F32 | blk.35.attn_kv_a_norm.weight
|
92 |
+
82: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.35.attn_kv_b.weight
|
93 |
+
83: 5120 | 5120, 1, 1, 1 | F32 | blk.35.attn_norm.weight
|
94 |
+
84: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.35.attn_output.weight
|
95 |
+
85: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.35.attn_q_a.weight
|
96 |
+
86: 1536 | 1536, 1, 1, 1 | F32 | blk.35.attn_q_a_norm.weight
|
97 |
+
87: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.35.attn_q_b.weight
|
98 |
+
88: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.35.ffn_down_exps.weight
|
99 |
+
89: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.35.ffn_down_shexp.weight
|
100 |
+
90: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.35.ffn_gate_exps.weight
|
101 |
+
91: 819200 | 5120, 160, 1, 1 | F32 | blk.35.ffn_gate_inp.weight
|
102 |
+
92: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.35.ffn_gate_shexp.weight
|
103 |
+
93: 5120 | 5120, 1, 1, 1 | F32 | blk.35.ffn_norm.weight
|
104 |
+
94: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.35.ffn_up_exps.weight
|
105 |
+
95: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.35.ffn_up_shexp.weight
|
106 |
+
96: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.36.attn_kv_a_mqa.weight
|
107 |
+
97: 512 | 512, 1, 1, 1 | F32 | blk.36.attn_kv_a_norm.weight
|
108 |
+
98: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.36.attn_kv_b.weight
|
109 |
+
99: 5120 | 5120, 1, 1, 1 | F32 | blk.36.attn_norm.weight
|
110 |
+
100: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.36.attn_output.weight
|
111 |
+
101: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.36.attn_q_a.weight
|
112 |
+
102: 1536 | 1536, 1, 1, 1 | F32 | blk.36.attn_q_a_norm.weight
|
113 |
+
103: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.36.attn_q_b.weight
|
114 |
+
104: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.36.ffn_down_exps.weight
|
115 |
+
105: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.36.ffn_down_shexp.weight
|
116 |
+
106: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.36.ffn_gate_exps.weight
|
117 |
+
107: 819200 | 5120, 160, 1, 1 | F32 | blk.36.ffn_gate_inp.weight
|
118 |
+
108: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.36.ffn_gate_shexp.weight
|
119 |
+
109: 5120 | 5120, 1, 1, 1 | F32 | blk.36.ffn_norm.weight
|
120 |
+
110: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.36.ffn_up_exps.weight
|
121 |
+
111: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.36.ffn_up_shexp.weight
|
122 |
+
112: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.37.attn_kv_a_mqa.weight
|
123 |
+
113: 512 | 512, 1, 1, 1 | F32 | blk.37.attn_kv_a_norm.weight
|
124 |
+
114: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.37.attn_kv_b.weight
|
125 |
+
115: 5120 | 5120, 1, 1, 1 | F32 | blk.37.attn_norm.weight
|
126 |
+
116: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.37.attn_output.weight
|
127 |
+
117: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.37.attn_q_a.weight
|
128 |
+
118: 1536 | 1536, 1, 1, 1 | F32 | blk.37.attn_q_a_norm.weight
|
129 |
+
119: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.37.attn_q_b.weight
|
130 |
+
120: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.37.ffn_down_exps.weight
|
131 |
+
121: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.37.ffn_down_shexp.weight
|
132 |
+
122: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.37.ffn_gate_exps.weight
|
133 |
+
123: 819200 | 5120, 160, 1, 1 | F32 | blk.37.ffn_gate_inp.weight
|
134 |
+
124: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.37.ffn_gate_shexp.weight
|
135 |
+
125: 5120 | 5120, 1, 1, 1 | F32 | blk.37.ffn_norm.weight
|
136 |
+
126: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.37.ffn_up_exps.weight
|
137 |
+
127: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.37.ffn_up_shexp.weight
|
138 |
+
128: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.38.attn_kv_a_mqa.weight
|
139 |
+
129: 512 | 512, 1, 1, 1 | F32 | blk.38.attn_kv_a_norm.weight
|
140 |
+
130: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.38.attn_kv_b.weight
|
141 |
+
131: 5120 | 5120, 1, 1, 1 | F32 | blk.38.attn_norm.weight
|
142 |
+
132: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.38.attn_output.weight
|
143 |
+
133: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.38.attn_q_a.weight
|
144 |
+
134: 1536 | 1536, 1, 1, 1 | F32 | blk.38.attn_q_a_norm.weight
|
145 |
+
135: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.38.attn_q_b.weight
|
146 |
+
136: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.38.ffn_down_exps.weight
|
147 |
+
137: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.38.ffn_down_shexp.weight
|
148 |
+
138: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.38.ffn_gate_exps.weight
|
149 |
+
139: 819200 | 5120, 160, 1, 1 | F32 | blk.38.ffn_gate_inp.weight
|
150 |
+
140: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.38.ffn_gate_shexp.weight
|
151 |
+
141: 5120 | 5120, 1, 1, 1 | F32 | blk.38.ffn_norm.weight
|
152 |
+
142: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.38.ffn_up_exps.weight
|
153 |
+
143: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.38.ffn_up_shexp.weight
|
154 |
+
144: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.39.attn_kv_a_mqa.weight
|
155 |
+
145: 512 | 512, 1, 1, 1 | F32 | blk.39.attn_kv_a_norm.weight
|
156 |
+
146: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.39.attn_kv_b.weight
|
157 |
+
147: 5120 | 5120, 1, 1, 1 | F32 | blk.39.attn_norm.weight
|
158 |
+
148: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.39.attn_output.weight
|
159 |
+
149: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.39.attn_q_a.weight
|
160 |
+
150: 1536 | 1536, 1, 1, 1 | F32 | blk.39.attn_q_a_norm.weight
|
161 |
+
151: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.39.attn_q_b.weight
|
162 |
+
152: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.39.ffn_down_exps.weight
|
163 |
+
153: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.39.ffn_down_shexp.weight
|
164 |
+
154: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.39.ffn_gate_exps.weight
|
165 |
+
155: 819200 | 5120, 160, 1, 1 | F32 | blk.39.ffn_gate_inp.weight
|
166 |
+
156: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.39.ffn_gate_shexp.weight
|
167 |
+
157: 5120 | 5120, 1, 1, 1 | F32 | blk.39.ffn_norm.weight
|
168 |
+
158: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.39.ffn_up_exps.weight
|
169 |
+
159: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.39.ffn_up_shexp.weight
|
170 |
+
160: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.40.attn_kv_a_mqa.weight
|
171 |
+
161: 512 | 512, 1, 1, 1 | F32 | blk.40.attn_kv_a_norm.weight
|
172 |
+
162: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.40.attn_kv_b.weight
|
173 |
+
163: 5120 | 5120, 1, 1, 1 | F32 | blk.40.attn_norm.weight
|
174 |
+
164: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.40.attn_output.weight
|
175 |
+
165: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.40.attn_q_a.weight
|
176 |
+
166: 1536 | 1536, 1, 1, 1 | F32 | blk.40.attn_q_a_norm.weight
|
177 |
+
167: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.40.attn_q_b.weight
|
178 |
+
168: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.40.ffn_down_exps.weight
|
179 |
+
169: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.40.ffn_down_shexp.weight
|
180 |
+
170: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.40.ffn_gate_exps.weight
|
181 |
+
171: 819200 | 5120, 160, 1, 1 | F32 | blk.40.ffn_gate_inp.weight
|
182 |
+
172: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.40.ffn_gate_shexp.weight
|
183 |
+
173: 5120 | 5120, 1, 1, 1 | F32 | blk.40.ffn_norm.weight
|
184 |
+
174: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.40.ffn_up_exps.weight
|
185 |
+
175: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.40.ffn_up_shexp.weight
|
186 |
+
176: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.41.attn_kv_a_mqa.weight
|
187 |
+
177: 512 | 512, 1, 1, 1 | F32 | blk.41.attn_kv_a_norm.weight
|
188 |
+
178: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.41.attn_kv_b.weight
|
189 |
+
179: 5120 | 5120, 1, 1, 1 | F32 | blk.41.attn_norm.weight
|
190 |
+
180: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.41.attn_output.weight
|
191 |
+
181: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.41.attn_q_a.weight
|
192 |
+
182: 1536 | 1536, 1, 1, 1 | F32 | blk.41.attn_q_a_norm.weight
|
193 |
+
183: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.41.attn_q_b.weight
|
194 |
+
184: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.41.ffn_down_exps.weight
|
195 |
+
185: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.41.ffn_down_shexp.weight
|
196 |
+
186: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.41.ffn_gate_exps.weight
|
197 |
+
187: 819200 | 5120, 160, 1, 1 | F32 | blk.41.ffn_gate_inp.weight
|
198 |
+
188: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.41.ffn_gate_shexp.weight
|
199 |
+
189: 5120 | 5120, 1, 1, 1 | F32 | blk.41.ffn_norm.weight
|
200 |
+
190: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.41.ffn_up_exps.weight
|
201 |
+
191: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.41.ffn_up_shexp.weight
|
202 |
+
192: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.42.attn_kv_a_mqa.weight
|
203 |
+
193: 512 | 512, 1, 1, 1 | F32 | blk.42.attn_kv_a_norm.weight
|
204 |
+
194: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.42.attn_kv_b.weight
|
205 |
+
195: 5120 | 5120, 1, 1, 1 | F32 | blk.42.attn_norm.weight
|
206 |
+
196: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.42.attn_output.weight
|
207 |
+
197: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.42.attn_q_a.weight
|
208 |
+
198: 1536 | 1536, 1, 1, 1 | F32 | blk.42.attn_q_a_norm.weight
|
209 |
+
199: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.42.attn_q_b.weight
|
210 |
+
200: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.42.ffn_down_exps.weight
|
211 |
+
201: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.42.ffn_down_shexp.weight
|
212 |
+
202: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.42.ffn_gate_exps.weight
|
213 |
+
203: 819200 | 5120, 160, 1, 1 | F32 | blk.42.ffn_gate_inp.weight
|
214 |
+
204: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.42.ffn_gate_shexp.weight
|
215 |
+
205: 5120 | 5120, 1, 1, 1 | F32 | blk.42.ffn_norm.weight
|
216 |
+
206: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.42.ffn_up_exps.weight
|
217 |
+
207: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.42.ffn_up_shexp.weight
|
218 |
+
208: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.43.attn_kv_a_mqa.weight
|
219 |
+
209: 512 | 512, 1, 1, 1 | F32 | blk.43.attn_kv_a_norm.weight
|
220 |
+
210: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.43.attn_kv_b.weight
|
221 |
+
211: 5120 | 5120, 1, 1, 1 | F32 | blk.43.attn_norm.weight
|
222 |
+
212: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.43.attn_output.weight
|
223 |
+
213: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.43.attn_q_a.weight
|
224 |
+
214: 1536 | 1536, 1, 1, 1 | F32 | blk.43.attn_q_a_norm.weight
|
225 |
+
215: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.43.attn_q_b.weight
|
226 |
+
216: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.43.ffn_down_exps.weight
|
227 |
+
217: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.43.ffn_down_shexp.weight
|
228 |
+
218: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.43.ffn_gate_exps.weight
|
229 |
+
219: 819200 | 5120, 160, 1, 1 | F32 | blk.43.ffn_gate_inp.weight
|
230 |
+
220: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.43.ffn_gate_shexp.weight
|
231 |
+
221: 5120 | 5120, 1, 1, 1 | F32 | blk.43.ffn_norm.weight
|
232 |
+
222: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.43.ffn_up_exps.weight
|
233 |
+
223: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.43.ffn_up_shexp.weight
|
234 |
+
224: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.44.attn_kv_a_mqa.weight
|
235 |
+
225: 512 | 512, 1, 1, 1 | F32 | blk.44.attn_kv_a_norm.weight
|
236 |
+
226: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.44.attn_kv_b.weight
|
237 |
+
227: 5120 | 5120, 1, 1, 1 | F32 | blk.44.attn_norm.weight
|
238 |
+
228: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.44.attn_output.weight
|
239 |
+
229: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.44.attn_q_a.weight
|
240 |
+
230: 1536 | 1536, 1, 1, 1 | F32 | blk.44.attn_q_a_norm.weight
|
241 |
+
231: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.44.attn_q_b.weight
|
242 |
+
232: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.44.ffn_down_exps.weight
|
243 |
+
233: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.44.ffn_down_shexp.weight
|
244 |
+
234: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.44.ffn_gate_exps.weight
|
245 |
+
235: 819200 | 5120, 160, 1, 1 | F32 | blk.44.ffn_gate_inp.weight
|
246 |
+
236: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.44.ffn_gate_shexp.weight
|
247 |
+
237: 5120 | 5120, 1, 1, 1 | F32 | blk.44.ffn_norm.weight
|
248 |
+
238: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.44.ffn_up_exps.weight
|
249 |
+
239: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.44.ffn_up_shexp.weight
|
250 |
+
240: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.45.attn_kv_a_mqa.weight
|
251 |
+
241: 512 | 512, 1, 1, 1 | F32 | blk.45.attn_kv_a_norm.weight
|
252 |
+
242: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.45.attn_kv_b.weight
|
253 |
+
243: 5120 | 5120, 1, 1, 1 | F32 | blk.45.attn_norm.weight
|
254 |
+
244: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.45.attn_output.weight
|
255 |
+
245: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.45.attn_q_a.weight
|
256 |
+
246: 1536 | 1536, 1, 1, 1 | F32 | blk.45.attn_q_a_norm.weight
|
257 |
+
247: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.45.attn_q_b.weight
|
258 |
+
248: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.45.ffn_down_exps.weight
|
259 |
+
249: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.45.ffn_down_shexp.weight
|
260 |
+
250: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.45.ffn_gate_exps.weight
|
261 |
+
251: 819200 | 5120, 160, 1, 1 | F32 | blk.45.ffn_gate_inp.weight
|
262 |
+
252: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.45.ffn_gate_shexp.weight
|
263 |
+
253: 5120 | 5120, 1, 1, 1 | F32 | blk.45.ffn_norm.weight
|
264 |
+
254: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.45.ffn_up_exps.weight
|
265 |
+
255: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.45.ffn_up_shexp.weight
|
266 |
+
256: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.46.attn_kv_a_mqa.weight
|
267 |
+
257: 512 | 512, 1, 1, 1 | F32 | blk.46.attn_kv_a_norm.weight
|
268 |
+
258: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.46.attn_kv_b.weight
|
269 |
+
259: 5120 | 5120, 1, 1, 1 | F32 | blk.46.attn_norm.weight
|
270 |
+
260: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.46.attn_output.weight
|
271 |
+
261: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.46.attn_q_a.weight
|
272 |
+
262: 1536 | 1536, 1, 1, 1 | F32 | blk.46.attn_q_a_norm.weight
|
273 |
+
263: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.46.attn_q_b.weight
|
274 |
+
264: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.46.ffn_down_exps.weight
|
275 |
+
265: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.46.ffn_down_shexp.weight
|
276 |
+
266: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.46.ffn_gate_exps.weight
|
277 |
+
267: 819200 | 5120, 160, 1, 1 | F32 | blk.46.ffn_gate_inp.weight
|
278 |
+
268: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.46.ffn_gate_shexp.weight
|
279 |
+
269: 5120 | 5120, 1, 1, 1 | F32 | blk.46.ffn_norm.weight
|
280 |
+
270: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.46.ffn_up_exps.weight
|
281 |
+
271: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.46.ffn_up_shexp.weight
|
282 |
+
272: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.47.attn_kv_a_mqa.weight
|
283 |
+
273: 512 | 512, 1, 1, 1 | F32 | blk.47.attn_kv_a_norm.weight
|
284 |
+
274: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.47.attn_kv_b.weight
|
285 |
+
275: 5120 | 5120, 1, 1, 1 | F32 | blk.47.attn_norm.weight
|
286 |
+
276: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.47.attn_output.weight
|
287 |
+
277: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.47.attn_q_a.weight
|
288 |
+
278: 1536 | 1536, 1, 1, 1 | F32 | blk.47.attn_q_a_norm.weight
|
289 |
+
279: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.47.attn_q_b.weight
|
290 |
+
280: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.47.ffn_down_exps.weight
|
291 |
+
281: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.47.ffn_down_shexp.weight
|
292 |
+
282: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.47.ffn_gate_exps.weight
|
293 |
+
283: 819200 | 5120, 160, 1, 1 | F32 | blk.47.ffn_gate_inp.weight
|
294 |
+
284: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.47.ffn_gate_shexp.weight
|
295 |
+
285: 5120 | 5120, 1, 1, 1 | F32 | blk.47.ffn_norm.weight
|
296 |
+
286: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.47.ffn_up_exps.weight
|
297 |
+
287: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.47.ffn_up_shexp.weight
|
298 |
+
288: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.48.attn_kv_a_mqa.weight
|
299 |
+
289: 512 | 512, 1, 1, 1 | F32 | blk.48.attn_kv_a_norm.weight
|
300 |
+
290: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.48.attn_kv_b.weight
|
301 |
+
291: 5120 | 5120, 1, 1, 1 | F32 | blk.48.attn_norm.weight
|
302 |
+
292: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.48.attn_output.weight
|
303 |
+
293: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.48.attn_q_a.weight
|
304 |
+
294: 1536 | 1536, 1, 1, 1 | F32 | blk.48.attn_q_a_norm.weight
|
305 |
+
295: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.48.attn_q_b.weight
|
306 |
+
296: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.48.ffn_down_exps.weight
|
307 |
+
297: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.48.ffn_down_shexp.weight
|
308 |
+
298: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.48.ffn_gate_exps.weight
|
309 |
+
299: 819200 | 5120, 160, 1, 1 | F32 | blk.48.ffn_gate_inp.weight
|
310 |
+
300: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.48.ffn_gate_shexp.weight
|
311 |
+
301: 5120 | 5120, 1, 1, 1 | F32 | blk.48.ffn_norm.weight
|
312 |
+
302: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.48.ffn_up_exps.weight
|
313 |
+
303: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.48.ffn_up_shexp.weight
|
314 |
+
304: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.49.attn_kv_a_mqa.weight
|
315 |
+
305: 512 | 512, 1, 1, 1 | F32 | blk.49.attn_kv_a_norm.weight
|
316 |
+
306: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.49.attn_kv_b.weight
|
317 |
+
307: 5120 | 5120, 1, 1, 1 | F32 | blk.49.attn_norm.weight
|
318 |
+
308: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.49.attn_output.weight
|
319 |
+
309: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.49.attn_q_a.weight
|
320 |
+
310: 1536 | 1536, 1, 1, 1 | F32 | blk.49.attn_q_a_norm.weight
|
321 |
+
311: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.49.attn_q_b.weight
|
322 |
+
312: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.49.ffn_down_exps.weight
|
323 |
+
313: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.49.ffn_down_shexp.weight
|
324 |
+
314: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.49.ffn_gate_exps.weight
|
325 |
+
315: 819200 | 5120, 160, 1, 1 | F32 | blk.49.ffn_gate_inp.weight
|
326 |
+
316: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.49.ffn_gate_shexp.weight
|
327 |
+
317: 5120 | 5120, 1, 1, 1 | F32 | blk.49.ffn_norm.weight
|
328 |
+
318: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.49.ffn_up_exps.weight
|
329 |
+
319: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.49.ffn_up_shexp.weight
|
330 |
+
320: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.50.attn_kv_a_mqa.weight
|
331 |
+
321: 512 | 512, 1, 1, 1 | F32 | blk.50.attn_kv_a_norm.weight
|
332 |
+
322: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.50.attn_kv_b.weight
|
333 |
+
323: 5120 | 5120, 1, 1, 1 | F32 | blk.50.attn_norm.weight
|
334 |
+
324: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.50.attn_output.weight
|
335 |
+
325: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.50.attn_q_a.weight
|
336 |
+
326: 1536 | 1536, 1, 1, 1 | F32 | blk.50.attn_q_a_norm.weight
|
337 |
+
327: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.50.attn_q_b.weight
|
338 |
+
328: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.50.ffn_down_exps.weight
|
339 |
+
329: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.50.ffn_down_shexp.weight
|
340 |
+
330: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.50.ffn_gate_exps.weight
|
341 |
+
331: 819200 | 5120, 160, 1, 1 | F32 | blk.50.ffn_gate_inp.weight
|
342 |
+
332: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.50.ffn_gate_shexp.weight
|
343 |
+
333: 5120 | 5120, 1, 1, 1 | F32 | blk.50.ffn_norm.weight
|
344 |
+
334: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.50.ffn_up_exps.weight
|
345 |
+
335: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.50.ffn_up_shexp.weight
|
346 |
+
336: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.51.attn_kv_a_mqa.weight
|
347 |
+
337: 512 | 512, 1, 1, 1 | F32 | blk.51.attn_kv_a_norm.weight
|
348 |
+
338: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.51.attn_kv_b.weight
|
349 |
+
339: 5120 | 5120, 1, 1, 1 | F32 | blk.51.attn_norm.weight
|
350 |
+
340: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.51.attn_output.weight
|
351 |
+
341: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.51.attn_q_a.weight
|
352 |
+
342: 1536 | 1536, 1, 1, 1 | F32 | blk.51.attn_q_a_norm.weight
|
353 |
+
343: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.51.attn_q_b.weight
|
354 |
+
344: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.51.ffn_down_exps.weight
|
355 |
+
345: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.51.ffn_down_shexp.weight
|
356 |
+
346: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.51.ffn_gate_exps.weight
|
357 |
+
347: 819200 | 5120, 160, 1, 1 | F32 | blk.51.ffn_gate_inp.weight
|
358 |
+
348: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.51.ffn_gate_shexp.weight
|
359 |
+
349: 5120 | 5120, 1, 1, 1 | F32 | blk.51.ffn_norm.weight
|
360 |
+
350: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.51.ffn_up_exps.weight
|
361 |
+
351: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.51.ffn_up_shexp.weight
|
362 |
+
352: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.52.attn_kv_a_mqa.weight
|
363 |
+
353: 512 | 512, 1, 1, 1 | F32 | blk.52.attn_kv_a_norm.weight
|
364 |
+
354: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.52.attn_kv_b.weight
|
365 |
+
355: 5120 | 5120, 1, 1, 1 | F32 | blk.52.attn_norm.weight
|
366 |
+
356: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.52.attn_output.weight
|
367 |
+
357: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.52.attn_q_a.weight
|
368 |
+
358: 1536 | 1536, 1, 1, 1 | F32 | blk.52.attn_q_a_norm.weight
|
369 |
+
359: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.52.attn_q_b.weight
|
370 |
+
360: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.52.ffn_down_exps.weight
|
371 |
+
361: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.52.ffn_down_shexp.weight
|
372 |
+
362: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.52.ffn_gate_exps.weight
|
373 |
+
363: 819200 | 5120, 160, 1, 1 | F32 | blk.52.ffn_gate_inp.weight
|
374 |
+
364: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.52.ffn_gate_shexp.weight
|
375 |
+
365: 5120 | 5120, 1, 1, 1 | F32 | blk.52.ffn_norm.weight
|
376 |
+
366: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.52.ffn_up_exps.weight
|
377 |
+
367: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.52.ffn_up_shexp.weight
|
378 |
+
368: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.53.attn_kv_a_mqa.weight
|
379 |
+
369: 512 | 512, 1, 1, 1 | F32 | blk.53.attn_kv_a_norm.weight
|
380 |
+
370: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.53.attn_kv_b.weight
|
381 |
+
371: 5120 | 5120, 1, 1, 1 | F32 | blk.53.attn_norm.weight
|
382 |
+
372: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.53.attn_output.weight
|
383 |
+
373: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.53.attn_q_a.weight
|
384 |
+
374: 1536 | 1536, 1, 1, 1 | F32 | blk.53.attn_q_a_norm.weight
|
385 |
+
375: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.53.attn_q_b.weight
|
386 |
+
376: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.53.ffn_down_exps.weight
|
387 |
+
377: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.53.ffn_down_shexp.weight
|
388 |
+
378: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.53.ffn_gate_exps.weight
|
389 |
+
379: 819200 | 5120, 160, 1, 1 | F32 | blk.53.ffn_gate_inp.weight
|
390 |
+
380: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.53.ffn_gate_shexp.weight
|
391 |
+
381: 5120 | 5120, 1, 1, 1 | F32 | blk.53.ffn_norm.weight
|
392 |
+
382: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.53.ffn_up_exps.weight
|
393 |
+
383: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.53.ffn_up_shexp.weight
|
394 |
+
384: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.54.attn_kv_a_mqa.weight
|
395 |
+
385: 512 | 512, 1, 1, 1 | F32 | blk.54.attn_kv_a_norm.weight
|
396 |
+
386: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.54.attn_kv_b.weight
|
397 |
+
387: 5120 | 5120, 1, 1, 1 | F32 | blk.54.attn_norm.weight
|
398 |
+
388: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.54.attn_output.weight
|
399 |
+
389: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.54.attn_q_a.weight
|
400 |
+
390: 1536 | 1536, 1, 1, 1 | F32 | blk.54.attn_q_a_norm.weight
|
401 |
+
391: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.54.attn_q_b.weight
|
402 |
+
392: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.54.ffn_down_exps.weight
|
403 |
+
393: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.54.ffn_down_shexp.weight
|
404 |
+
394: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.54.ffn_gate_exps.weight
|
405 |
+
395: 819200 | 5120, 160, 1, 1 | F32 | blk.54.ffn_gate_inp.weight
|
406 |
+
396: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.54.ffn_gate_shexp.weight
|
407 |
+
397: 5120 | 5120, 1, 1, 1 | F32 | blk.54.ffn_norm.weight
|
408 |
+
398: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.54.ffn_up_exps.weight
|
409 |
+
399: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.54.ffn_up_shexp.weight
|
410 |
+
400: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.55.attn_kv_a_mqa.weight
|
411 |
+
401: 512 | 512, 1, 1, 1 | F32 | blk.55.attn_kv_a_norm.weight
|
412 |
+
402: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.55.attn_kv_b.weight
|
413 |
+
403: 5120 | 5120, 1, 1, 1 | F32 | blk.55.attn_norm.weight
|
414 |
+
404: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.55.attn_output.weight
|
415 |
+
405: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.55.attn_q_a.weight
|
416 |
+
406: 1536 | 1536, 1, 1, 1 | F32 | blk.55.attn_q_a_norm.weight
|
417 |
+
407: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.55.attn_q_b.weight
|
418 |
+
408: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.55.ffn_down_exps.weight
|
419 |
+
409: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.55.ffn_down_shexp.weight
|
420 |
+
410: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.55.ffn_gate_exps.weight
|
421 |
+
411: 819200 | 5120, 160, 1, 1 | F32 | blk.55.ffn_gate_inp.weight
|
422 |
+
412: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.55.ffn_gate_shexp.weight
|
423 |
+
413: 5120 | 5120, 1, 1, 1 | F32 | blk.55.ffn_norm.weight
|
424 |
+
414: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.55.ffn_up_exps.weight
|
425 |
+
415: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.55.ffn_up_shexp.weight
|
426 |
+
416: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.56.attn_kv_a_mqa.weight
|
427 |
+
417: 512 | 512, 1, 1, 1 | F32 | blk.56.attn_kv_a_norm.weight
|
428 |
+
418: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.56.attn_kv_b.weight
|
429 |
+
419: 5120 | 5120, 1, 1, 1 | F32 | blk.56.attn_norm.weight
|
430 |
+
420: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.56.attn_output.weight
|
431 |
+
421: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.56.attn_q_a.weight
|
432 |
+
422: 1536 | 1536, 1, 1, 1 | F32 | blk.56.attn_q_a_norm.weight
|
433 |
+
423: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.56.attn_q_b.weight
|
434 |
+
424: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.56.ffn_down_exps.weight
|
435 |
+
425: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.56.ffn_down_shexp.weight
|
436 |
+
426: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.56.ffn_gate_exps.weight
|
437 |
+
427: 819200 | 5120, 160, 1, 1 | F32 | blk.56.ffn_gate_inp.weight
|
438 |
+
428: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.56.ffn_gate_shexp.weight
|
439 |
+
429: 5120 | 5120, 1, 1, 1 | F32 | blk.56.ffn_norm.weight
|
440 |
+
430: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.56.ffn_up_exps.weight
|
441 |
+
431: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.56.ffn_up_shexp.weight
|
442 |
+
432: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.57.attn_kv_a_mqa.weight
|
443 |
+
433: 512 | 512, 1, 1, 1 | F32 | blk.57.attn_kv_a_norm.weight
|
444 |
+
434: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.57.attn_kv_b.weight
|
445 |
+
435: 5120 | 5120, 1, 1, 1 | F32 | blk.57.attn_norm.weight
|
446 |
+
436: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.57.attn_output.weight
|
447 |
+
437: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.57.attn_q_a.weight
|
448 |
+
438: 1536 | 1536, 1, 1, 1 | F32 | blk.57.attn_q_a_norm.weight
|
449 |
+
439: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.57.attn_q_b.weight
|
450 |
+
440: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.57.ffn_down_exps.weight
|
451 |
+
441: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.57.ffn_down_shexp.weight
|
452 |
+
442: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.57.ffn_gate_exps.weight
|
453 |
+
443: 819200 | 5120, 160, 1, 1 | F32 | blk.57.ffn_gate_inp.weight
|
454 |
+
444: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.57.ffn_gate_shexp.weight
|
455 |
+
445: 5120 | 5120, 1, 1, 1 | F32 | blk.57.ffn_norm.weight
|
456 |
+
446: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.57.ffn_up_exps.weight
|
457 |
+
447: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.57.ffn_up_shexp.weight
|
458 |
+
448: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.58.attn_kv_a_mqa.weight
|
459 |
+
449: 512 | 512, 1, 1, 1 | F32 | blk.58.attn_kv_a_norm.weight
|
460 |
+
450: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.58.attn_kv_b.weight
|
461 |
+
451: 5120 | 5120, 1, 1, 1 | F32 | blk.58.attn_norm.weight
|
462 |
+
452: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.58.attn_output.weight
|
463 |
+
453: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.58.attn_q_a.weight
|
464 |
+
454: 1536 | 1536, 1, 1, 1 | F32 | blk.58.attn_q_a_norm.weight
|
465 |
+
455: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.58.attn_q_b.weight
|
466 |
+
456: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.58.ffn_down_exps.weight
|
467 |
+
457: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.58.ffn_down_shexp.weight
|
468 |
+
458: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.58.ffn_gate_exps.weight
|
469 |
+
459: 819200 | 5120, 160, 1, 1 | F32 | blk.58.ffn_gate_inp.weight
|
470 |
+
460: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.58.ffn_gate_shexp.weight
|
471 |
+
461: 5120 | 5120, 1, 1, 1 | F32 | blk.58.ffn_norm.weight
|
472 |
+
462: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.58.ffn_up_exps.weight
|
473 |
+
463: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.58.ffn_up_shexp.weight
|
474 |
+
464: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.59.attn_kv_a_mqa.weight
|
475 |
+
465: 512 | 512, 1, 1, 1 | F32 | blk.59.attn_kv_a_norm.weight
|
476 |
+
466: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.59.attn_kv_b.weight
|
477 |
+
467: 5120 | 5120, 1, 1, 1 | F32 | blk.59.attn_norm.weight
|
478 |
+
468: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.59.attn_output.weight
|
479 |
+
469: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.59.attn_q_a.weight
|
480 |
+
470: 1536 | 1536, 1, 1, 1 | F32 | blk.59.attn_q_a_norm.weight
|
481 |
+
471: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.59.attn_q_b.weight
|
482 |
+
472: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.59.ffn_down_exps.weight
|
483 |
+
473: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.59.ffn_down_shexp.weight
|
484 |
+
474: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.59.ffn_gate_exps.weight
|
485 |
+
475: 819200 | 5120, 160, 1, 1 | F32 | blk.59.ffn_gate_inp.weight
|
486 |
+
476: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.59.ffn_gate_shexp.weight
|
487 |
+
477: 5120 | 5120, 1, 1, 1 | F32 | blk.59.ffn_norm.weight
|
488 |
+
478: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.59.ffn_up_exps.weight
|
489 |
+
479: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.59.ffn_up_shexp.weight
|
DeepSeek-v2.5-1210-UD-iq2_xxs-00001-of-00002.gguf.tensors.txt
ADDED
@@ -0,0 +1,537 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
INFO:gguf-dump:* Loading: DeepSeek-v2.5-1210-UD-iq2_xxs-00001-of-00002.gguf
|
2 |
+
* File is LITTLE endian, script is running on a LITTLE endian host.
|
3 |
+
* Dumping 56 key/value pair(s)
|
4 |
+
1: UINT32 | 1 | GGUF.version = 3
|
5 |
+
2: UINT64 | 1 | GGUF.tensor_count = 477
|
6 |
+
3: UINT64 | 1 | GGUF.kv_count = 53
|
7 |
+
4: STRING | 1 | general.architecture = 'deepseek2'
|
8 |
+
5: STRING | 1 | general.type = 'model'
|
9 |
+
6: STRING | 1 | general.name = 'Dsv25'
|
10 |
+
7: STRING | 1 | general.size_label = '160x14B'
|
11 |
+
8: STRING | 1 | general.license = 'other'
|
12 |
+
9: STRING | 1 | general.license.name = 'deepseek'
|
13 |
+
10: STRING | 1 | general.license.link = 'https://github.com/deepseek-ai/DeepSeek-V2/blob/main/LICENSE'
|
14 |
+
11: UINT32 | 1 | deepseek2.block_count = 60
|
15 |
+
12: UINT32 | 1 | deepseek2.context_length = 163840
|
16 |
+
13: UINT32 | 1 | deepseek2.embedding_length = 5120
|
17 |
+
14: UINT32 | 1 | deepseek2.feed_forward_length = 12288
|
18 |
+
15: UINT32 | 1 | deepseek2.attention.head_count = 128
|
19 |
+
16: UINT32 | 1 | deepseek2.attention.head_count_kv = 128
|
20 |
+
17: FLOAT32 | 1 | deepseek2.rope.freq_base = 10000.0
|
21 |
+
18: FLOAT32 | 1 | deepseek2.attention.layer_norm_rms_epsilon = 9.999999974752427e-07
|
22 |
+
19: UINT32 | 1 | deepseek2.expert_used_count = 6
|
23 |
+
20: UINT32 | 1 | deepseek2.leading_dense_block_count = 1
|
24 |
+
21: UINT32 | 1 | deepseek2.vocab_size = 102400
|
25 |
+
22: UINT32 | 1 | deepseek2.attention.q_lora_rank = 1536
|
26 |
+
23: UINT32 | 1 | deepseek2.attention.kv_lora_rank = 512
|
27 |
+
24: UINT32 | 1 | deepseek2.attention.key_length = 192
|
28 |
+
25: UINT32 | 1 | deepseek2.attention.value_length = 128
|
29 |
+
26: UINT32 | 1 | deepseek2.expert_feed_forward_length = 1536
|
30 |
+
27: UINT32 | 1 | deepseek2.expert_count = 160
|
31 |
+
28: UINT32 | 1 | deepseek2.expert_shared_count = 2
|
32 |
+
29: FLOAT32 | 1 | deepseek2.expert_weights_scale = 16.0
|
33 |
+
30: BOOL | 1 | deepseek2.expert_weights_norm = False
|
34 |
+
31: UINT32 | 1 | deepseek2.expert_gating_func = 1
|
35 |
+
32: UINT32 | 1 | deepseek2.rope.dimension_count = 64
|
36 |
+
33: STRING | 1 | deepseek2.rope.scaling.type = 'yarn'
|
37 |
+
34: FLOAT32 | 1 | deepseek2.rope.scaling.factor = 40.0
|
38 |
+
35: UINT32 | 1 | deepseek2.rope.scaling.original_context_length = 4096
|
39 |
+
36: FLOAT32 | 1 | deepseek2.rope.scaling.yarn_log_multiplier = 0.10000000149011612
|
40 |
+
37: STRING | 1 | tokenizer.ggml.model = 'gpt2'
|
41 |
+
38: STRING | 1 | tokenizer.ggml.pre = 'deepseek-llm'
|
42 |
+
39: [STRING] | 102400 | tokenizer.ggml.tokens
|
43 |
+
40: [INT32] | 102400 | tokenizer.ggml.token_type
|
44 |
+
41: [STRING] | 99757 | tokenizer.ggml.merges
|
45 |
+
42: UINT32 | 1 | tokenizer.ggml.bos_token_id = 100000
|
46 |
+
43: UINT32 | 1 | tokenizer.ggml.eos_token_id = 100001
|
47 |
+
44: UINT32 | 1 | tokenizer.ggml.padding_token_id = 100001
|
48 |
+
45: BOOL | 1 | tokenizer.ggml.add_bos_token = True
|
49 |
+
46: BOOL | 1 | tokenizer.ggml.add_eos_token = False
|
50 |
+
47: STRING | 1 | tokenizer.chat_template = '{% if not add_generation_prompt is defined %}{% set add_gene'
|
51 |
+
48: UINT32 | 1 | general.quantization_version = 2
|
52 |
+
49: UINT32 | 1 | general.file_type = 19
|
53 |
+
50: STRING | 1 | quantize.imatrix.file = '/spare/llama/dsv25/imatrix-DeepSeek-V2.5-1210-bartowski.dat'
|
54 |
+
51: STRING | 1 | quantize.imatrix.dataset = '/training_dir/calibration_datav3.txt'
|
55 |
+
52: INT32 | 1 | quantize.imatrix.entries_count = 716
|
56 |
+
53: INT32 | 1 | quantize.imatrix.chunks_count = 139
|
57 |
+
54: UINT16 | 1 | split.no = 0
|
58 |
+
55: INT32 | 1 | split.tensors.count = 959
|
59 |
+
56: UINT16 | 1 | split.count = 2
|
60 |
+
* Dumping 477 tensor(s)
|
61 |
+
1: 524288000 | 5120, 102400, 1, 1 | Q6_K | output.weight
|
62 |
+
2: 5120 | 5120, 1, 1, 1 | F32 | output_norm.weight
|
63 |
+
3: 524288000 | 5120, 102400, 1, 1 | Q4_K | token_embd.weight
|
64 |
+
4: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.0.attn_kv_a_mqa.weight
|
65 |
+
5: 512 | 512, 1, 1, 1 | F32 | blk.0.attn_kv_a_norm.weight
|
66 |
+
6: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.0.attn_kv_b.weight
|
67 |
+
7: 5120 | 5120, 1, 1, 1 | F32 | blk.0.attn_norm.weight
|
68 |
+
8: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.0.attn_output.weight
|
69 |
+
9: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.0.attn_q_a.weight
|
70 |
+
10: 1536 | 1536, 1, 1, 1 | F32 | blk.0.attn_q_a_norm.weight
|
71 |
+
11: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.0.attn_q_b.weight
|
72 |
+
12: 62914560 | 12288, 5120, 1, 1 | Q6_K | blk.0.ffn_down.weight
|
73 |
+
13: 62914560 | 5120, 12288, 1, 1 | Q4_K | blk.0.ffn_gate.weight
|
74 |
+
14: 5120 | 5120, 1, 1, 1 | F32 | blk.0.ffn_norm.weight
|
75 |
+
15: 62914560 | 5120, 12288, 1, 1 | Q4_K | blk.0.ffn_up.weight
|
76 |
+
16: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.1.attn_kv_a_mqa.weight
|
77 |
+
17: 512 | 512, 1, 1, 1 | F32 | blk.1.attn_kv_a_norm.weight
|
78 |
+
18: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.1.attn_kv_b.weight
|
79 |
+
19: 5120 | 5120, 1, 1, 1 | F32 | blk.1.attn_norm.weight
|
80 |
+
20: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.1.attn_output.weight
|
81 |
+
21: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.1.attn_q_a.weight
|
82 |
+
22: 1536 | 1536, 1, 1, 1 | F32 | blk.1.attn_q_a_norm.weight
|
83 |
+
23: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.1.attn_q_b.weight
|
84 |
+
24: 1258291200 | 1536, 5120, 160, 1 | Q3_K | blk.1.ffn_down_exps.weight
|
85 |
+
25: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.1.ffn_down_shexp.weight
|
86 |
+
26: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.1.ffn_gate_exps.weight
|
87 |
+
27: 819200 | 5120, 160, 1, 1 | F32 | blk.1.ffn_gate_inp.weight
|
88 |
+
28: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.1.ffn_gate_shexp.weight
|
89 |
+
29: 5120 | 5120, 1, 1, 1 | F32 | blk.1.ffn_norm.weight
|
90 |
+
30: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.1.ffn_up_exps.weight
|
91 |
+
31: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.1.ffn_up_shexp.weight
|
92 |
+
32: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.2.attn_kv_a_mqa.weight
|
93 |
+
33: 512 | 512, 1, 1, 1 | F32 | blk.2.attn_kv_a_norm.weight
|
94 |
+
34: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.2.attn_kv_b.weight
|
95 |
+
35: 5120 | 5120, 1, 1, 1 | F32 | blk.2.attn_norm.weight
|
96 |
+
36: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.2.attn_output.weight
|
97 |
+
37: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.2.attn_q_a.weight
|
98 |
+
38: 1536 | 1536, 1, 1, 1 | F32 | blk.2.attn_q_a_norm.weight
|
99 |
+
39: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.2.attn_q_b.weight
|
100 |
+
40: 1258291200 | 1536, 5120, 160, 1 | Q3_K | blk.2.ffn_down_exps.weight
|
101 |
+
41: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.2.ffn_down_shexp.weight
|
102 |
+
42: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.2.ffn_gate_exps.weight
|
103 |
+
43: 819200 | 5120, 160, 1, 1 | F32 | blk.2.ffn_gate_inp.weight
|
104 |
+
44: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.2.ffn_gate_shexp.weight
|
105 |
+
45: 5120 | 5120, 1, 1, 1 | F32 | blk.2.ffn_norm.weight
|
106 |
+
46: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.2.ffn_up_exps.weight
|
107 |
+
47: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.2.ffn_up_shexp.weight
|
108 |
+
48: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.3.attn_kv_a_mqa.weight
|
109 |
+
49: 512 | 512, 1, 1, 1 | F32 | blk.3.attn_kv_a_norm.weight
|
110 |
+
50: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.3.attn_kv_b.weight
|
111 |
+
51: 5120 | 5120, 1, 1, 1 | F32 | blk.3.attn_norm.weight
|
112 |
+
52: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.3.attn_output.weight
|
113 |
+
53: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.3.attn_q_a.weight
|
114 |
+
54: 1536 | 1536, 1, 1, 1 | F32 | blk.3.attn_q_a_norm.weight
|
115 |
+
55: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.3.attn_q_b.weight
|
116 |
+
56: 1258291200 | 1536, 5120, 160, 1 | Q3_K | blk.3.ffn_down_exps.weight
|
117 |
+
57: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.3.ffn_down_shexp.weight
|
118 |
+
58: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.3.ffn_gate_exps.weight
|
119 |
+
59: 819200 | 5120, 160, 1, 1 | F32 | blk.3.ffn_gate_inp.weight
|
120 |
+
60: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.3.ffn_gate_shexp.weight
|
121 |
+
61: 5120 | 5120, 1, 1, 1 | F32 | blk.3.ffn_norm.weight
|
122 |
+
62: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.3.ffn_up_exps.weight
|
123 |
+
63: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.3.ffn_up_shexp.weight
|
124 |
+
64: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.4.attn_kv_a_mqa.weight
|
125 |
+
65: 512 | 512, 1, 1, 1 | F32 | blk.4.attn_kv_a_norm.weight
|
126 |
+
66: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.4.attn_kv_b.weight
|
127 |
+
67: 5120 | 5120, 1, 1, 1 | F32 | blk.4.attn_norm.weight
|
128 |
+
68: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.4.attn_output.weight
|
129 |
+
69: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.4.attn_q_a.weight
|
130 |
+
70: 1536 | 1536, 1, 1, 1 | F32 | blk.4.attn_q_a_norm.weight
|
131 |
+
71: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.4.attn_q_b.weight
|
132 |
+
72: 1258291200 | 1536, 5120, 160, 1 | Q3_K | blk.4.ffn_down_exps.weight
|
133 |
+
73: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.4.ffn_down_shexp.weight
|
134 |
+
74: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.4.ffn_gate_exps.weight
|
135 |
+
75: 819200 | 5120, 160, 1, 1 | F32 | blk.4.ffn_gate_inp.weight
|
136 |
+
76: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.4.ffn_gate_shexp.weight
|
137 |
+
77: 5120 | 5120, 1, 1, 1 | F32 | blk.4.ffn_norm.weight
|
138 |
+
78: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.4.ffn_up_exps.weight
|
139 |
+
79: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.4.ffn_up_shexp.weight
|
140 |
+
80: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.5.attn_kv_a_mqa.weight
|
141 |
+
81: 512 | 512, 1, 1, 1 | F32 | blk.5.attn_kv_a_norm.weight
|
142 |
+
82: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.5.attn_kv_b.weight
|
143 |
+
83: 5120 | 5120, 1, 1, 1 | F32 | blk.5.attn_norm.weight
|
144 |
+
84: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.5.attn_output.weight
|
145 |
+
85: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.5.attn_q_a.weight
|
146 |
+
86: 1536 | 1536, 1, 1, 1 | F32 | blk.5.attn_q_a_norm.weight
|
147 |
+
87: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.5.attn_q_b.weight
|
148 |
+
88: 1258291200 | 1536, 5120, 160, 1 | Q3_K | blk.5.ffn_down_exps.weight
|
149 |
+
89: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.5.ffn_down_shexp.weight
|
150 |
+
90: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.5.ffn_gate_exps.weight
|
151 |
+
91: 819200 | 5120, 160, 1, 1 | F32 | blk.5.ffn_gate_inp.weight
|
152 |
+
92: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.5.ffn_gate_shexp.weight
|
153 |
+
93: 5120 | 5120, 1, 1, 1 | F32 | blk.5.ffn_norm.weight
|
154 |
+
94: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.5.ffn_up_exps.weight
|
155 |
+
95: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.5.ffn_up_shexp.weight
|
156 |
+
96: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.6.attn_kv_a_mqa.weight
|
157 |
+
97: 512 | 512, 1, 1, 1 | F32 | blk.6.attn_kv_a_norm.weight
|
158 |
+
98: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.6.attn_kv_b.weight
|
159 |
+
99: 5120 | 5120, 1, 1, 1 | F32 | blk.6.attn_norm.weight
|
160 |
+
100: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.6.attn_output.weight
|
161 |
+
101: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.6.attn_q_a.weight
|
162 |
+
102: 1536 | 1536, 1, 1, 1 | F32 | blk.6.attn_q_a_norm.weight
|
163 |
+
103: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.6.attn_q_b.weight
|
164 |
+
104: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.6.ffn_down_exps.weight
|
165 |
+
105: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.6.ffn_down_shexp.weight
|
166 |
+
106: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.6.ffn_gate_exps.weight
|
167 |
+
107: 819200 | 5120, 160, 1, 1 | F32 | blk.6.ffn_gate_inp.weight
|
168 |
+
108: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.6.ffn_gate_shexp.weight
|
169 |
+
109: 5120 | 5120, 1, 1, 1 | F32 | blk.6.ffn_norm.weight
|
170 |
+
110: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.6.ffn_up_exps.weight
|
171 |
+
111: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.6.ffn_up_shexp.weight
|
172 |
+
112: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.7.attn_kv_a_mqa.weight
|
173 |
+
113: 512 | 512, 1, 1, 1 | F32 | blk.7.attn_kv_a_norm.weight
|
174 |
+
114: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.7.attn_kv_b.weight
|
175 |
+
115: 5120 | 5120, 1, 1, 1 | F32 | blk.7.attn_norm.weight
|
176 |
+
116: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.7.attn_output.weight
|
177 |
+
117: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.7.attn_q_a.weight
|
178 |
+
118: 1536 | 1536, 1, 1, 1 | F32 | blk.7.attn_q_a_norm.weight
|
179 |
+
119: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.7.attn_q_b.weight
|
180 |
+
120: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.7.ffn_down_exps.weight
|
181 |
+
121: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.7.ffn_down_shexp.weight
|
182 |
+
122: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.7.ffn_gate_exps.weight
|
183 |
+
123: 819200 | 5120, 160, 1, 1 | F32 | blk.7.ffn_gate_inp.weight
|
184 |
+
124: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.7.ffn_gate_shexp.weight
|
185 |
+
125: 5120 | 5120, 1, 1, 1 | F32 | blk.7.ffn_norm.weight
|
186 |
+
126: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.7.ffn_up_exps.weight
|
187 |
+
127: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.7.ffn_up_shexp.weight
|
188 |
+
128: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.8.attn_kv_a_mqa.weight
|
189 |
+
129: 512 | 512, 1, 1, 1 | F32 | blk.8.attn_kv_a_norm.weight
|
190 |
+
130: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.8.attn_kv_b.weight
|
191 |
+
131: 5120 | 5120, 1, 1, 1 | F32 | blk.8.attn_norm.weight
|
192 |
+
132: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.8.attn_output.weight
|
193 |
+
133: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.8.attn_q_a.weight
|
194 |
+
134: 1536 | 1536, 1, 1, 1 | F32 | blk.8.attn_q_a_norm.weight
|
195 |
+
135: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.8.attn_q_b.weight
|
196 |
+
136: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.8.ffn_down_exps.weight
|
197 |
+
137: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.8.ffn_down_shexp.weight
|
198 |
+
138: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.8.ffn_gate_exps.weight
|
199 |
+
139: 819200 | 5120, 160, 1, 1 | F32 | blk.8.ffn_gate_inp.weight
|
200 |
+
140: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.8.ffn_gate_shexp.weight
|
201 |
+
141: 5120 | 5120, 1, 1, 1 | F32 | blk.8.ffn_norm.weight
|
202 |
+
142: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.8.ffn_up_exps.weight
|
203 |
+
143: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.8.ffn_up_shexp.weight
|
204 |
+
144: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.9.attn_kv_a_mqa.weight
|
205 |
+
145: 512 | 512, 1, 1, 1 | F32 | blk.9.attn_kv_a_norm.weight
|
206 |
+
146: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.9.attn_kv_b.weight
|
207 |
+
147: 5120 | 5120, 1, 1, 1 | F32 | blk.9.attn_norm.weight
|
208 |
+
148: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.9.attn_output.weight
|
209 |
+
149: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.9.attn_q_a.weight
|
210 |
+
150: 1536 | 1536, 1, 1, 1 | F32 | blk.9.attn_q_a_norm.weight
|
211 |
+
151: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.9.attn_q_b.weight
|
212 |
+
152: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.9.ffn_down_exps.weight
|
213 |
+
153: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.9.ffn_down_shexp.weight
|
214 |
+
154: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.9.ffn_gate_exps.weight
|
215 |
+
155: 819200 | 5120, 160, 1, 1 | F32 | blk.9.ffn_gate_inp.weight
|
216 |
+
156: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.9.ffn_gate_shexp.weight
|
217 |
+
157: 5120 | 5120, 1, 1, 1 | F32 | blk.9.ffn_norm.weight
|
218 |
+
158: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.9.ffn_up_exps.weight
|
219 |
+
159: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.9.ffn_up_shexp.weight
|
220 |
+
160: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.10.attn_kv_a_mqa.weight
|
221 |
+
161: 512 | 512, 1, 1, 1 | F32 | blk.10.attn_kv_a_norm.weight
|
222 |
+
162: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.10.attn_kv_b.weight
|
223 |
+
163: 5120 | 5120, 1, 1, 1 | F32 | blk.10.attn_norm.weight
|
224 |
+
164: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.10.attn_output.weight
|
225 |
+
165: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.10.attn_q_a.weight
|
226 |
+
166: 1536 | 1536, 1, 1, 1 | F32 | blk.10.attn_q_a_norm.weight
|
227 |
+
167: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.10.attn_q_b.weight
|
228 |
+
168: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.10.ffn_down_exps.weight
|
229 |
+
169: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.10.ffn_down_shexp.weight
|
230 |
+
170: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.10.ffn_gate_exps.weight
|
231 |
+
171: 819200 | 5120, 160, 1, 1 | F32 | blk.10.ffn_gate_inp.weight
|
232 |
+
172: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.10.ffn_gate_shexp.weight
|
233 |
+
173: 5120 | 5120, 1, 1, 1 | F32 | blk.10.ffn_norm.weight
|
234 |
+
174: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.10.ffn_up_exps.weight
|
235 |
+
175: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.10.ffn_up_shexp.weight
|
236 |
+
176: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.11.attn_kv_a_mqa.weight
|
237 |
+
177: 512 | 512, 1, 1, 1 | F32 | blk.11.attn_kv_a_norm.weight
|
238 |
+
178: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.11.attn_kv_b.weight
|
239 |
+
179: 5120 | 5120, 1, 1, 1 | F32 | blk.11.attn_norm.weight
|
240 |
+
180: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.11.attn_output.weight
|
241 |
+
181: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.11.attn_q_a.weight
|
242 |
+
182: 1536 | 1536, 1, 1, 1 | F32 | blk.11.attn_q_a_norm.weight
|
243 |
+
183: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.11.attn_q_b.weight
|
244 |
+
184: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.11.ffn_down_exps.weight
|
245 |
+
185: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.11.ffn_down_shexp.weight
|
246 |
+
186: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.11.ffn_gate_exps.weight
|
247 |
+
187: 819200 | 5120, 160, 1, 1 | F32 | blk.11.ffn_gate_inp.weight
|
248 |
+
188: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.11.ffn_gate_shexp.weight
|
249 |
+
189: 5120 | 5120, 1, 1, 1 | F32 | blk.11.ffn_norm.weight
|
250 |
+
190: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.11.ffn_up_exps.weight
|
251 |
+
191: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.11.ffn_up_shexp.weight
|
252 |
+
192: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.12.attn_kv_a_mqa.weight
|
253 |
+
193: 512 | 512, 1, 1, 1 | F32 | blk.12.attn_kv_a_norm.weight
|
254 |
+
194: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.12.attn_kv_b.weight
|
255 |
+
195: 5120 | 5120, 1, 1, 1 | F32 | blk.12.attn_norm.weight
|
256 |
+
196: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.12.attn_output.weight
|
257 |
+
197: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.12.attn_q_a.weight
|
258 |
+
198: 1536 | 1536, 1, 1, 1 | F32 | blk.12.attn_q_a_norm.weight
|
259 |
+
199: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.12.attn_q_b.weight
|
260 |
+
200: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.12.ffn_down_exps.weight
|
261 |
+
201: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.12.ffn_down_shexp.weight
|
262 |
+
202: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.12.ffn_gate_exps.weight
|
263 |
+
203: 819200 | 5120, 160, 1, 1 | F32 | blk.12.ffn_gate_inp.weight
|
264 |
+
204: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.12.ffn_gate_shexp.weight
|
265 |
+
205: 5120 | 5120, 1, 1, 1 | F32 | blk.12.ffn_norm.weight
|
266 |
+
206: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.12.ffn_up_exps.weight
|
267 |
+
207: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.12.ffn_up_shexp.weight
|
268 |
+
208: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.13.attn_kv_a_mqa.weight
|
269 |
+
209: 512 | 512, 1, 1, 1 | F32 | blk.13.attn_kv_a_norm.weight
|
270 |
+
210: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.13.attn_kv_b.weight
|
271 |
+
211: 5120 | 5120, 1, 1, 1 | F32 | blk.13.attn_norm.weight
|
272 |
+
212: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.13.attn_output.weight
|
273 |
+
213: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.13.attn_q_a.weight
|
274 |
+
214: 1536 | 1536, 1, 1, 1 | F32 | blk.13.attn_q_a_norm.weight
|
275 |
+
215: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.13.attn_q_b.weight
|
276 |
+
216: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.13.ffn_down_exps.weight
|
277 |
+
217: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.13.ffn_down_shexp.weight
|
278 |
+
218: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.13.ffn_gate_exps.weight
|
279 |
+
219: 819200 | 5120, 160, 1, 1 | F32 | blk.13.ffn_gate_inp.weight
|
280 |
+
220: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.13.ffn_gate_shexp.weight
|
281 |
+
221: 5120 | 5120, 1, 1, 1 | F32 | blk.13.ffn_norm.weight
|
282 |
+
222: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.13.ffn_up_exps.weight
|
283 |
+
223: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.13.ffn_up_shexp.weight
|
284 |
+
224: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.14.attn_kv_a_mqa.weight
|
285 |
+
225: 512 | 512, 1, 1, 1 | F32 | blk.14.attn_kv_a_norm.weight
|
286 |
+
226: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.14.attn_kv_b.weight
|
287 |
+
227: 5120 | 5120, 1, 1, 1 | F32 | blk.14.attn_norm.weight
|
288 |
+
228: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.14.attn_output.weight
|
289 |
+
229: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.14.attn_q_a.weight
|
290 |
+
230: 1536 | 1536, 1, 1, 1 | F32 | blk.14.attn_q_a_norm.weight
|
291 |
+
231: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.14.attn_q_b.weight
|
292 |
+
232: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.14.ffn_down_exps.weight
|
293 |
+
233: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.14.ffn_down_shexp.weight
|
294 |
+
234: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.14.ffn_gate_exps.weight
|
295 |
+
235: 819200 | 5120, 160, 1, 1 | F32 | blk.14.ffn_gate_inp.weight
|
296 |
+
236: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.14.ffn_gate_shexp.weight
|
297 |
+
237: 5120 | 5120, 1, 1, 1 | F32 | blk.14.ffn_norm.weight
|
298 |
+
238: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.14.ffn_up_exps.weight
|
299 |
+
239: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.14.ffn_up_shexp.weight
|
300 |
+
240: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.15.attn_kv_a_mqa.weight
|
301 |
+
241: 512 | 512, 1, 1, 1 | F32 | blk.15.attn_kv_a_norm.weight
|
302 |
+
242: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.15.attn_kv_b.weight
|
303 |
+
243: 5120 | 5120, 1, 1, 1 | F32 | blk.15.attn_norm.weight
|
304 |
+
244: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.15.attn_output.weight
|
305 |
+
245: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.15.attn_q_a.weight
|
306 |
+
246: 1536 | 1536, 1, 1, 1 | F32 | blk.15.attn_q_a_norm.weight
|
307 |
+
247: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.15.attn_q_b.weight
|
308 |
+
248: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.15.ffn_down_exps.weight
|
309 |
+
249: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.15.ffn_down_shexp.weight
|
310 |
+
250: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.15.ffn_gate_exps.weight
|
311 |
+
251: 819200 | 5120, 160, 1, 1 | F32 | blk.15.ffn_gate_inp.weight
|
312 |
+
252: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.15.ffn_gate_shexp.weight
|
313 |
+
253: 5120 | 5120, 1, 1, 1 | F32 | blk.15.ffn_norm.weight
|
314 |
+
254: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.15.ffn_up_exps.weight
|
315 |
+
255: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.15.ffn_up_shexp.weight
|
316 |
+
256: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.16.attn_kv_a_mqa.weight
|
317 |
+
257: 512 | 512, 1, 1, 1 | F32 | blk.16.attn_kv_a_norm.weight
|
318 |
+
258: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.16.attn_kv_b.weight
|
319 |
+
259: 5120 | 5120, 1, 1, 1 | F32 | blk.16.attn_norm.weight
|
320 |
+
260: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.16.attn_output.weight
|
321 |
+
261: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.16.attn_q_a.weight
|
322 |
+
262: 1536 | 1536, 1, 1, 1 | F32 | blk.16.attn_q_a_norm.weight
|
323 |
+
263: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.16.attn_q_b.weight
|
324 |
+
264: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.16.ffn_down_exps.weight
|
325 |
+
265: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.16.ffn_down_shexp.weight
|
326 |
+
266: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.16.ffn_gate_exps.weight
|
327 |
+
267: 819200 | 5120, 160, 1, 1 | F32 | blk.16.ffn_gate_inp.weight
|
328 |
+
268: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.16.ffn_gate_shexp.weight
|
329 |
+
269: 5120 | 5120, 1, 1, 1 | F32 | blk.16.ffn_norm.weight
|
330 |
+
270: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.16.ffn_up_exps.weight
|
331 |
+
271: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.16.ffn_up_shexp.weight
|
332 |
+
272: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.17.attn_kv_a_mqa.weight
|
333 |
+
273: 512 | 512, 1, 1, 1 | F32 | blk.17.attn_kv_a_norm.weight
|
334 |
+
274: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.17.attn_kv_b.weight
|
335 |
+
275: 5120 | 5120, 1, 1, 1 | F32 | blk.17.attn_norm.weight
|
336 |
+
276: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.17.attn_output.weight
|
337 |
+
277: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.17.attn_q_a.weight
|
338 |
+
278: 1536 | 1536, 1, 1, 1 | F32 | blk.17.attn_q_a_norm.weight
|
339 |
+
279: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.17.attn_q_b.weight
|
340 |
+
280: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.17.ffn_down_exps.weight
|
341 |
+
281: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.17.ffn_down_shexp.weight
|
342 |
+
282: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.17.ffn_gate_exps.weight
|
343 |
+
283: 819200 | 5120, 160, 1, 1 | F32 | blk.17.ffn_gate_inp.weight
|
344 |
+
284: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.17.ffn_gate_shexp.weight
|
345 |
+
285: 5120 | 5120, 1, 1, 1 | F32 | blk.17.ffn_norm.weight
|
346 |
+
286: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.17.ffn_up_exps.weight
|
347 |
+
287: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.17.ffn_up_shexp.weight
|
348 |
+
288: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.18.attn_kv_a_mqa.weight
|
349 |
+
289: 512 | 512, 1, 1, 1 | F32 | blk.18.attn_kv_a_norm.weight
|
350 |
+
290: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.18.attn_kv_b.weight
|
351 |
+
291: 5120 | 5120, 1, 1, 1 | F32 | blk.18.attn_norm.weight
|
352 |
+
292: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.18.attn_output.weight
|
353 |
+
293: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.18.attn_q_a.weight
|
354 |
+
294: 1536 | 1536, 1, 1, 1 | F32 | blk.18.attn_q_a_norm.weight
|
355 |
+
295: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.18.attn_q_b.weight
|
356 |
+
296: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.18.ffn_down_exps.weight
|
357 |
+
297: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.18.ffn_down_shexp.weight
|
358 |
+
298: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.18.ffn_gate_exps.weight
|
359 |
+
299: 819200 | 5120, 160, 1, 1 | F32 | blk.18.ffn_gate_inp.weight
|
360 |
+
300: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.18.ffn_gate_shexp.weight
|
361 |
+
301: 5120 | 5120, 1, 1, 1 | F32 | blk.18.ffn_norm.weight
|
362 |
+
302: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.18.ffn_up_exps.weight
|
363 |
+
303: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.18.ffn_up_shexp.weight
|
364 |
+
304: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.19.attn_kv_a_mqa.weight
|
365 |
+
305: 512 | 512, 1, 1, 1 | F32 | blk.19.attn_kv_a_norm.weight
|
366 |
+
306: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.19.attn_kv_b.weight
|
367 |
+
307: 5120 | 5120, 1, 1, 1 | F32 | blk.19.attn_norm.weight
|
368 |
+
308: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.19.attn_output.weight
|
369 |
+
309: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.19.attn_q_a.weight
|
370 |
+
310: 1536 | 1536, 1, 1, 1 | F32 | blk.19.attn_q_a_norm.weight
|
371 |
+
311: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.19.attn_q_b.weight
|
372 |
+
312: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.19.ffn_down_exps.weight
|
373 |
+
313: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.19.ffn_down_shexp.weight
|
374 |
+
314: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.19.ffn_gate_exps.weight
|
375 |
+
315: 819200 | 5120, 160, 1, 1 | F32 | blk.19.ffn_gate_inp.weight
|
376 |
+
316: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.19.ffn_gate_shexp.weight
|
377 |
+
317: 5120 | 5120, 1, 1, 1 | F32 | blk.19.ffn_norm.weight
|
378 |
+
318: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.19.ffn_up_exps.weight
|
379 |
+
319: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.19.ffn_up_shexp.weight
|
380 |
+
320: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.20.attn_kv_a_mqa.weight
|
381 |
+
321: 512 | 512, 1, 1, 1 | F32 | blk.20.attn_kv_a_norm.weight
|
382 |
+
322: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.20.attn_kv_b.weight
|
383 |
+
323: 5120 | 5120, 1, 1, 1 | F32 | blk.20.attn_norm.weight
|
384 |
+
324: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.20.attn_output.weight
|
385 |
+
325: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.20.attn_q_a.weight
|
386 |
+
326: 1536 | 1536, 1, 1, 1 | F32 | blk.20.attn_q_a_norm.weight
|
387 |
+
327: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.20.attn_q_b.weight
|
388 |
+
328: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.20.ffn_down_exps.weight
|
389 |
+
329: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.20.ffn_down_shexp.weight
|
390 |
+
330: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.20.ffn_gate_exps.weight
|
391 |
+
331: 819200 | 5120, 160, 1, 1 | F32 | blk.20.ffn_gate_inp.weight
|
392 |
+
332: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.20.ffn_gate_shexp.weight
|
393 |
+
333: 5120 | 5120, 1, 1, 1 | F32 | blk.20.ffn_norm.weight
|
394 |
+
334: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.20.ffn_up_exps.weight
|
395 |
+
335: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.20.ffn_up_shexp.weight
|
396 |
+
336: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.21.attn_kv_a_mqa.weight
|
397 |
+
337: 512 | 512, 1, 1, 1 | F32 | blk.21.attn_kv_a_norm.weight
|
398 |
+
338: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.21.attn_kv_b.weight
|
399 |
+
339: 5120 | 5120, 1, 1, 1 | F32 | blk.21.attn_norm.weight
|
400 |
+
340: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.21.attn_output.weight
|
401 |
+
341: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.21.attn_q_a.weight
|
402 |
+
342: 1536 | 1536, 1, 1, 1 | F32 | blk.21.attn_q_a_norm.weight
|
403 |
+
343: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.21.attn_q_b.weight
|
404 |
+
344: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.21.ffn_down_exps.weight
|
405 |
+
345: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.21.ffn_down_shexp.weight
|
406 |
+
346: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.21.ffn_gate_exps.weight
|
407 |
+
347: 819200 | 5120, 160, 1, 1 | F32 | blk.21.ffn_gate_inp.weight
|
408 |
+
348: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.21.ffn_gate_shexp.weight
|
409 |
+
349: 5120 | 5120, 1, 1, 1 | F32 | blk.21.ffn_norm.weight
|
410 |
+
350: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.21.ffn_up_exps.weight
|
411 |
+
351: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.21.ffn_up_shexp.weight
|
412 |
+
352: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.22.attn_kv_a_mqa.weight
|
413 |
+
353: 512 | 512, 1, 1, 1 | F32 | blk.22.attn_kv_a_norm.weight
|
414 |
+
354: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.22.attn_kv_b.weight
|
415 |
+
355: 5120 | 5120, 1, 1, 1 | F32 | blk.22.attn_norm.weight
|
416 |
+
356: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.22.attn_output.weight
|
417 |
+
357: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.22.attn_q_a.weight
|
418 |
+
358: 1536 | 1536, 1, 1, 1 | F32 | blk.22.attn_q_a_norm.weight
|
419 |
+
359: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.22.attn_q_b.weight
|
420 |
+
360: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.22.ffn_down_exps.weight
|
421 |
+
361: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.22.ffn_down_shexp.weight
|
422 |
+
362: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.22.ffn_gate_exps.weight
|
423 |
+
363: 819200 | 5120, 160, 1, 1 | F32 | blk.22.ffn_gate_inp.weight
|
424 |
+
364: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.22.ffn_gate_shexp.weight
|
425 |
+
365: 5120 | 5120, 1, 1, 1 | F32 | blk.22.ffn_norm.weight
|
426 |
+
366: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.22.ffn_up_exps.weight
|
427 |
+
367: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.22.ffn_up_shexp.weight
|
428 |
+
368: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.23.attn_kv_a_mqa.weight
|
429 |
+
369: 512 | 512, 1, 1, 1 | F32 | blk.23.attn_kv_a_norm.weight
|
430 |
+
370: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.23.attn_kv_b.weight
|
431 |
+
371: 5120 | 5120, 1, 1, 1 | F32 | blk.23.attn_norm.weight
|
432 |
+
372: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.23.attn_output.weight
|
433 |
+
373: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.23.attn_q_a.weight
|
434 |
+
374: 1536 | 1536, 1, 1, 1 | F32 | blk.23.attn_q_a_norm.weight
|
435 |
+
375: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.23.attn_q_b.weight
|
436 |
+
376: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.23.ffn_down_exps.weight
|
437 |
+
377: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.23.ffn_down_shexp.weight
|
438 |
+
378: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.23.ffn_gate_exps.weight
|
439 |
+
379: 819200 | 5120, 160, 1, 1 | F32 | blk.23.ffn_gate_inp.weight
|
440 |
+
380: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.23.ffn_gate_shexp.weight
|
441 |
+
381: 5120 | 5120, 1, 1, 1 | F32 | blk.23.ffn_norm.weight
|
442 |
+
382: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.23.ffn_up_exps.weight
|
443 |
+
383: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.23.ffn_up_shexp.weight
|
444 |
+
384: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.24.attn_kv_a_mqa.weight
|
445 |
+
385: 512 | 512, 1, 1, 1 | F32 | blk.24.attn_kv_a_norm.weight
|
446 |
+
386: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.24.attn_kv_b.weight
|
447 |
+
387: 5120 | 5120, 1, 1, 1 | F32 | blk.24.attn_norm.weight
|
448 |
+
388: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.24.attn_output.weight
|
449 |
+
389: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.24.attn_q_a.weight
|
450 |
+
390: 1536 | 1536, 1, 1, 1 | F32 | blk.24.attn_q_a_norm.weight
|
451 |
+
391: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.24.attn_q_b.weight
|
452 |
+
392: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.24.ffn_down_exps.weight
|
453 |
+
393: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.24.ffn_down_shexp.weight
|
454 |
+
394: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.24.ffn_gate_exps.weight
|
455 |
+
395: 819200 | 5120, 160, 1, 1 | F32 | blk.24.ffn_gate_inp.weight
|
456 |
+
396: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.24.ffn_gate_shexp.weight
|
457 |
+
397: 5120 | 5120, 1, 1, 1 | F32 | blk.24.ffn_norm.weight
|
458 |
+
398: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.24.ffn_up_exps.weight
|
459 |
+
399: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.24.ffn_up_shexp.weight
|
460 |
+
400: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.25.attn_kv_a_mqa.weight
|
461 |
+
401: 512 | 512, 1, 1, 1 | F32 | blk.25.attn_kv_a_norm.weight
|
462 |
+
402: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.25.attn_kv_b.weight
|
463 |
+
403: 5120 | 5120, 1, 1, 1 | F32 | blk.25.attn_norm.weight
|
464 |
+
404: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.25.attn_output.weight
|
465 |
+
405: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.25.attn_q_a.weight
|
466 |
+
406: 1536 | 1536, 1, 1, 1 | F32 | blk.25.attn_q_a_norm.weight
|
467 |
+
407: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.25.attn_q_b.weight
|
468 |
+
408: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.25.ffn_down_exps.weight
|
469 |
+
409: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.25.ffn_down_shexp.weight
|
470 |
+
410: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.25.ffn_gate_exps.weight
|
471 |
+
411: 819200 | 5120, 160, 1, 1 | F32 | blk.25.ffn_gate_inp.weight
|
472 |
+
412: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.25.ffn_gate_shexp.weight
|
473 |
+
413: 5120 | 5120, 1, 1, 1 | F32 | blk.25.ffn_norm.weight
|
474 |
+
414: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.25.ffn_up_exps.weight
|
475 |
+
415: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.25.ffn_up_shexp.weight
|
476 |
+
416: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.26.attn_kv_a_mqa.weight
|
477 |
+
417: 512 | 512, 1, 1, 1 | F32 | blk.26.attn_kv_a_norm.weight
|
478 |
+
418: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.26.attn_kv_b.weight
|
479 |
+
419: 5120 | 5120, 1, 1, 1 | F32 | blk.26.attn_norm.weight
|
480 |
+
420: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.26.attn_output.weight
|
481 |
+
421: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.26.attn_q_a.weight
|
482 |
+
422: 1536 | 1536, 1, 1, 1 | F32 | blk.26.attn_q_a_norm.weight
|
483 |
+
423: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.26.attn_q_b.weight
|
484 |
+
424: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.26.ffn_down_exps.weight
|
485 |
+
425: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.26.ffn_down_shexp.weight
|
486 |
+
426: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.26.ffn_gate_exps.weight
|
487 |
+
427: 819200 | 5120, 160, 1, 1 | F32 | blk.26.ffn_gate_inp.weight
|
488 |
+
428: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.26.ffn_gate_shexp.weight
|
489 |
+
429: 5120 | 5120, 1, 1, 1 | F32 | blk.26.ffn_norm.weight
|
490 |
+
430: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.26.ffn_up_exps.weight
|
491 |
+
431: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.26.ffn_up_shexp.weight
|
492 |
+
432: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.27.attn_kv_a_mqa.weight
|
493 |
+
433: 512 | 512, 1, 1, 1 | F32 | blk.27.attn_kv_a_norm.weight
|
494 |
+
434: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.27.attn_kv_b.weight
|
495 |
+
435: 5120 | 5120, 1, 1, 1 | F32 | blk.27.attn_norm.weight
|
496 |
+
436: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.27.attn_output.weight
|
497 |
+
437: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.27.attn_q_a.weight
|
498 |
+
438: 1536 | 1536, 1, 1, 1 | F32 | blk.27.attn_q_a_norm.weight
|
499 |
+
439: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.27.attn_q_b.weight
|
500 |
+
440: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.27.ffn_down_exps.weight
|
501 |
+
441: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.27.ffn_down_shexp.weight
|
502 |
+
442: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.27.ffn_gate_exps.weight
|
503 |
+
443: 819200 | 5120, 160, 1, 1 | F32 | blk.27.ffn_gate_inp.weight
|
504 |
+
444: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.27.ffn_gate_shexp.weight
|
505 |
+
445: 5120 | 5120, 1, 1, 1 | F32 | blk.27.ffn_norm.weight
|
506 |
+
446: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.27.ffn_up_exps.weight
|
507 |
+
447: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.27.ffn_up_shexp.weight
|
508 |
+
448: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.28.attn_kv_a_mqa.weight
|
509 |
+
449: 512 | 512, 1, 1, 1 | F32 | blk.28.attn_kv_a_norm.weight
|
510 |
+
450: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.28.attn_kv_b.weight
|
511 |
+
451: 5120 | 5120, 1, 1, 1 | F32 | blk.28.attn_norm.weight
|
512 |
+
452: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.28.attn_output.weight
|
513 |
+
453: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.28.attn_q_a.weight
|
514 |
+
454: 1536 | 1536, 1, 1, 1 | F32 | blk.28.attn_q_a_norm.weight
|
515 |
+
455: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.28.attn_q_b.weight
|
516 |
+
456: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.28.ffn_down_exps.weight
|
517 |
+
457: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.28.ffn_down_shexp.weight
|
518 |
+
458: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.28.ffn_gate_exps.weight
|
519 |
+
459: 819200 | 5120, 160, 1, 1 | F32 | blk.28.ffn_gate_inp.weight
|
520 |
+
460: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.28.ffn_gate_shexp.weight
|
521 |
+
461: 5120 | 5120, 1, 1, 1 | F32 | blk.28.ffn_norm.weight
|
522 |
+
462: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.28.ffn_up_exps.weight
|
523 |
+
463: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.28.ffn_up_shexp.weight
|
524 |
+
464: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.29.attn_kv_a_mqa.weight
|
525 |
+
465: 512 | 512, 1, 1, 1 | F32 | blk.29.attn_kv_a_norm.weight
|
526 |
+
466: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.29.attn_kv_b.weight
|
527 |
+
467: 5120 | 5120, 1, 1, 1 | F32 | blk.29.attn_norm.weight
|
528 |
+
468: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.29.attn_output.weight
|
529 |
+
469: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.29.attn_q_a.weight
|
530 |
+
470: 1536 | 1536, 1, 1, 1 | F32 | blk.29.attn_q_a_norm.weight
|
531 |
+
471: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.29.attn_q_b.weight
|
532 |
+
472: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.29.ffn_down_exps.weight
|
533 |
+
473: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.29.ffn_down_shexp.weight
|
534 |
+
474: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.29.ffn_gate_exps.weight
|
535 |
+
475: 819200 | 5120, 160, 1, 1 | F32 | blk.29.ffn_gate_inp.weight
|
536 |
+
476: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.29.ffn_gate_shexp.weight
|
537 |
+
477: 5120 | 5120, 1, 1, 1 | F32 | blk.29.ffn_norm.weight
|
DeepSeek-v2.5-1210-UD-iq2_xxs-00002-of-00002.gguf.tensors.txt
ADDED
@@ -0,0 +1,492 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
INFO:gguf-dump:* Loading: DeepSeek-v2.5-1210-UD-iq2_xxs-00002-of-00002.gguf
|
2 |
+
* File is LITTLE endian, script is running on a LITTLE endian host.
|
3 |
+
* Dumping 6 key/value pair(s)
|
4 |
+
1: UINT32 | 1 | GGUF.version = 3
|
5 |
+
2: UINT64 | 1 | GGUF.tensor_count = 482
|
6 |
+
3: UINT64 | 1 | GGUF.kv_count = 3
|
7 |
+
4: UINT16 | 1 | split.no = 1
|
8 |
+
5: INT32 | 1 | split.tensors.count = 959
|
9 |
+
6: UINT16 | 1 | split.count = 2
|
10 |
+
* Dumping 482 tensor(s)
|
11 |
+
1: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.29.ffn_up_exps.weight
|
12 |
+
2: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.29.ffn_up_shexp.weight
|
13 |
+
3: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.30.attn_kv_a_mqa.weight
|
14 |
+
4: 512 | 512, 1, 1, 1 | F32 | blk.30.attn_kv_a_norm.weight
|
15 |
+
5: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.30.attn_kv_b.weight
|
16 |
+
6: 5120 | 5120, 1, 1, 1 | F32 | blk.30.attn_norm.weight
|
17 |
+
7: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.30.attn_output.weight
|
18 |
+
8: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.30.attn_q_a.weight
|
19 |
+
9: 1536 | 1536, 1, 1, 1 | F32 | blk.30.attn_q_a_norm.weight
|
20 |
+
10: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.30.attn_q_b.weight
|
21 |
+
11: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.30.ffn_down_exps.weight
|
22 |
+
12: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.30.ffn_down_shexp.weight
|
23 |
+
13: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.30.ffn_gate_exps.weight
|
24 |
+
14: 819200 | 5120, 160, 1, 1 | F32 | blk.30.ffn_gate_inp.weight
|
25 |
+
15: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.30.ffn_gate_shexp.weight
|
26 |
+
16: 5120 | 5120, 1, 1, 1 | F32 | blk.30.ffn_norm.weight
|
27 |
+
17: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.30.ffn_up_exps.weight
|
28 |
+
18: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.30.ffn_up_shexp.weight
|
29 |
+
19: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.31.attn_kv_a_mqa.weight
|
30 |
+
20: 512 | 512, 1, 1, 1 | F32 | blk.31.attn_kv_a_norm.weight
|
31 |
+
21: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.31.attn_kv_b.weight
|
32 |
+
22: 5120 | 5120, 1, 1, 1 | F32 | blk.31.attn_norm.weight
|
33 |
+
23: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.31.attn_output.weight
|
34 |
+
24: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.31.attn_q_a.weight
|
35 |
+
25: 1536 | 1536, 1, 1, 1 | F32 | blk.31.attn_q_a_norm.weight
|
36 |
+
26: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.31.attn_q_b.weight
|
37 |
+
27: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.31.ffn_down_exps.weight
|
38 |
+
28: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.31.ffn_down_shexp.weight
|
39 |
+
29: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.31.ffn_gate_exps.weight
|
40 |
+
30: 819200 | 5120, 160, 1, 1 | F32 | blk.31.ffn_gate_inp.weight
|
41 |
+
31: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.31.ffn_gate_shexp.weight
|
42 |
+
32: 5120 | 5120, 1, 1, 1 | F32 | blk.31.ffn_norm.weight
|
43 |
+
33: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.31.ffn_up_exps.weight
|
44 |
+
34: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.31.ffn_up_shexp.weight
|
45 |
+
35: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.32.attn_kv_a_mqa.weight
|
46 |
+
36: 512 | 512, 1, 1, 1 | F32 | blk.32.attn_kv_a_norm.weight
|
47 |
+
37: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.32.attn_kv_b.weight
|
48 |
+
38: 5120 | 5120, 1, 1, 1 | F32 | blk.32.attn_norm.weight
|
49 |
+
39: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.32.attn_output.weight
|
50 |
+
40: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.32.attn_q_a.weight
|
51 |
+
41: 1536 | 1536, 1, 1, 1 | F32 | blk.32.attn_q_a_norm.weight
|
52 |
+
42: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.32.attn_q_b.weight
|
53 |
+
43: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.32.ffn_down_exps.weight
|
54 |
+
44: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.32.ffn_down_shexp.weight
|
55 |
+
45: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.32.ffn_gate_exps.weight
|
56 |
+
46: 819200 | 5120, 160, 1, 1 | F32 | blk.32.ffn_gate_inp.weight
|
57 |
+
47: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.32.ffn_gate_shexp.weight
|
58 |
+
48: 5120 | 5120, 1, 1, 1 | F32 | blk.32.ffn_norm.weight
|
59 |
+
49: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.32.ffn_up_exps.weight
|
60 |
+
50: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.32.ffn_up_shexp.weight
|
61 |
+
51: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.33.attn_kv_a_mqa.weight
|
62 |
+
52: 512 | 512, 1, 1, 1 | F32 | blk.33.attn_kv_a_norm.weight
|
63 |
+
53: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.33.attn_kv_b.weight
|
64 |
+
54: 5120 | 5120, 1, 1, 1 | F32 | blk.33.attn_norm.weight
|
65 |
+
55: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.33.attn_output.weight
|
66 |
+
56: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.33.attn_q_a.weight
|
67 |
+
57: 1536 | 1536, 1, 1, 1 | F32 | blk.33.attn_q_a_norm.weight
|
68 |
+
58: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.33.attn_q_b.weight
|
69 |
+
59: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.33.ffn_down_exps.weight
|
70 |
+
60: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.33.ffn_down_shexp.weight
|
71 |
+
61: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.33.ffn_gate_exps.weight
|
72 |
+
62: 819200 | 5120, 160, 1, 1 | F32 | blk.33.ffn_gate_inp.weight
|
73 |
+
63: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.33.ffn_gate_shexp.weight
|
74 |
+
64: 5120 | 5120, 1, 1, 1 | F32 | blk.33.ffn_norm.weight
|
75 |
+
65: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.33.ffn_up_exps.weight
|
76 |
+
66: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.33.ffn_up_shexp.weight
|
77 |
+
67: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.34.attn_kv_a_mqa.weight
|
78 |
+
68: 512 | 512, 1, 1, 1 | F32 | blk.34.attn_kv_a_norm.weight
|
79 |
+
69: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.34.attn_kv_b.weight
|
80 |
+
70: 5120 | 5120, 1, 1, 1 | F32 | blk.34.attn_norm.weight
|
81 |
+
71: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.34.attn_output.weight
|
82 |
+
72: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.34.attn_q_a.weight
|
83 |
+
73: 1536 | 1536, 1, 1, 1 | F32 | blk.34.attn_q_a_norm.weight
|
84 |
+
74: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.34.attn_q_b.weight
|
85 |
+
75: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.34.ffn_down_exps.weight
|
86 |
+
76: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.34.ffn_down_shexp.weight
|
87 |
+
77: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.34.ffn_gate_exps.weight
|
88 |
+
78: 819200 | 5120, 160, 1, 1 | F32 | blk.34.ffn_gate_inp.weight
|
89 |
+
79: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.34.ffn_gate_shexp.weight
|
90 |
+
80: 5120 | 5120, 1, 1, 1 | F32 | blk.34.ffn_norm.weight
|
91 |
+
81: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.34.ffn_up_exps.weight
|
92 |
+
82: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.34.ffn_up_shexp.weight
|
93 |
+
83: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.35.attn_kv_a_mqa.weight
|
94 |
+
84: 512 | 512, 1, 1, 1 | F32 | blk.35.attn_kv_a_norm.weight
|
95 |
+
85: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.35.attn_kv_b.weight
|
96 |
+
86: 5120 | 5120, 1, 1, 1 | F32 | blk.35.attn_norm.weight
|
97 |
+
87: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.35.attn_output.weight
|
98 |
+
88: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.35.attn_q_a.weight
|
99 |
+
89: 1536 | 1536, 1, 1, 1 | F32 | blk.35.attn_q_a_norm.weight
|
100 |
+
90: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.35.attn_q_b.weight
|
101 |
+
91: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.35.ffn_down_exps.weight
|
102 |
+
92: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.35.ffn_down_shexp.weight
|
103 |
+
93: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.35.ffn_gate_exps.weight
|
104 |
+
94: 819200 | 5120, 160, 1, 1 | F32 | blk.35.ffn_gate_inp.weight
|
105 |
+
95: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.35.ffn_gate_shexp.weight
|
106 |
+
96: 5120 | 5120, 1, 1, 1 | F32 | blk.35.ffn_norm.weight
|
107 |
+
97: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.35.ffn_up_exps.weight
|
108 |
+
98: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.35.ffn_up_shexp.weight
|
109 |
+
99: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.36.attn_kv_a_mqa.weight
|
110 |
+
100: 512 | 512, 1, 1, 1 | F32 | blk.36.attn_kv_a_norm.weight
|
111 |
+
101: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.36.attn_kv_b.weight
|
112 |
+
102: 5120 | 5120, 1, 1, 1 | F32 | blk.36.attn_norm.weight
|
113 |
+
103: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.36.attn_output.weight
|
114 |
+
104: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.36.attn_q_a.weight
|
115 |
+
105: 1536 | 1536, 1, 1, 1 | F32 | blk.36.attn_q_a_norm.weight
|
116 |
+
106: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.36.attn_q_b.weight
|
117 |
+
107: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.36.ffn_down_exps.weight
|
118 |
+
108: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.36.ffn_down_shexp.weight
|
119 |
+
109: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.36.ffn_gate_exps.weight
|
120 |
+
110: 819200 | 5120, 160, 1, 1 | F32 | blk.36.ffn_gate_inp.weight
|
121 |
+
111: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.36.ffn_gate_shexp.weight
|
122 |
+
112: 5120 | 5120, 1, 1, 1 | F32 | blk.36.ffn_norm.weight
|
123 |
+
113: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.36.ffn_up_exps.weight
|
124 |
+
114: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.36.ffn_up_shexp.weight
|
125 |
+
115: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.37.attn_kv_a_mqa.weight
|
126 |
+
116: 512 | 512, 1, 1, 1 | F32 | blk.37.attn_kv_a_norm.weight
|
127 |
+
117: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.37.attn_kv_b.weight
|
128 |
+
118: 5120 | 5120, 1, 1, 1 | F32 | blk.37.attn_norm.weight
|
129 |
+
119: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.37.attn_output.weight
|
130 |
+
120: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.37.attn_q_a.weight
|
131 |
+
121: 1536 | 1536, 1, 1, 1 | F32 | blk.37.attn_q_a_norm.weight
|
132 |
+
122: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.37.attn_q_b.weight
|
133 |
+
123: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.37.ffn_down_exps.weight
|
134 |
+
124: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.37.ffn_down_shexp.weight
|
135 |
+
125: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.37.ffn_gate_exps.weight
|
136 |
+
126: 819200 | 5120, 160, 1, 1 | F32 | blk.37.ffn_gate_inp.weight
|
137 |
+
127: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.37.ffn_gate_shexp.weight
|
138 |
+
128: 5120 | 5120, 1, 1, 1 | F32 | blk.37.ffn_norm.weight
|
139 |
+
129: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.37.ffn_up_exps.weight
|
140 |
+
130: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.37.ffn_up_shexp.weight
|
141 |
+
131: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.38.attn_kv_a_mqa.weight
|
142 |
+
132: 512 | 512, 1, 1, 1 | F32 | blk.38.attn_kv_a_norm.weight
|
143 |
+
133: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.38.attn_kv_b.weight
|
144 |
+
134: 5120 | 5120, 1, 1, 1 | F32 | blk.38.attn_norm.weight
|
145 |
+
135: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.38.attn_output.weight
|
146 |
+
136: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.38.attn_q_a.weight
|
147 |
+
137: 1536 | 1536, 1, 1, 1 | F32 | blk.38.attn_q_a_norm.weight
|
148 |
+
138: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.38.attn_q_b.weight
|
149 |
+
139: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.38.ffn_down_exps.weight
|
150 |
+
140: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.38.ffn_down_shexp.weight
|
151 |
+
141: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.38.ffn_gate_exps.weight
|
152 |
+
142: 819200 | 5120, 160, 1, 1 | F32 | blk.38.ffn_gate_inp.weight
|
153 |
+
143: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.38.ffn_gate_shexp.weight
|
154 |
+
144: 5120 | 5120, 1, 1, 1 | F32 | blk.38.ffn_norm.weight
|
155 |
+
145: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.38.ffn_up_exps.weight
|
156 |
+
146: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.38.ffn_up_shexp.weight
|
157 |
+
147: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.39.attn_kv_a_mqa.weight
|
158 |
+
148: 512 | 512, 1, 1, 1 | F32 | blk.39.attn_kv_a_norm.weight
|
159 |
+
149: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.39.attn_kv_b.weight
|
160 |
+
150: 5120 | 5120, 1, 1, 1 | F32 | blk.39.attn_norm.weight
|
161 |
+
151: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.39.attn_output.weight
|
162 |
+
152: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.39.attn_q_a.weight
|
163 |
+
153: 1536 | 1536, 1, 1, 1 | F32 | blk.39.attn_q_a_norm.weight
|
164 |
+
154: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.39.attn_q_b.weight
|
165 |
+
155: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.39.ffn_down_exps.weight
|
166 |
+
156: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.39.ffn_down_shexp.weight
|
167 |
+
157: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.39.ffn_gate_exps.weight
|
168 |
+
158: 819200 | 5120, 160, 1, 1 | F32 | blk.39.ffn_gate_inp.weight
|
169 |
+
159: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.39.ffn_gate_shexp.weight
|
170 |
+
160: 5120 | 5120, 1, 1, 1 | F32 | blk.39.ffn_norm.weight
|
171 |
+
161: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.39.ffn_up_exps.weight
|
172 |
+
162: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.39.ffn_up_shexp.weight
|
173 |
+
163: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.40.attn_kv_a_mqa.weight
|
174 |
+
164: 512 | 512, 1, 1, 1 | F32 | blk.40.attn_kv_a_norm.weight
|
175 |
+
165: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.40.attn_kv_b.weight
|
176 |
+
166: 5120 | 5120, 1, 1, 1 | F32 | blk.40.attn_norm.weight
|
177 |
+
167: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.40.attn_output.weight
|
178 |
+
168: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.40.attn_q_a.weight
|
179 |
+
169: 1536 | 1536, 1, 1, 1 | F32 | blk.40.attn_q_a_norm.weight
|
180 |
+
170: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.40.attn_q_b.weight
|
181 |
+
171: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.40.ffn_down_exps.weight
|
182 |
+
172: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.40.ffn_down_shexp.weight
|
183 |
+
173: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.40.ffn_gate_exps.weight
|
184 |
+
174: 819200 | 5120, 160, 1, 1 | F32 | blk.40.ffn_gate_inp.weight
|
185 |
+
175: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.40.ffn_gate_shexp.weight
|
186 |
+
176: 5120 | 5120, 1, 1, 1 | F32 | blk.40.ffn_norm.weight
|
187 |
+
177: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.40.ffn_up_exps.weight
|
188 |
+
178: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.40.ffn_up_shexp.weight
|
189 |
+
179: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.41.attn_kv_a_mqa.weight
|
190 |
+
180: 512 | 512, 1, 1, 1 | F32 | blk.41.attn_kv_a_norm.weight
|
191 |
+
181: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.41.attn_kv_b.weight
|
192 |
+
182: 5120 | 5120, 1, 1, 1 | F32 | blk.41.attn_norm.weight
|
193 |
+
183: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.41.attn_output.weight
|
194 |
+
184: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.41.attn_q_a.weight
|
195 |
+
185: 1536 | 1536, 1, 1, 1 | F32 | blk.41.attn_q_a_norm.weight
|
196 |
+
186: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.41.attn_q_b.weight
|
197 |
+
187: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.41.ffn_down_exps.weight
|
198 |
+
188: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.41.ffn_down_shexp.weight
|
199 |
+
189: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.41.ffn_gate_exps.weight
|
200 |
+
190: 819200 | 5120, 160, 1, 1 | F32 | blk.41.ffn_gate_inp.weight
|
201 |
+
191: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.41.ffn_gate_shexp.weight
|
202 |
+
192: 5120 | 5120, 1, 1, 1 | F32 | blk.41.ffn_norm.weight
|
203 |
+
193: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.41.ffn_up_exps.weight
|
204 |
+
194: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.41.ffn_up_shexp.weight
|
205 |
+
195: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.42.attn_kv_a_mqa.weight
|
206 |
+
196: 512 | 512, 1, 1, 1 | F32 | blk.42.attn_kv_a_norm.weight
|
207 |
+
197: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.42.attn_kv_b.weight
|
208 |
+
198: 5120 | 5120, 1, 1, 1 | F32 | blk.42.attn_norm.weight
|
209 |
+
199: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.42.attn_output.weight
|
210 |
+
200: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.42.attn_q_a.weight
|
211 |
+
201: 1536 | 1536, 1, 1, 1 | F32 | blk.42.attn_q_a_norm.weight
|
212 |
+
202: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.42.attn_q_b.weight
|
213 |
+
203: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.42.ffn_down_exps.weight
|
214 |
+
204: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.42.ffn_down_shexp.weight
|
215 |
+
205: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.42.ffn_gate_exps.weight
|
216 |
+
206: 819200 | 5120, 160, 1, 1 | F32 | blk.42.ffn_gate_inp.weight
|
217 |
+
207: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.42.ffn_gate_shexp.weight
|
218 |
+
208: 5120 | 5120, 1, 1, 1 | F32 | blk.42.ffn_norm.weight
|
219 |
+
209: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.42.ffn_up_exps.weight
|
220 |
+
210: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.42.ffn_up_shexp.weight
|
221 |
+
211: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.43.attn_kv_a_mqa.weight
|
222 |
+
212: 512 | 512, 1, 1, 1 | F32 | blk.43.attn_kv_a_norm.weight
|
223 |
+
213: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.43.attn_kv_b.weight
|
224 |
+
214: 5120 | 5120, 1, 1, 1 | F32 | blk.43.attn_norm.weight
|
225 |
+
215: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.43.attn_output.weight
|
226 |
+
216: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.43.attn_q_a.weight
|
227 |
+
217: 1536 | 1536, 1, 1, 1 | F32 | blk.43.attn_q_a_norm.weight
|
228 |
+
218: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.43.attn_q_b.weight
|
229 |
+
219: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.43.ffn_down_exps.weight
|
230 |
+
220: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.43.ffn_down_shexp.weight
|
231 |
+
221: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.43.ffn_gate_exps.weight
|
232 |
+
222: 819200 | 5120, 160, 1, 1 | F32 | blk.43.ffn_gate_inp.weight
|
233 |
+
223: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.43.ffn_gate_shexp.weight
|
234 |
+
224: 5120 | 5120, 1, 1, 1 | F32 | blk.43.ffn_norm.weight
|
235 |
+
225: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.43.ffn_up_exps.weight
|
236 |
+
226: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.43.ffn_up_shexp.weight
|
237 |
+
227: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.44.attn_kv_a_mqa.weight
|
238 |
+
228: 512 | 512, 1, 1, 1 | F32 | blk.44.attn_kv_a_norm.weight
|
239 |
+
229: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.44.attn_kv_b.weight
|
240 |
+
230: 5120 | 5120, 1, 1, 1 | F32 | blk.44.attn_norm.weight
|
241 |
+
231: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.44.attn_output.weight
|
242 |
+
232: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.44.attn_q_a.weight
|
243 |
+
233: 1536 | 1536, 1, 1, 1 | F32 | blk.44.attn_q_a_norm.weight
|
244 |
+
234: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.44.attn_q_b.weight
|
245 |
+
235: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.44.ffn_down_exps.weight
|
246 |
+
236: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.44.ffn_down_shexp.weight
|
247 |
+
237: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.44.ffn_gate_exps.weight
|
248 |
+
238: 819200 | 5120, 160, 1, 1 | F32 | blk.44.ffn_gate_inp.weight
|
249 |
+
239: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.44.ffn_gate_shexp.weight
|
250 |
+
240: 5120 | 5120, 1, 1, 1 | F32 | blk.44.ffn_norm.weight
|
251 |
+
241: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.44.ffn_up_exps.weight
|
252 |
+
242: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.44.ffn_up_shexp.weight
|
253 |
+
243: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.45.attn_kv_a_mqa.weight
|
254 |
+
244: 512 | 512, 1, 1, 1 | F32 | blk.45.attn_kv_a_norm.weight
|
255 |
+
245: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.45.attn_kv_b.weight
|
256 |
+
246: 5120 | 5120, 1, 1, 1 | F32 | blk.45.attn_norm.weight
|
257 |
+
247: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.45.attn_output.weight
|
258 |
+
248: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.45.attn_q_a.weight
|
259 |
+
249: 1536 | 1536, 1, 1, 1 | F32 | blk.45.attn_q_a_norm.weight
|
260 |
+
250: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.45.attn_q_b.weight
|
261 |
+
251: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.45.ffn_down_exps.weight
|
262 |
+
252: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.45.ffn_down_shexp.weight
|
263 |
+
253: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.45.ffn_gate_exps.weight
|
264 |
+
254: 819200 | 5120, 160, 1, 1 | F32 | blk.45.ffn_gate_inp.weight
|
265 |
+
255: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.45.ffn_gate_shexp.weight
|
266 |
+
256: 5120 | 5120, 1, 1, 1 | F32 | blk.45.ffn_norm.weight
|
267 |
+
257: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.45.ffn_up_exps.weight
|
268 |
+
258: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.45.ffn_up_shexp.weight
|
269 |
+
259: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.46.attn_kv_a_mqa.weight
|
270 |
+
260: 512 | 512, 1, 1, 1 | F32 | blk.46.attn_kv_a_norm.weight
|
271 |
+
261: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.46.attn_kv_b.weight
|
272 |
+
262: 5120 | 5120, 1, 1, 1 | F32 | blk.46.attn_norm.weight
|
273 |
+
263: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.46.attn_output.weight
|
274 |
+
264: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.46.attn_q_a.weight
|
275 |
+
265: 1536 | 1536, 1, 1, 1 | F32 | blk.46.attn_q_a_norm.weight
|
276 |
+
266: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.46.attn_q_b.weight
|
277 |
+
267: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.46.ffn_down_exps.weight
|
278 |
+
268: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.46.ffn_down_shexp.weight
|
279 |
+
269: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.46.ffn_gate_exps.weight
|
280 |
+
270: 819200 | 5120, 160, 1, 1 | F32 | blk.46.ffn_gate_inp.weight
|
281 |
+
271: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.46.ffn_gate_shexp.weight
|
282 |
+
272: 5120 | 5120, 1, 1, 1 | F32 | blk.46.ffn_norm.weight
|
283 |
+
273: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.46.ffn_up_exps.weight
|
284 |
+
274: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.46.ffn_up_shexp.weight
|
285 |
+
275: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.47.attn_kv_a_mqa.weight
|
286 |
+
276: 512 | 512, 1, 1, 1 | F32 | blk.47.attn_kv_a_norm.weight
|
287 |
+
277: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.47.attn_kv_b.weight
|
288 |
+
278: 5120 | 5120, 1, 1, 1 | F32 | blk.47.attn_norm.weight
|
289 |
+
279: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.47.attn_output.weight
|
290 |
+
280: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.47.attn_q_a.weight
|
291 |
+
281: 1536 | 1536, 1, 1, 1 | F32 | blk.47.attn_q_a_norm.weight
|
292 |
+
282: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.47.attn_q_b.weight
|
293 |
+
283: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.47.ffn_down_exps.weight
|
294 |
+
284: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.47.ffn_down_shexp.weight
|
295 |
+
285: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.47.ffn_gate_exps.weight
|
296 |
+
286: 819200 | 5120, 160, 1, 1 | F32 | blk.47.ffn_gate_inp.weight
|
297 |
+
287: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.47.ffn_gate_shexp.weight
|
298 |
+
288: 5120 | 5120, 1, 1, 1 | F32 | blk.47.ffn_norm.weight
|
299 |
+
289: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.47.ffn_up_exps.weight
|
300 |
+
290: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.47.ffn_up_shexp.weight
|
301 |
+
291: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.48.attn_kv_a_mqa.weight
|
302 |
+
292: 512 | 512, 1, 1, 1 | F32 | blk.48.attn_kv_a_norm.weight
|
303 |
+
293: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.48.attn_kv_b.weight
|
304 |
+
294: 5120 | 5120, 1, 1, 1 | F32 | blk.48.attn_norm.weight
|
305 |
+
295: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.48.attn_output.weight
|
306 |
+
296: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.48.attn_q_a.weight
|
307 |
+
297: 1536 | 1536, 1, 1, 1 | F32 | blk.48.attn_q_a_norm.weight
|
308 |
+
298: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.48.attn_q_b.weight
|
309 |
+
299: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.48.ffn_down_exps.weight
|
310 |
+
300: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.48.ffn_down_shexp.weight
|
311 |
+
301: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.48.ffn_gate_exps.weight
|
312 |
+
302: 819200 | 5120, 160, 1, 1 | F32 | blk.48.ffn_gate_inp.weight
|
313 |
+
303: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.48.ffn_gate_shexp.weight
|
314 |
+
304: 5120 | 5120, 1, 1, 1 | F32 | blk.48.ffn_norm.weight
|
315 |
+
305: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.48.ffn_up_exps.weight
|
316 |
+
306: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.48.ffn_up_shexp.weight
|
317 |
+
307: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.49.attn_kv_a_mqa.weight
|
318 |
+
308: 512 | 512, 1, 1, 1 | F32 | blk.49.attn_kv_a_norm.weight
|
319 |
+
309: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.49.attn_kv_b.weight
|
320 |
+
310: 5120 | 5120, 1, 1, 1 | F32 | blk.49.attn_norm.weight
|
321 |
+
311: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.49.attn_output.weight
|
322 |
+
312: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.49.attn_q_a.weight
|
323 |
+
313: 1536 | 1536, 1, 1, 1 | F32 | blk.49.attn_q_a_norm.weight
|
324 |
+
314: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.49.attn_q_b.weight
|
325 |
+
315: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.49.ffn_down_exps.weight
|
326 |
+
316: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.49.ffn_down_shexp.weight
|
327 |
+
317: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.49.ffn_gate_exps.weight
|
328 |
+
318: 819200 | 5120, 160, 1, 1 | F32 | blk.49.ffn_gate_inp.weight
|
329 |
+
319: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.49.ffn_gate_shexp.weight
|
330 |
+
320: 5120 | 5120, 1, 1, 1 | F32 | blk.49.ffn_norm.weight
|
331 |
+
321: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.49.ffn_up_exps.weight
|
332 |
+
322: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.49.ffn_up_shexp.weight
|
333 |
+
323: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.50.attn_kv_a_mqa.weight
|
334 |
+
324: 512 | 512, 1, 1, 1 | F32 | blk.50.attn_kv_a_norm.weight
|
335 |
+
325: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.50.attn_kv_b.weight
|
336 |
+
326: 5120 | 5120, 1, 1, 1 | F32 | blk.50.attn_norm.weight
|
337 |
+
327: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.50.attn_output.weight
|
338 |
+
328: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.50.attn_q_a.weight
|
339 |
+
329: 1536 | 1536, 1, 1, 1 | F32 | blk.50.attn_q_a_norm.weight
|
340 |
+
330: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.50.attn_q_b.weight
|
341 |
+
331: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.50.ffn_down_exps.weight
|
342 |
+
332: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.50.ffn_down_shexp.weight
|
343 |
+
333: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.50.ffn_gate_exps.weight
|
344 |
+
334: 819200 | 5120, 160, 1, 1 | F32 | blk.50.ffn_gate_inp.weight
|
345 |
+
335: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.50.ffn_gate_shexp.weight
|
346 |
+
336: 5120 | 5120, 1, 1, 1 | F32 | blk.50.ffn_norm.weight
|
347 |
+
337: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.50.ffn_up_exps.weight
|
348 |
+
338: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.50.ffn_up_shexp.weight
|
349 |
+
339: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.51.attn_kv_a_mqa.weight
|
350 |
+
340: 512 | 512, 1, 1, 1 | F32 | blk.51.attn_kv_a_norm.weight
|
351 |
+
341: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.51.attn_kv_b.weight
|
352 |
+
342: 5120 | 5120, 1, 1, 1 | F32 | blk.51.attn_norm.weight
|
353 |
+
343: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.51.attn_output.weight
|
354 |
+
344: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.51.attn_q_a.weight
|
355 |
+
345: 1536 | 1536, 1, 1, 1 | F32 | blk.51.attn_q_a_norm.weight
|
356 |
+
346: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.51.attn_q_b.weight
|
357 |
+
347: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.51.ffn_down_exps.weight
|
358 |
+
348: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.51.ffn_down_shexp.weight
|
359 |
+
349: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.51.ffn_gate_exps.weight
|
360 |
+
350: 819200 | 5120, 160, 1, 1 | F32 | blk.51.ffn_gate_inp.weight
|
361 |
+
351: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.51.ffn_gate_shexp.weight
|
362 |
+
352: 5120 | 5120, 1, 1, 1 | F32 | blk.51.ffn_norm.weight
|
363 |
+
353: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.51.ffn_up_exps.weight
|
364 |
+
354: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.51.ffn_up_shexp.weight
|
365 |
+
355: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.52.attn_kv_a_mqa.weight
|
366 |
+
356: 512 | 512, 1, 1, 1 | F32 | blk.52.attn_kv_a_norm.weight
|
367 |
+
357: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.52.attn_kv_b.weight
|
368 |
+
358: 5120 | 5120, 1, 1, 1 | F32 | blk.52.attn_norm.weight
|
369 |
+
359: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.52.attn_output.weight
|
370 |
+
360: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.52.attn_q_a.weight
|
371 |
+
361: 1536 | 1536, 1, 1, 1 | F32 | blk.52.attn_q_a_norm.weight
|
372 |
+
362: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.52.attn_q_b.weight
|
373 |
+
363: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.52.ffn_down_exps.weight
|
374 |
+
364: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.52.ffn_down_shexp.weight
|
375 |
+
365: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.52.ffn_gate_exps.weight
|
376 |
+
366: 819200 | 5120, 160, 1, 1 | F32 | blk.52.ffn_gate_inp.weight
|
377 |
+
367: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.52.ffn_gate_shexp.weight
|
378 |
+
368: 5120 | 5120, 1, 1, 1 | F32 | blk.52.ffn_norm.weight
|
379 |
+
369: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.52.ffn_up_exps.weight
|
380 |
+
370: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.52.ffn_up_shexp.weight
|
381 |
+
371: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.53.attn_kv_a_mqa.weight
|
382 |
+
372: 512 | 512, 1, 1, 1 | F32 | blk.53.attn_kv_a_norm.weight
|
383 |
+
373: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.53.attn_kv_b.weight
|
384 |
+
374: 5120 | 5120, 1, 1, 1 | F32 | blk.53.attn_norm.weight
|
385 |
+
375: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.53.attn_output.weight
|
386 |
+
376: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.53.attn_q_a.weight
|
387 |
+
377: 1536 | 1536, 1, 1, 1 | F32 | blk.53.attn_q_a_norm.weight
|
388 |
+
378: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.53.attn_q_b.weight
|
389 |
+
379: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.53.ffn_down_exps.weight
|
390 |
+
380: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.53.ffn_down_shexp.weight
|
391 |
+
381: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.53.ffn_gate_exps.weight
|
392 |
+
382: 819200 | 5120, 160, 1, 1 | F32 | blk.53.ffn_gate_inp.weight
|
393 |
+
383: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.53.ffn_gate_shexp.weight
|
394 |
+
384: 5120 | 5120, 1, 1, 1 | F32 | blk.53.ffn_norm.weight
|
395 |
+
385: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.53.ffn_up_exps.weight
|
396 |
+
386: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.53.ffn_up_shexp.weight
|
397 |
+
387: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.54.attn_kv_a_mqa.weight
|
398 |
+
388: 512 | 512, 1, 1, 1 | F32 | blk.54.attn_kv_a_norm.weight
|
399 |
+
389: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.54.attn_kv_b.weight
|
400 |
+
390: 5120 | 5120, 1, 1, 1 | F32 | blk.54.attn_norm.weight
|
401 |
+
391: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.54.attn_output.weight
|
402 |
+
392: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.54.attn_q_a.weight
|
403 |
+
393: 1536 | 1536, 1, 1, 1 | F32 | blk.54.attn_q_a_norm.weight
|
404 |
+
394: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.54.attn_q_b.weight
|
405 |
+
395: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.54.ffn_down_exps.weight
|
406 |
+
396: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.54.ffn_down_shexp.weight
|
407 |
+
397: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.54.ffn_gate_exps.weight
|
408 |
+
398: 819200 | 5120, 160, 1, 1 | F32 | blk.54.ffn_gate_inp.weight
|
409 |
+
399: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.54.ffn_gate_shexp.weight
|
410 |
+
400: 5120 | 5120, 1, 1, 1 | F32 | blk.54.ffn_norm.weight
|
411 |
+
401: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.54.ffn_up_exps.weight
|
412 |
+
402: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.54.ffn_up_shexp.weight
|
413 |
+
403: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.55.attn_kv_a_mqa.weight
|
414 |
+
404: 512 | 512, 1, 1, 1 | F32 | blk.55.attn_kv_a_norm.weight
|
415 |
+
405: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.55.attn_kv_b.weight
|
416 |
+
406: 5120 | 5120, 1, 1, 1 | F32 | blk.55.attn_norm.weight
|
417 |
+
407: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.55.attn_output.weight
|
418 |
+
408: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.55.attn_q_a.weight
|
419 |
+
409: 1536 | 1536, 1, 1, 1 | F32 | blk.55.attn_q_a_norm.weight
|
420 |
+
410: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.55.attn_q_b.weight
|
421 |
+
411: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.55.ffn_down_exps.weight
|
422 |
+
412: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.55.ffn_down_shexp.weight
|
423 |
+
413: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.55.ffn_gate_exps.weight
|
424 |
+
414: 819200 | 5120, 160, 1, 1 | F32 | blk.55.ffn_gate_inp.weight
|
425 |
+
415: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.55.ffn_gate_shexp.weight
|
426 |
+
416: 5120 | 5120, 1, 1, 1 | F32 | blk.55.ffn_norm.weight
|
427 |
+
417: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.55.ffn_up_exps.weight
|
428 |
+
418: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.55.ffn_up_shexp.weight
|
429 |
+
419: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.56.attn_kv_a_mqa.weight
|
430 |
+
420: 512 | 512, 1, 1, 1 | F32 | blk.56.attn_kv_a_norm.weight
|
431 |
+
421: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.56.attn_kv_b.weight
|
432 |
+
422: 5120 | 5120, 1, 1, 1 | F32 | blk.56.attn_norm.weight
|
433 |
+
423: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.56.attn_output.weight
|
434 |
+
424: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.56.attn_q_a.weight
|
435 |
+
425: 1536 | 1536, 1, 1, 1 | F32 | blk.56.attn_q_a_norm.weight
|
436 |
+
426: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.56.attn_q_b.weight
|
437 |
+
427: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.56.ffn_down_exps.weight
|
438 |
+
428: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.56.ffn_down_shexp.weight
|
439 |
+
429: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.56.ffn_gate_exps.weight
|
440 |
+
430: 819200 | 5120, 160, 1, 1 | F32 | blk.56.ffn_gate_inp.weight
|
441 |
+
431: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.56.ffn_gate_shexp.weight
|
442 |
+
432: 5120 | 5120, 1, 1, 1 | F32 | blk.56.ffn_norm.weight
|
443 |
+
433: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.56.ffn_up_exps.weight
|
444 |
+
434: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.56.ffn_up_shexp.weight
|
445 |
+
435: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.57.attn_kv_a_mqa.weight
|
446 |
+
436: 512 | 512, 1, 1, 1 | F32 | blk.57.attn_kv_a_norm.weight
|
447 |
+
437: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.57.attn_kv_b.weight
|
448 |
+
438: 5120 | 5120, 1, 1, 1 | F32 | blk.57.attn_norm.weight
|
449 |
+
439: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.57.attn_output.weight
|
450 |
+
440: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.57.attn_q_a.weight
|
451 |
+
441: 1536 | 1536, 1, 1, 1 | F32 | blk.57.attn_q_a_norm.weight
|
452 |
+
442: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.57.attn_q_b.weight
|
453 |
+
443: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.57.ffn_down_exps.weight
|
454 |
+
444: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.57.ffn_down_shexp.weight
|
455 |
+
445: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.57.ffn_gate_exps.weight
|
456 |
+
446: 819200 | 5120, 160, 1, 1 | F32 | blk.57.ffn_gate_inp.weight
|
457 |
+
447: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.57.ffn_gate_shexp.weight
|
458 |
+
448: 5120 | 5120, 1, 1, 1 | F32 | blk.57.ffn_norm.weight
|
459 |
+
449: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.57.ffn_up_exps.weight
|
460 |
+
450: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.57.ffn_up_shexp.weight
|
461 |
+
451: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.58.attn_kv_a_mqa.weight
|
462 |
+
452: 512 | 512, 1, 1, 1 | F32 | blk.58.attn_kv_a_norm.weight
|
463 |
+
453: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.58.attn_kv_b.weight
|
464 |
+
454: 5120 | 5120, 1, 1, 1 | F32 | blk.58.attn_norm.weight
|
465 |
+
455: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.58.attn_output.weight
|
466 |
+
456: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.58.attn_q_a.weight
|
467 |
+
457: 1536 | 1536, 1, 1, 1 | F32 | blk.58.attn_q_a_norm.weight
|
468 |
+
458: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.58.attn_q_b.weight
|
469 |
+
459: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.58.ffn_down_exps.weight
|
470 |
+
460: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.58.ffn_down_shexp.weight
|
471 |
+
461: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.58.ffn_gate_exps.weight
|
472 |
+
462: 819200 | 5120, 160, 1, 1 | F32 | blk.58.ffn_gate_inp.weight
|
473 |
+
463: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.58.ffn_gate_shexp.weight
|
474 |
+
464: 5120 | 5120, 1, 1, 1 | F32 | blk.58.ffn_norm.weight
|
475 |
+
465: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.58.ffn_up_exps.weight
|
476 |
+
466: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.58.ffn_up_shexp.weight
|
477 |
+
467: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.59.attn_kv_a_mqa.weight
|
478 |
+
468: 512 | 512, 1, 1, 1 | F32 | blk.59.attn_kv_a_norm.weight
|
479 |
+
469: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.59.attn_kv_b.weight
|
480 |
+
470: 5120 | 5120, 1, 1, 1 | F32 | blk.59.attn_norm.weight
|
481 |
+
471: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.59.attn_output.weight
|
482 |
+
472: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.59.attn_q_a.weight
|
483 |
+
473: 1536 | 1536, 1, 1, 1 | F32 | blk.59.attn_q_a_norm.weight
|
484 |
+
474: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.59.attn_q_b.weight
|
485 |
+
475: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.59.ffn_down_exps.weight
|
486 |
+
476: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.59.ffn_down_shexp.weight
|
487 |
+
477: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.59.ffn_gate_exps.weight
|
488 |
+
478: 819200 | 5120, 160, 1, 1 | F32 | blk.59.ffn_gate_inp.weight
|
489 |
+
479: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.59.ffn_gate_shexp.weight
|
490 |
+
480: 5120 | 5120, 1, 1, 1 | F32 | blk.59.ffn_norm.weight
|
491 |
+
481: 1258291200 | 5120, 1536, 160, 1 | IQ2_XXS | blk.59.ffn_up_exps.weight
|
492 |
+
482: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.59.ffn_up_shexp.weight
|
DeepSeek-v2.5-1210-UD-iq3_m-00001-of-00003.gguf.tensors.txt
ADDED
@@ -0,0 +1,380 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
INFO:gguf-dump:* Loading: DeepSeek-v2.5-1210-UD-iq3_m-00001-of-00003.gguf
|
2 |
+
* File is LITTLE endian, script is running on a LITTLE endian host.
|
3 |
+
* Dumping 56 key/value pair(s)
|
4 |
+
1: UINT32 | 1 | GGUF.version = 3
|
5 |
+
2: UINT64 | 1 | GGUF.tensor_count = 320
|
6 |
+
3: UINT64 | 1 | GGUF.kv_count = 53
|
7 |
+
4: STRING | 1 | general.architecture = 'deepseek2'
|
8 |
+
5: STRING | 1 | general.type = 'model'
|
9 |
+
6: STRING | 1 | general.name = 'Dsv25'
|
10 |
+
7: STRING | 1 | general.size_label = '160x14B'
|
11 |
+
8: STRING | 1 | general.license = 'other'
|
12 |
+
9: STRING | 1 | general.license.name = 'deepseek'
|
13 |
+
10: STRING | 1 | general.license.link = 'https://github.com/deepseek-ai/DeepSeek-V2/blob/main/LICENSE'
|
14 |
+
11: UINT32 | 1 | deepseek2.block_count = 60
|
15 |
+
12: UINT32 | 1 | deepseek2.context_length = 163840
|
16 |
+
13: UINT32 | 1 | deepseek2.embedding_length = 5120
|
17 |
+
14: UINT32 | 1 | deepseek2.feed_forward_length = 12288
|
18 |
+
15: UINT32 | 1 | deepseek2.attention.head_count = 128
|
19 |
+
16: UINT32 | 1 | deepseek2.attention.head_count_kv = 128
|
20 |
+
17: FLOAT32 | 1 | deepseek2.rope.freq_base = 10000.0
|
21 |
+
18: FLOAT32 | 1 | deepseek2.attention.layer_norm_rms_epsilon = 9.999999974752427e-07
|
22 |
+
19: UINT32 | 1 | deepseek2.expert_used_count = 6
|
23 |
+
20: UINT32 | 1 | deepseek2.leading_dense_block_count = 1
|
24 |
+
21: UINT32 | 1 | deepseek2.vocab_size = 102400
|
25 |
+
22: UINT32 | 1 | deepseek2.attention.q_lora_rank = 1536
|
26 |
+
23: UINT32 | 1 | deepseek2.attention.kv_lora_rank = 512
|
27 |
+
24: UINT32 | 1 | deepseek2.attention.key_length = 192
|
28 |
+
25: UINT32 | 1 | deepseek2.attention.value_length = 128
|
29 |
+
26: UINT32 | 1 | deepseek2.expert_feed_forward_length = 1536
|
30 |
+
27: UINT32 | 1 | deepseek2.expert_count = 160
|
31 |
+
28: UINT32 | 1 | deepseek2.expert_shared_count = 2
|
32 |
+
29: FLOAT32 | 1 | deepseek2.expert_weights_scale = 16.0
|
33 |
+
30: BOOL | 1 | deepseek2.expert_weights_norm = False
|
34 |
+
31: UINT32 | 1 | deepseek2.expert_gating_func = 1
|
35 |
+
32: UINT32 | 1 | deepseek2.rope.dimension_count = 64
|
36 |
+
33: STRING | 1 | deepseek2.rope.scaling.type = 'yarn'
|
37 |
+
34: FLOAT32 | 1 | deepseek2.rope.scaling.factor = 40.0
|
38 |
+
35: UINT32 | 1 | deepseek2.rope.scaling.original_context_length = 4096
|
39 |
+
36: FLOAT32 | 1 | deepseek2.rope.scaling.yarn_log_multiplier = 0.10000000149011612
|
40 |
+
37: STRING | 1 | tokenizer.ggml.model = 'gpt2'
|
41 |
+
38: STRING | 1 | tokenizer.ggml.pre = 'deepseek-llm'
|
42 |
+
39: [STRING] | 102400 | tokenizer.ggml.tokens
|
43 |
+
40: [INT32] | 102400 | tokenizer.ggml.token_type
|
44 |
+
41: [STRING] | 99757 | tokenizer.ggml.merges
|
45 |
+
42: UINT32 | 1 | tokenizer.ggml.bos_token_id = 100000
|
46 |
+
43: UINT32 | 1 | tokenizer.ggml.eos_token_id = 100001
|
47 |
+
44: UINT32 | 1 | tokenizer.ggml.padding_token_id = 100001
|
48 |
+
45: BOOL | 1 | tokenizer.ggml.add_bos_token = True
|
49 |
+
46: BOOL | 1 | tokenizer.ggml.add_eos_token = False
|
50 |
+
47: STRING | 1 | tokenizer.chat_template = '{% if not add_generation_prompt is defined %}{% set add_gene'
|
51 |
+
48: UINT32 | 1 | general.quantization_version = 2
|
52 |
+
49: UINT32 | 1 | general.file_type = 27
|
53 |
+
50: STRING | 1 | quantize.imatrix.file = '/archive/nuc/LLM/raw/imatrix-DeepSeek-V2.5-1210-bartowski.da'
|
54 |
+
51: STRING | 1 | quantize.imatrix.dataset = '/training_dir/calibration_datav3.txt'
|
55 |
+
52: INT32 | 1 | quantize.imatrix.entries_count = 716
|
56 |
+
53: INT32 | 1 | quantize.imatrix.chunks_count = 139
|
57 |
+
54: UINT16 | 1 | split.no = 0
|
58 |
+
55: INT32 | 1 | split.tensors.count = 959
|
59 |
+
56: UINT16 | 1 | split.count = 3
|
60 |
+
* Dumping 320 tensor(s)
|
61 |
+
1: 524288000 | 5120, 102400, 1, 1 | Q6_K | output.weight
|
62 |
+
2: 5120 | 5120, 1, 1, 1 | F32 | output_norm.weight
|
63 |
+
3: 524288000 | 5120, 102400, 1, 1 | Q6_K | token_embd.weight
|
64 |
+
4: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.0.attn_kv_a_mqa.weight
|
65 |
+
5: 512 | 512, 1, 1, 1 | F32 | blk.0.attn_kv_a_norm.weight
|
66 |
+
6: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.0.attn_kv_b.weight
|
67 |
+
7: 5120 | 5120, 1, 1, 1 | F32 | blk.0.attn_norm.weight
|
68 |
+
8: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.0.attn_output.weight
|
69 |
+
9: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.0.attn_q_a.weight
|
70 |
+
10: 1536 | 1536, 1, 1, 1 | F32 | blk.0.attn_q_a_norm.weight
|
71 |
+
11: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.0.attn_q_b.weight
|
72 |
+
12: 62914560 | 12288, 5120, 1, 1 | Q6_K | blk.0.ffn_down.weight
|
73 |
+
13: 62914560 | 5120, 12288, 1, 1 | Q4_K | blk.0.ffn_gate.weight
|
74 |
+
14: 5120 | 5120, 1, 1, 1 | F32 | blk.0.ffn_norm.weight
|
75 |
+
15: 62914560 | 5120, 12288, 1, 1 | Q4_K | blk.0.ffn_up.weight
|
76 |
+
16: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.1.attn_kv_a_mqa.weight
|
77 |
+
17: 512 | 512, 1, 1, 1 | F32 | blk.1.attn_kv_a_norm.weight
|
78 |
+
18: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.1.attn_kv_b.weight
|
79 |
+
19: 5120 | 5120, 1, 1, 1 | F32 | blk.1.attn_norm.weight
|
80 |
+
20: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.1.attn_output.weight
|
81 |
+
21: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.1.attn_q_a.weight
|
82 |
+
22: 1536 | 1536, 1, 1, 1 | F32 | blk.1.attn_q_a_norm.weight
|
83 |
+
23: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.1.attn_q_b.weight
|
84 |
+
24: 1258291200 | 1536, 5120, 160, 1 | Q4_K | blk.1.ffn_down_exps.weight
|
85 |
+
25: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.1.ffn_down_shexp.weight
|
86 |
+
26: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.1.ffn_gate_exps.weight
|
87 |
+
27: 819200 | 5120, 160, 1, 1 | F32 | blk.1.ffn_gate_inp.weight
|
88 |
+
28: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.1.ffn_gate_shexp.weight
|
89 |
+
29: 5120 | 5120, 1, 1, 1 | F32 | blk.1.ffn_norm.weight
|
90 |
+
30: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.1.ffn_up_exps.weight
|
91 |
+
31: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.1.ffn_up_shexp.weight
|
92 |
+
32: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.2.attn_kv_a_mqa.weight
|
93 |
+
33: 512 | 512, 1, 1, 1 | F32 | blk.2.attn_kv_a_norm.weight
|
94 |
+
34: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.2.attn_kv_b.weight
|
95 |
+
35: 5120 | 5120, 1, 1, 1 | F32 | blk.2.attn_norm.weight
|
96 |
+
36: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.2.attn_output.weight
|
97 |
+
37: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.2.attn_q_a.weight
|
98 |
+
38: 1536 | 1536, 1, 1, 1 | F32 | blk.2.attn_q_a_norm.weight
|
99 |
+
39: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.2.attn_q_b.weight
|
100 |
+
40: 1258291200 | 1536, 5120, 160, 1 | Q4_K | blk.2.ffn_down_exps.weight
|
101 |
+
41: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.2.ffn_down_shexp.weight
|
102 |
+
42: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.2.ffn_gate_exps.weight
|
103 |
+
43: 819200 | 5120, 160, 1, 1 | F32 | blk.2.ffn_gate_inp.weight
|
104 |
+
44: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.2.ffn_gate_shexp.weight
|
105 |
+
45: 5120 | 5120, 1, 1, 1 | F32 | blk.2.ffn_norm.weight
|
106 |
+
46: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.2.ffn_up_exps.weight
|
107 |
+
47: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.2.ffn_up_shexp.weight
|
108 |
+
48: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.3.attn_kv_a_mqa.weight
|
109 |
+
49: 512 | 512, 1, 1, 1 | F32 | blk.3.attn_kv_a_norm.weight
|
110 |
+
50: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.3.attn_kv_b.weight
|
111 |
+
51: 5120 | 5120, 1, 1, 1 | F32 | blk.3.attn_norm.weight
|
112 |
+
52: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.3.attn_output.weight
|
113 |
+
53: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.3.attn_q_a.weight
|
114 |
+
54: 1536 | 1536, 1, 1, 1 | F32 | blk.3.attn_q_a_norm.weight
|
115 |
+
55: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.3.attn_q_b.weight
|
116 |
+
56: 1258291200 | 1536, 5120, 160, 1 | Q4_K | blk.3.ffn_down_exps.weight
|
117 |
+
57: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.3.ffn_down_shexp.weight
|
118 |
+
58: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.3.ffn_gate_exps.weight
|
119 |
+
59: 819200 | 5120, 160, 1, 1 | F32 | blk.3.ffn_gate_inp.weight
|
120 |
+
60: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.3.ffn_gate_shexp.weight
|
121 |
+
61: 5120 | 5120, 1, 1, 1 | F32 | blk.3.ffn_norm.weight
|
122 |
+
62: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.3.ffn_up_exps.weight
|
123 |
+
63: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.3.ffn_up_shexp.weight
|
124 |
+
64: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.4.attn_kv_a_mqa.weight
|
125 |
+
65: 512 | 512, 1, 1, 1 | F32 | blk.4.attn_kv_a_norm.weight
|
126 |
+
66: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.4.attn_kv_b.weight
|
127 |
+
67: 5120 | 5120, 1, 1, 1 | F32 | blk.4.attn_norm.weight
|
128 |
+
68: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.4.attn_output.weight
|
129 |
+
69: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.4.attn_q_a.weight
|
130 |
+
70: 1536 | 1536, 1, 1, 1 | F32 | blk.4.attn_q_a_norm.weight
|
131 |
+
71: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.4.attn_q_b.weight
|
132 |
+
72: 1258291200 | 1536, 5120, 160, 1 | Q4_K | blk.4.ffn_down_exps.weight
|
133 |
+
73: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.4.ffn_down_shexp.weight
|
134 |
+
74: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.4.ffn_gate_exps.weight
|
135 |
+
75: 819200 | 5120, 160, 1, 1 | F32 | blk.4.ffn_gate_inp.weight
|
136 |
+
76: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.4.ffn_gate_shexp.weight
|
137 |
+
77: 5120 | 5120, 1, 1, 1 | F32 | blk.4.ffn_norm.weight
|
138 |
+
78: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.4.ffn_up_exps.weight
|
139 |
+
79: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.4.ffn_up_shexp.weight
|
140 |
+
80: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.5.attn_kv_a_mqa.weight
|
141 |
+
81: 512 | 512, 1, 1, 1 | F32 | blk.5.attn_kv_a_norm.weight
|
142 |
+
82: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.5.attn_kv_b.weight
|
143 |
+
83: 5120 | 5120, 1, 1, 1 | F32 | blk.5.attn_norm.weight
|
144 |
+
84: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.5.attn_output.weight
|
145 |
+
85: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.5.attn_q_a.weight
|
146 |
+
86: 1536 | 1536, 1, 1, 1 | F32 | blk.5.attn_q_a_norm.weight
|
147 |
+
87: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.5.attn_q_b.weight
|
148 |
+
88: 1258291200 | 1536, 5120, 160, 1 | Q4_K | blk.5.ffn_down_exps.weight
|
149 |
+
89: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.5.ffn_down_shexp.weight
|
150 |
+
90: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.5.ffn_gate_exps.weight
|
151 |
+
91: 819200 | 5120, 160, 1, 1 | F32 | blk.5.ffn_gate_inp.weight
|
152 |
+
92: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.5.ffn_gate_shexp.weight
|
153 |
+
93: 5120 | 5120, 1, 1, 1 | F32 | blk.5.ffn_norm.weight
|
154 |
+
94: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.5.ffn_up_exps.weight
|
155 |
+
95: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.5.ffn_up_shexp.weight
|
156 |
+
96: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.6.attn_kv_a_mqa.weight
|
157 |
+
97: 512 | 512, 1, 1, 1 | F32 | blk.6.attn_kv_a_norm.weight
|
158 |
+
98: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.6.attn_kv_b.weight
|
159 |
+
99: 5120 | 5120, 1, 1, 1 | F32 | blk.6.attn_norm.weight
|
160 |
+
100: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.6.attn_output.weight
|
161 |
+
101: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.6.attn_q_a.weight
|
162 |
+
102: 1536 | 1536, 1, 1, 1 | F32 | blk.6.attn_q_a_norm.weight
|
163 |
+
103: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.6.attn_q_b.weight
|
164 |
+
104: 1258291200 | 1536, 5120, 160, 1 | Q4_K | blk.6.ffn_down_exps.weight
|
165 |
+
105: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.6.ffn_down_shexp.weight
|
166 |
+
106: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.6.ffn_gate_exps.weight
|
167 |
+
107: 819200 | 5120, 160, 1, 1 | F32 | blk.6.ffn_gate_inp.weight
|
168 |
+
108: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.6.ffn_gate_shexp.weight
|
169 |
+
109: 5120 | 5120, 1, 1, 1 | F32 | blk.6.ffn_norm.weight
|
170 |
+
110: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.6.ffn_up_exps.weight
|
171 |
+
111: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.6.ffn_up_shexp.weight
|
172 |
+
112: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.7.attn_kv_a_mqa.weight
|
173 |
+
113: 512 | 512, 1, 1, 1 | F32 | blk.7.attn_kv_a_norm.weight
|
174 |
+
114: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.7.attn_kv_b.weight
|
175 |
+
115: 5120 | 5120, 1, 1, 1 | F32 | blk.7.attn_norm.weight
|
176 |
+
116: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.7.attn_output.weight
|
177 |
+
117: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.7.attn_q_a.weight
|
178 |
+
118: 1536 | 1536, 1, 1, 1 | F32 | blk.7.attn_q_a_norm.weight
|
179 |
+
119: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.7.attn_q_b.weight
|
180 |
+
120: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.7.ffn_down_exps.weight
|
181 |
+
121: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.7.ffn_down_shexp.weight
|
182 |
+
122: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.7.ffn_gate_exps.weight
|
183 |
+
123: 819200 | 5120, 160, 1, 1 | F32 | blk.7.ffn_gate_inp.weight
|
184 |
+
124: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.7.ffn_gate_shexp.weight
|
185 |
+
125: 5120 | 5120, 1, 1, 1 | F32 | blk.7.ffn_norm.weight
|
186 |
+
126: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.7.ffn_up_exps.weight
|
187 |
+
127: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.7.ffn_up_shexp.weight
|
188 |
+
128: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.8.attn_kv_a_mqa.weight
|
189 |
+
129: 512 | 512, 1, 1, 1 | F32 | blk.8.attn_kv_a_norm.weight
|
190 |
+
130: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.8.attn_kv_b.weight
|
191 |
+
131: 5120 | 5120, 1, 1, 1 | F32 | blk.8.attn_norm.weight
|
192 |
+
132: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.8.attn_output.weight
|
193 |
+
133: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.8.attn_q_a.weight
|
194 |
+
134: 1536 | 1536, 1, 1, 1 | F32 | blk.8.attn_q_a_norm.weight
|
195 |
+
135: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.8.attn_q_b.weight
|
196 |
+
136: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.8.ffn_down_exps.weight
|
197 |
+
137: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.8.ffn_down_shexp.weight
|
198 |
+
138: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.8.ffn_gate_exps.weight
|
199 |
+
139: 819200 | 5120, 160, 1, 1 | F32 | blk.8.ffn_gate_inp.weight
|
200 |
+
140: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.8.ffn_gate_shexp.weight
|
201 |
+
141: 5120 | 5120, 1, 1, 1 | F32 | blk.8.ffn_norm.weight
|
202 |
+
142: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.8.ffn_up_exps.weight
|
203 |
+
143: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.8.ffn_up_shexp.weight
|
204 |
+
144: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.9.attn_kv_a_mqa.weight
|
205 |
+
145: 512 | 512, 1, 1, 1 | F32 | blk.9.attn_kv_a_norm.weight
|
206 |
+
146: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.9.attn_kv_b.weight
|
207 |
+
147: 5120 | 5120, 1, 1, 1 | F32 | blk.9.attn_norm.weight
|
208 |
+
148: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.9.attn_output.weight
|
209 |
+
149: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.9.attn_q_a.weight
|
210 |
+
150: 1536 | 1536, 1, 1, 1 | F32 | blk.9.attn_q_a_norm.weight
|
211 |
+
151: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.9.attn_q_b.weight
|
212 |
+
152: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.9.ffn_down_exps.weight
|
213 |
+
153: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.9.ffn_down_shexp.weight
|
214 |
+
154: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.9.ffn_gate_exps.weight
|
215 |
+
155: 819200 | 5120, 160, 1, 1 | F32 | blk.9.ffn_gate_inp.weight
|
216 |
+
156: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.9.ffn_gate_shexp.weight
|
217 |
+
157: 5120 | 5120, 1, 1, 1 | F32 | blk.9.ffn_norm.weight
|
218 |
+
158: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.9.ffn_up_exps.weight
|
219 |
+
159: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.9.ffn_up_shexp.weight
|
220 |
+
160: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.10.attn_kv_a_mqa.weight
|
221 |
+
161: 512 | 512, 1, 1, 1 | F32 | blk.10.attn_kv_a_norm.weight
|
222 |
+
162: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.10.attn_kv_b.weight
|
223 |
+
163: 5120 | 5120, 1, 1, 1 | F32 | blk.10.attn_norm.weight
|
224 |
+
164: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.10.attn_output.weight
|
225 |
+
165: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.10.attn_q_a.weight
|
226 |
+
166: 1536 | 1536, 1, 1, 1 | F32 | blk.10.attn_q_a_norm.weight
|
227 |
+
167: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.10.attn_q_b.weight
|
228 |
+
168: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.10.ffn_down_exps.weight
|
229 |
+
169: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.10.ffn_down_shexp.weight
|
230 |
+
170: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.10.ffn_gate_exps.weight
|
231 |
+
171: 819200 | 5120, 160, 1, 1 | F32 | blk.10.ffn_gate_inp.weight
|
232 |
+
172: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.10.ffn_gate_shexp.weight
|
233 |
+
173: 5120 | 5120, 1, 1, 1 | F32 | blk.10.ffn_norm.weight
|
234 |
+
174: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.10.ffn_up_exps.weight
|
235 |
+
175: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.10.ffn_up_shexp.weight
|
236 |
+
176: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.11.attn_kv_a_mqa.weight
|
237 |
+
177: 512 | 512, 1, 1, 1 | F32 | blk.11.attn_kv_a_norm.weight
|
238 |
+
178: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.11.attn_kv_b.weight
|
239 |
+
179: 5120 | 5120, 1, 1, 1 | F32 | blk.11.attn_norm.weight
|
240 |
+
180: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.11.attn_output.weight
|
241 |
+
181: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.11.attn_q_a.weight
|
242 |
+
182: 1536 | 1536, 1, 1, 1 | F32 | blk.11.attn_q_a_norm.weight
|
243 |
+
183: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.11.attn_q_b.weight
|
244 |
+
184: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.11.ffn_down_exps.weight
|
245 |
+
185: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.11.ffn_down_shexp.weight
|
246 |
+
186: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.11.ffn_gate_exps.weight
|
247 |
+
187: 819200 | 5120, 160, 1, 1 | F32 | blk.11.ffn_gate_inp.weight
|
248 |
+
188: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.11.ffn_gate_shexp.weight
|
249 |
+
189: 5120 | 5120, 1, 1, 1 | F32 | blk.11.ffn_norm.weight
|
250 |
+
190: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.11.ffn_up_exps.weight
|
251 |
+
191: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.11.ffn_up_shexp.weight
|
252 |
+
192: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.12.attn_kv_a_mqa.weight
|
253 |
+
193: 512 | 512, 1, 1, 1 | F32 | blk.12.attn_kv_a_norm.weight
|
254 |
+
194: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.12.attn_kv_b.weight
|
255 |
+
195: 5120 | 5120, 1, 1, 1 | F32 | blk.12.attn_norm.weight
|
256 |
+
196: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.12.attn_output.weight
|
257 |
+
197: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.12.attn_q_a.weight
|
258 |
+
198: 1536 | 1536, 1, 1, 1 | F32 | blk.12.attn_q_a_norm.weight
|
259 |
+
199: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.12.attn_q_b.weight
|
260 |
+
200: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.12.ffn_down_exps.weight
|
261 |
+
201: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.12.ffn_down_shexp.weight
|
262 |
+
202: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.12.ffn_gate_exps.weight
|
263 |
+
203: 819200 | 5120, 160, 1, 1 | F32 | blk.12.ffn_gate_inp.weight
|
264 |
+
204: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.12.ffn_gate_shexp.weight
|
265 |
+
205: 5120 | 5120, 1, 1, 1 | F32 | blk.12.ffn_norm.weight
|
266 |
+
206: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.12.ffn_up_exps.weight
|
267 |
+
207: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.12.ffn_up_shexp.weight
|
268 |
+
208: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.13.attn_kv_a_mqa.weight
|
269 |
+
209: 512 | 512, 1, 1, 1 | F32 | blk.13.attn_kv_a_norm.weight
|
270 |
+
210: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.13.attn_kv_b.weight
|
271 |
+
211: 5120 | 5120, 1, 1, 1 | F32 | blk.13.attn_norm.weight
|
272 |
+
212: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.13.attn_output.weight
|
273 |
+
213: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.13.attn_q_a.weight
|
274 |
+
214: 1536 | 1536, 1, 1, 1 | F32 | blk.13.attn_q_a_norm.weight
|
275 |
+
215: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.13.attn_q_b.weight
|
276 |
+
216: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.13.ffn_down_exps.weight
|
277 |
+
217: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.13.ffn_down_shexp.weight
|
278 |
+
218: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.13.ffn_gate_exps.weight
|
279 |
+
219: 819200 | 5120, 160, 1, 1 | F32 | blk.13.ffn_gate_inp.weight
|
280 |
+
220: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.13.ffn_gate_shexp.weight
|
281 |
+
221: 5120 | 5120, 1, 1, 1 | F32 | blk.13.ffn_norm.weight
|
282 |
+
222: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.13.ffn_up_exps.weight
|
283 |
+
223: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.13.ffn_up_shexp.weight
|
284 |
+
224: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.14.attn_kv_a_mqa.weight
|
285 |
+
225: 512 | 512, 1, 1, 1 | F32 | blk.14.attn_kv_a_norm.weight
|
286 |
+
226: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.14.attn_kv_b.weight
|
287 |
+
227: 5120 | 5120, 1, 1, 1 | F32 | blk.14.attn_norm.weight
|
288 |
+
228: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.14.attn_output.weight
|
289 |
+
229: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.14.attn_q_a.weight
|
290 |
+
230: 1536 | 1536, 1, 1, 1 | F32 | blk.14.attn_q_a_norm.weight
|
291 |
+
231: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.14.attn_q_b.weight
|
292 |
+
232: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.14.ffn_down_exps.weight
|
293 |
+
233: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.14.ffn_down_shexp.weight
|
294 |
+
234: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.14.ffn_gate_exps.weight
|
295 |
+
235: 819200 | 5120, 160, 1, 1 | F32 | blk.14.ffn_gate_inp.weight
|
296 |
+
236: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.14.ffn_gate_shexp.weight
|
297 |
+
237: 5120 | 5120, 1, 1, 1 | F32 | blk.14.ffn_norm.weight
|
298 |
+
238: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.14.ffn_up_exps.weight
|
299 |
+
239: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.14.ffn_up_shexp.weight
|
300 |
+
240: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.15.attn_kv_a_mqa.weight
|
301 |
+
241: 512 | 512, 1, 1, 1 | F32 | blk.15.attn_kv_a_norm.weight
|
302 |
+
242: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.15.attn_kv_b.weight
|
303 |
+
243: 5120 | 5120, 1, 1, 1 | F32 | blk.15.attn_norm.weight
|
304 |
+
244: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.15.attn_output.weight
|
305 |
+
245: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.15.attn_q_a.weight
|
306 |
+
246: 1536 | 1536, 1, 1, 1 | F32 | blk.15.attn_q_a_norm.weight
|
307 |
+
247: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.15.attn_q_b.weight
|
308 |
+
248: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.15.ffn_down_exps.weight
|
309 |
+
249: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.15.ffn_down_shexp.weight
|
310 |
+
250: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.15.ffn_gate_exps.weight
|
311 |
+
251: 819200 | 5120, 160, 1, 1 | F32 | blk.15.ffn_gate_inp.weight
|
312 |
+
252: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.15.ffn_gate_shexp.weight
|
313 |
+
253: 5120 | 5120, 1, 1, 1 | F32 | blk.15.ffn_norm.weight
|
314 |
+
254: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.15.ffn_up_exps.weight
|
315 |
+
255: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.15.ffn_up_shexp.weight
|
316 |
+
256: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.16.attn_kv_a_mqa.weight
|
317 |
+
257: 512 | 512, 1, 1, 1 | F32 | blk.16.attn_kv_a_norm.weight
|
318 |
+
258: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.16.attn_kv_b.weight
|
319 |
+
259: 5120 | 5120, 1, 1, 1 | F32 | blk.16.attn_norm.weight
|
320 |
+
260: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.16.attn_output.weight
|
321 |
+
261: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.16.attn_q_a.weight
|
322 |
+
262: 1536 | 1536, 1, 1, 1 | F32 | blk.16.attn_q_a_norm.weight
|
323 |
+
263: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.16.attn_q_b.weight
|
324 |
+
264: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.16.ffn_down_exps.weight
|
325 |
+
265: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.16.ffn_down_shexp.weight
|
326 |
+
266: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.16.ffn_gate_exps.weight
|
327 |
+
267: 819200 | 5120, 160, 1, 1 | F32 | blk.16.ffn_gate_inp.weight
|
328 |
+
268: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.16.ffn_gate_shexp.weight
|
329 |
+
269: 5120 | 5120, 1, 1, 1 | F32 | blk.16.ffn_norm.weight
|
330 |
+
270: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.16.ffn_up_exps.weight
|
331 |
+
271: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.16.ffn_up_shexp.weight
|
332 |
+
272: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.17.attn_kv_a_mqa.weight
|
333 |
+
273: 512 | 512, 1, 1, 1 | F32 | blk.17.attn_kv_a_norm.weight
|
334 |
+
274: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.17.attn_kv_b.weight
|
335 |
+
275: 5120 | 5120, 1, 1, 1 | F32 | blk.17.attn_norm.weight
|
336 |
+
276: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.17.attn_output.weight
|
337 |
+
277: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.17.attn_q_a.weight
|
338 |
+
278: 1536 | 1536, 1, 1, 1 | F32 | blk.17.attn_q_a_norm.weight
|
339 |
+
279: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.17.attn_q_b.weight
|
340 |
+
280: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.17.ffn_down_exps.weight
|
341 |
+
281: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.17.ffn_down_shexp.weight
|
342 |
+
282: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.17.ffn_gate_exps.weight
|
343 |
+
283: 819200 | 5120, 160, 1, 1 | F32 | blk.17.ffn_gate_inp.weight
|
344 |
+
284: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.17.ffn_gate_shexp.weight
|
345 |
+
285: 5120 | 5120, 1, 1, 1 | F32 | blk.17.ffn_norm.weight
|
346 |
+
286: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.17.ffn_up_exps.weight
|
347 |
+
287: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.17.ffn_up_shexp.weight
|
348 |
+
288: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.18.attn_kv_a_mqa.weight
|
349 |
+
289: 512 | 512, 1, 1, 1 | F32 | blk.18.attn_kv_a_norm.weight
|
350 |
+
290: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.18.attn_kv_b.weight
|
351 |
+
291: 5120 | 5120, 1, 1, 1 | F32 | blk.18.attn_norm.weight
|
352 |
+
292: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.18.attn_output.weight
|
353 |
+
293: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.18.attn_q_a.weight
|
354 |
+
294: 1536 | 1536, 1, 1, 1 | F32 | blk.18.attn_q_a_norm.weight
|
355 |
+
295: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.18.attn_q_b.weight
|
356 |
+
296: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.18.ffn_down_exps.weight
|
357 |
+
297: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.18.ffn_down_shexp.weight
|
358 |
+
298: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.18.ffn_gate_exps.weight
|
359 |
+
299: 819200 | 5120, 160, 1, 1 | F32 | blk.18.ffn_gate_inp.weight
|
360 |
+
300: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.18.ffn_gate_shexp.weight
|
361 |
+
301: 5120 | 5120, 1, 1, 1 | F32 | blk.18.ffn_norm.weight
|
362 |
+
302: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.18.ffn_up_exps.weight
|
363 |
+
303: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.18.ffn_up_shexp.weight
|
364 |
+
304: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.19.attn_kv_a_mqa.weight
|
365 |
+
305: 512 | 512, 1, 1, 1 | F32 | blk.19.attn_kv_a_norm.weight
|
366 |
+
306: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.19.attn_kv_b.weight
|
367 |
+
307: 5120 | 5120, 1, 1, 1 | F32 | blk.19.attn_norm.weight
|
368 |
+
308: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.19.attn_output.weight
|
369 |
+
309: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.19.attn_q_a.weight
|
370 |
+
310: 1536 | 1536, 1, 1, 1 | F32 | blk.19.attn_q_a_norm.weight
|
371 |
+
311: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.19.attn_q_b.weight
|
372 |
+
312: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.19.ffn_down_exps.weight
|
373 |
+
313: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.19.ffn_down_shexp.weight
|
374 |
+
314: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.19.ffn_gate_exps.weight
|
375 |
+
315: 819200 | 5120, 160, 1, 1 | F32 | blk.19.ffn_gate_inp.weight
|
376 |
+
316: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.19.ffn_gate_shexp.weight
|
377 |
+
317: 5120 | 5120, 1, 1, 1 | F32 | blk.19.ffn_norm.weight
|
378 |
+
318: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.19.ffn_up_exps.weight
|
379 |
+
319: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.19.ffn_up_shexp.weight
|
380 |
+
320: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.20.attn_kv_a_mqa.weight
|
DeepSeek-v2.5-1210-UD-iq3_m-00002-of-00003.gguf.tensors.txt
ADDED
@@ -0,0 +1,330 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
INFO:gguf-dump:* Loading: DeepSeek-v2.5-1210-UD-iq3_m-00002-of-00003.gguf
|
2 |
+
* File is LITTLE endian, script is running on a LITTLE endian host.
|
3 |
+
* Dumping 6 key/value pair(s)
|
4 |
+
1: UINT32 | 1 | GGUF.version = 3
|
5 |
+
2: UINT64 | 1 | GGUF.tensor_count = 320
|
6 |
+
3: UINT64 | 1 | GGUF.kv_count = 3
|
7 |
+
4: UINT16 | 1 | split.no = 1
|
8 |
+
5: INT32 | 1 | split.tensors.count = 959
|
9 |
+
6: UINT16 | 1 | split.count = 3
|
10 |
+
* Dumping 320 tensor(s)
|
11 |
+
1: 512 | 512, 1, 1, 1 | F32 | blk.20.attn_kv_a_norm.weight
|
12 |
+
2: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.20.attn_kv_b.weight
|
13 |
+
3: 5120 | 5120, 1, 1, 1 | F32 | blk.20.attn_norm.weight
|
14 |
+
4: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.20.attn_output.weight
|
15 |
+
5: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.20.attn_q_a.weight
|
16 |
+
6: 1536 | 1536, 1, 1, 1 | F32 | blk.20.attn_q_a_norm.weight
|
17 |
+
7: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.20.attn_q_b.weight
|
18 |
+
8: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.20.ffn_down_exps.weight
|
19 |
+
9: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.20.ffn_down_shexp.weight
|
20 |
+
10: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.20.ffn_gate_exps.weight
|
21 |
+
11: 819200 | 5120, 160, 1, 1 | F32 | blk.20.ffn_gate_inp.weight
|
22 |
+
12: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.20.ffn_gate_shexp.weight
|
23 |
+
13: 5120 | 5120, 1, 1, 1 | F32 | blk.20.ffn_norm.weight
|
24 |
+
14: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.20.ffn_up_exps.weight
|
25 |
+
15: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.20.ffn_up_shexp.weight
|
26 |
+
16: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.21.attn_kv_a_mqa.weight
|
27 |
+
17: 512 | 512, 1, 1, 1 | F32 | blk.21.attn_kv_a_norm.weight
|
28 |
+
18: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.21.attn_kv_b.weight
|
29 |
+
19: 5120 | 5120, 1, 1, 1 | F32 | blk.21.attn_norm.weight
|
30 |
+
20: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.21.attn_output.weight
|
31 |
+
21: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.21.attn_q_a.weight
|
32 |
+
22: 1536 | 1536, 1, 1, 1 | F32 | blk.21.attn_q_a_norm.weight
|
33 |
+
23: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.21.attn_q_b.weight
|
34 |
+
24: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.21.ffn_down_exps.weight
|
35 |
+
25: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.21.ffn_down_shexp.weight
|
36 |
+
26: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.21.ffn_gate_exps.weight
|
37 |
+
27: 819200 | 5120, 160, 1, 1 | F32 | blk.21.ffn_gate_inp.weight
|
38 |
+
28: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.21.ffn_gate_shexp.weight
|
39 |
+
29: 5120 | 5120, 1, 1, 1 | F32 | blk.21.ffn_norm.weight
|
40 |
+
30: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.21.ffn_up_exps.weight
|
41 |
+
31: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.21.ffn_up_shexp.weight
|
42 |
+
32: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.22.attn_kv_a_mqa.weight
|
43 |
+
33: 512 | 512, 1, 1, 1 | F32 | blk.22.attn_kv_a_norm.weight
|
44 |
+
34: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.22.attn_kv_b.weight
|
45 |
+
35: 5120 | 5120, 1, 1, 1 | F32 | blk.22.attn_norm.weight
|
46 |
+
36: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.22.attn_output.weight
|
47 |
+
37: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.22.attn_q_a.weight
|
48 |
+
38: 1536 | 1536, 1, 1, 1 | F32 | blk.22.attn_q_a_norm.weight
|
49 |
+
39: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.22.attn_q_b.weight
|
50 |
+
40: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.22.ffn_down_exps.weight
|
51 |
+
41: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.22.ffn_down_shexp.weight
|
52 |
+
42: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.22.ffn_gate_exps.weight
|
53 |
+
43: 819200 | 5120, 160, 1, 1 | F32 | blk.22.ffn_gate_inp.weight
|
54 |
+
44: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.22.ffn_gate_shexp.weight
|
55 |
+
45: 5120 | 5120, 1, 1, 1 | F32 | blk.22.ffn_norm.weight
|
56 |
+
46: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.22.ffn_up_exps.weight
|
57 |
+
47: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.22.ffn_up_shexp.weight
|
58 |
+
48: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.23.attn_kv_a_mqa.weight
|
59 |
+
49: 512 | 512, 1, 1, 1 | F32 | blk.23.attn_kv_a_norm.weight
|
60 |
+
50: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.23.attn_kv_b.weight
|
61 |
+
51: 5120 | 5120, 1, 1, 1 | F32 | blk.23.attn_norm.weight
|
62 |
+
52: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.23.attn_output.weight
|
63 |
+
53: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.23.attn_q_a.weight
|
64 |
+
54: 1536 | 1536, 1, 1, 1 | F32 | blk.23.attn_q_a_norm.weight
|
65 |
+
55: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.23.attn_q_b.weight
|
66 |
+
56: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.23.ffn_down_exps.weight
|
67 |
+
57: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.23.ffn_down_shexp.weight
|
68 |
+
58: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.23.ffn_gate_exps.weight
|
69 |
+
59: 819200 | 5120, 160, 1, 1 | F32 | blk.23.ffn_gate_inp.weight
|
70 |
+
60: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.23.ffn_gate_shexp.weight
|
71 |
+
61: 5120 | 5120, 1, 1, 1 | F32 | blk.23.ffn_norm.weight
|
72 |
+
62: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.23.ffn_up_exps.weight
|
73 |
+
63: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.23.ffn_up_shexp.weight
|
74 |
+
64: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.24.attn_kv_a_mqa.weight
|
75 |
+
65: 512 | 512, 1, 1, 1 | F32 | blk.24.attn_kv_a_norm.weight
|
76 |
+
66: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.24.attn_kv_b.weight
|
77 |
+
67: 5120 | 5120, 1, 1, 1 | F32 | blk.24.attn_norm.weight
|
78 |
+
68: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.24.attn_output.weight
|
79 |
+
69: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.24.attn_q_a.weight
|
80 |
+
70: 1536 | 1536, 1, 1, 1 | F32 | blk.24.attn_q_a_norm.weight
|
81 |
+
71: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.24.attn_q_b.weight
|
82 |
+
72: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.24.ffn_down_exps.weight
|
83 |
+
73: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.24.ffn_down_shexp.weight
|
84 |
+
74: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.24.ffn_gate_exps.weight
|
85 |
+
75: 819200 | 5120, 160, 1, 1 | F32 | blk.24.ffn_gate_inp.weight
|
86 |
+
76: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.24.ffn_gate_shexp.weight
|
87 |
+
77: 5120 | 5120, 1, 1, 1 | F32 | blk.24.ffn_norm.weight
|
88 |
+
78: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.24.ffn_up_exps.weight
|
89 |
+
79: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.24.ffn_up_shexp.weight
|
90 |
+
80: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.25.attn_kv_a_mqa.weight
|
91 |
+
81: 512 | 512, 1, 1, 1 | F32 | blk.25.attn_kv_a_norm.weight
|
92 |
+
82: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.25.attn_kv_b.weight
|
93 |
+
83: 5120 | 5120, 1, 1, 1 | F32 | blk.25.attn_norm.weight
|
94 |
+
84: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.25.attn_output.weight
|
95 |
+
85: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.25.attn_q_a.weight
|
96 |
+
86: 1536 | 1536, 1, 1, 1 | F32 | blk.25.attn_q_a_norm.weight
|
97 |
+
87: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.25.attn_q_b.weight
|
98 |
+
88: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.25.ffn_down_exps.weight
|
99 |
+
89: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.25.ffn_down_shexp.weight
|
100 |
+
90: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.25.ffn_gate_exps.weight
|
101 |
+
91: 819200 | 5120, 160, 1, 1 | F32 | blk.25.ffn_gate_inp.weight
|
102 |
+
92: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.25.ffn_gate_shexp.weight
|
103 |
+
93: 5120 | 5120, 1, 1, 1 | F32 | blk.25.ffn_norm.weight
|
104 |
+
94: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.25.ffn_up_exps.weight
|
105 |
+
95: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.25.ffn_up_shexp.weight
|
106 |
+
96: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.26.attn_kv_a_mqa.weight
|
107 |
+
97: 512 | 512, 1, 1, 1 | F32 | blk.26.attn_kv_a_norm.weight
|
108 |
+
98: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.26.attn_kv_b.weight
|
109 |
+
99: 5120 | 5120, 1, 1, 1 | F32 | blk.26.attn_norm.weight
|
110 |
+
100: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.26.attn_output.weight
|
111 |
+
101: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.26.attn_q_a.weight
|
112 |
+
102: 1536 | 1536, 1, 1, 1 | F32 | blk.26.attn_q_a_norm.weight
|
113 |
+
103: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.26.attn_q_b.weight
|
114 |
+
104: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.26.ffn_down_exps.weight
|
115 |
+
105: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.26.ffn_down_shexp.weight
|
116 |
+
106: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.26.ffn_gate_exps.weight
|
117 |
+
107: 819200 | 5120, 160, 1, 1 | F32 | blk.26.ffn_gate_inp.weight
|
118 |
+
108: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.26.ffn_gate_shexp.weight
|
119 |
+
109: 5120 | 5120, 1, 1, 1 | F32 | blk.26.ffn_norm.weight
|
120 |
+
110: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.26.ffn_up_exps.weight
|
121 |
+
111: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.26.ffn_up_shexp.weight
|
122 |
+
112: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.27.attn_kv_a_mqa.weight
|
123 |
+
113: 512 | 512, 1, 1, 1 | F32 | blk.27.attn_kv_a_norm.weight
|
124 |
+
114: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.27.attn_kv_b.weight
|
125 |
+
115: 5120 | 5120, 1, 1, 1 | F32 | blk.27.attn_norm.weight
|
126 |
+
116: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.27.attn_output.weight
|
127 |
+
117: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.27.attn_q_a.weight
|
128 |
+
118: 1536 | 1536, 1, 1, 1 | F32 | blk.27.attn_q_a_norm.weight
|
129 |
+
119: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.27.attn_q_b.weight
|
130 |
+
120: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.27.ffn_down_exps.weight
|
131 |
+
121: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.27.ffn_down_shexp.weight
|
132 |
+
122: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.27.ffn_gate_exps.weight
|
133 |
+
123: 819200 | 5120, 160, 1, 1 | F32 | blk.27.ffn_gate_inp.weight
|
134 |
+
124: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.27.ffn_gate_shexp.weight
|
135 |
+
125: 5120 | 5120, 1, 1, 1 | F32 | blk.27.ffn_norm.weight
|
136 |
+
126: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.27.ffn_up_exps.weight
|
137 |
+
127: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.27.ffn_up_shexp.weight
|
138 |
+
128: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.28.attn_kv_a_mqa.weight
|
139 |
+
129: 512 | 512, 1, 1, 1 | F32 | blk.28.attn_kv_a_norm.weight
|
140 |
+
130: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.28.attn_kv_b.weight
|
141 |
+
131: 5120 | 5120, 1, 1, 1 | F32 | blk.28.attn_norm.weight
|
142 |
+
132: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.28.attn_output.weight
|
143 |
+
133: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.28.attn_q_a.weight
|
144 |
+
134: 1536 | 1536, 1, 1, 1 | F32 | blk.28.attn_q_a_norm.weight
|
145 |
+
135: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.28.attn_q_b.weight
|
146 |
+
136: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.28.ffn_down_exps.weight
|
147 |
+
137: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.28.ffn_down_shexp.weight
|
148 |
+
138: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.28.ffn_gate_exps.weight
|
149 |
+
139: 819200 | 5120, 160, 1, 1 | F32 | blk.28.ffn_gate_inp.weight
|
150 |
+
140: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.28.ffn_gate_shexp.weight
|
151 |
+
141: 5120 | 5120, 1, 1, 1 | F32 | blk.28.ffn_norm.weight
|
152 |
+
142: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.28.ffn_up_exps.weight
|
153 |
+
143: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.28.ffn_up_shexp.weight
|
154 |
+
144: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.29.attn_kv_a_mqa.weight
|
155 |
+
145: 512 | 512, 1, 1, 1 | F32 | blk.29.attn_kv_a_norm.weight
|
156 |
+
146: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.29.attn_kv_b.weight
|
157 |
+
147: 5120 | 5120, 1, 1, 1 | F32 | blk.29.attn_norm.weight
|
158 |
+
148: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.29.attn_output.weight
|
159 |
+
149: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.29.attn_q_a.weight
|
160 |
+
150: 1536 | 1536, 1, 1, 1 | F32 | blk.29.attn_q_a_norm.weight
|
161 |
+
151: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.29.attn_q_b.weight
|
162 |
+
152: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.29.ffn_down_exps.weight
|
163 |
+
153: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.29.ffn_down_shexp.weight
|
164 |
+
154: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.29.ffn_gate_exps.weight
|
165 |
+
155: 819200 | 5120, 160, 1, 1 | F32 | blk.29.ffn_gate_inp.weight
|
166 |
+
156: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.29.ffn_gate_shexp.weight
|
167 |
+
157: 5120 | 5120, 1, 1, 1 | F32 | blk.29.ffn_norm.weight
|
168 |
+
158: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.29.ffn_up_exps.weight
|
169 |
+
159: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.29.ffn_up_shexp.weight
|
170 |
+
160: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.30.attn_kv_a_mqa.weight
|
171 |
+
161: 512 | 512, 1, 1, 1 | F32 | blk.30.attn_kv_a_norm.weight
|
172 |
+
162: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.30.attn_kv_b.weight
|
173 |
+
163: 5120 | 5120, 1, 1, 1 | F32 | blk.30.attn_norm.weight
|
174 |
+
164: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.30.attn_output.weight
|
175 |
+
165: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.30.attn_q_a.weight
|
176 |
+
166: 1536 | 1536, 1, 1, 1 | F32 | blk.30.attn_q_a_norm.weight
|
177 |
+
167: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.30.attn_q_b.weight
|
178 |
+
168: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.30.ffn_down_exps.weight
|
179 |
+
169: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.30.ffn_down_shexp.weight
|
180 |
+
170: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.30.ffn_gate_exps.weight
|
181 |
+
171: 819200 | 5120, 160, 1, 1 | F32 | blk.30.ffn_gate_inp.weight
|
182 |
+
172: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.30.ffn_gate_shexp.weight
|
183 |
+
173: 5120 | 5120, 1, 1, 1 | F32 | blk.30.ffn_norm.weight
|
184 |
+
174: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.30.ffn_up_exps.weight
|
185 |
+
175: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.30.ffn_up_shexp.weight
|
186 |
+
176: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.31.attn_kv_a_mqa.weight
|
187 |
+
177: 512 | 512, 1, 1, 1 | F32 | blk.31.attn_kv_a_norm.weight
|
188 |
+
178: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.31.attn_kv_b.weight
|
189 |
+
179: 5120 | 5120, 1, 1, 1 | F32 | blk.31.attn_norm.weight
|
190 |
+
180: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.31.attn_output.weight
|
191 |
+
181: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.31.attn_q_a.weight
|
192 |
+
182: 1536 | 1536, 1, 1, 1 | F32 | blk.31.attn_q_a_norm.weight
|
193 |
+
183: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.31.attn_q_b.weight
|
194 |
+
184: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.31.ffn_down_exps.weight
|
195 |
+
185: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.31.ffn_down_shexp.weight
|
196 |
+
186: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.31.ffn_gate_exps.weight
|
197 |
+
187: 819200 | 5120, 160, 1, 1 | F32 | blk.31.ffn_gate_inp.weight
|
198 |
+
188: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.31.ffn_gate_shexp.weight
|
199 |
+
189: 5120 | 5120, 1, 1, 1 | F32 | blk.31.ffn_norm.weight
|
200 |
+
190: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.31.ffn_up_exps.weight
|
201 |
+
191: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.31.ffn_up_shexp.weight
|
202 |
+
192: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.32.attn_kv_a_mqa.weight
|
203 |
+
193: 512 | 512, 1, 1, 1 | F32 | blk.32.attn_kv_a_norm.weight
|
204 |
+
194: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.32.attn_kv_b.weight
|
205 |
+
195: 5120 | 5120, 1, 1, 1 | F32 | blk.32.attn_norm.weight
|
206 |
+
196: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.32.attn_output.weight
|
207 |
+
197: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.32.attn_q_a.weight
|
208 |
+
198: 1536 | 1536, 1, 1, 1 | F32 | blk.32.attn_q_a_norm.weight
|
209 |
+
199: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.32.attn_q_b.weight
|
210 |
+
200: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.32.ffn_down_exps.weight
|
211 |
+
201: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.32.ffn_down_shexp.weight
|
212 |
+
202: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.32.ffn_gate_exps.weight
|
213 |
+
203: 819200 | 5120, 160, 1, 1 | F32 | blk.32.ffn_gate_inp.weight
|
214 |
+
204: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.32.ffn_gate_shexp.weight
|
215 |
+
205: 5120 | 5120, 1, 1, 1 | F32 | blk.32.ffn_norm.weight
|
216 |
+
206: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.32.ffn_up_exps.weight
|
217 |
+
207: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.32.ffn_up_shexp.weight
|
218 |
+
208: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.33.attn_kv_a_mqa.weight
|
219 |
+
209: 512 | 512, 1, 1, 1 | F32 | blk.33.attn_kv_a_norm.weight
|
220 |
+
210: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.33.attn_kv_b.weight
|
221 |
+
211: 5120 | 5120, 1, 1, 1 | F32 | blk.33.attn_norm.weight
|
222 |
+
212: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.33.attn_output.weight
|
223 |
+
213: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.33.attn_q_a.weight
|
224 |
+
214: 1536 | 1536, 1, 1, 1 | F32 | blk.33.attn_q_a_norm.weight
|
225 |
+
215: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.33.attn_q_b.weight
|
226 |
+
216: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.33.ffn_down_exps.weight
|
227 |
+
217: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.33.ffn_down_shexp.weight
|
228 |
+
218: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.33.ffn_gate_exps.weight
|
229 |
+
219: 819200 | 5120, 160, 1, 1 | F32 | blk.33.ffn_gate_inp.weight
|
230 |
+
220: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.33.ffn_gate_shexp.weight
|
231 |
+
221: 5120 | 5120, 1, 1, 1 | F32 | blk.33.ffn_norm.weight
|
232 |
+
222: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.33.ffn_up_exps.weight
|
233 |
+
223: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.33.ffn_up_shexp.weight
|
234 |
+
224: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.34.attn_kv_a_mqa.weight
|
235 |
+
225: 512 | 512, 1, 1, 1 | F32 | blk.34.attn_kv_a_norm.weight
|
236 |
+
226: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.34.attn_kv_b.weight
|
237 |
+
227: 5120 | 5120, 1, 1, 1 | F32 | blk.34.attn_norm.weight
|
238 |
+
228: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.34.attn_output.weight
|
239 |
+
229: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.34.attn_q_a.weight
|
240 |
+
230: 1536 | 1536, 1, 1, 1 | F32 | blk.34.attn_q_a_norm.weight
|
241 |
+
231: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.34.attn_q_b.weight
|
242 |
+
232: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.34.ffn_down_exps.weight
|
243 |
+
233: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.34.ffn_down_shexp.weight
|
244 |
+
234: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.34.ffn_gate_exps.weight
|
245 |
+
235: 819200 | 5120, 160, 1, 1 | F32 | blk.34.ffn_gate_inp.weight
|
246 |
+
236: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.34.ffn_gate_shexp.weight
|
247 |
+
237: 5120 | 5120, 1, 1, 1 | F32 | blk.34.ffn_norm.weight
|
248 |
+
238: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.34.ffn_up_exps.weight
|
249 |
+
239: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.34.ffn_up_shexp.weight
|
250 |
+
240: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.35.attn_kv_a_mqa.weight
|
251 |
+
241: 512 | 512, 1, 1, 1 | F32 | blk.35.attn_kv_a_norm.weight
|
252 |
+
242: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.35.attn_kv_b.weight
|
253 |
+
243: 5120 | 5120, 1, 1, 1 | F32 | blk.35.attn_norm.weight
|
254 |
+
244: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.35.attn_output.weight
|
255 |
+
245: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.35.attn_q_a.weight
|
256 |
+
246: 1536 | 1536, 1, 1, 1 | F32 | blk.35.attn_q_a_norm.weight
|
257 |
+
247: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.35.attn_q_b.weight
|
258 |
+
248: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.35.ffn_down_exps.weight
|
259 |
+
249: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.35.ffn_down_shexp.weight
|
260 |
+
250: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.35.ffn_gate_exps.weight
|
261 |
+
251: 819200 | 5120, 160, 1, 1 | F32 | blk.35.ffn_gate_inp.weight
|
262 |
+
252: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.35.ffn_gate_shexp.weight
|
263 |
+
253: 5120 | 5120, 1, 1, 1 | F32 | blk.35.ffn_norm.weight
|
264 |
+
254: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.35.ffn_up_exps.weight
|
265 |
+
255: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.35.ffn_up_shexp.weight
|
266 |
+
256: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.36.attn_kv_a_mqa.weight
|
267 |
+
257: 512 | 512, 1, 1, 1 | F32 | blk.36.attn_kv_a_norm.weight
|
268 |
+
258: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.36.attn_kv_b.weight
|
269 |
+
259: 5120 | 5120, 1, 1, 1 | F32 | blk.36.attn_norm.weight
|
270 |
+
260: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.36.attn_output.weight
|
271 |
+
261: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.36.attn_q_a.weight
|
272 |
+
262: 1536 | 1536, 1, 1, 1 | F32 | blk.36.attn_q_a_norm.weight
|
273 |
+
263: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.36.attn_q_b.weight
|
274 |
+
264: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.36.ffn_down_exps.weight
|
275 |
+
265: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.36.ffn_down_shexp.weight
|
276 |
+
266: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.36.ffn_gate_exps.weight
|
277 |
+
267: 819200 | 5120, 160, 1, 1 | F32 | blk.36.ffn_gate_inp.weight
|
278 |
+
268: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.36.ffn_gate_shexp.weight
|
279 |
+
269: 5120 | 5120, 1, 1, 1 | F32 | blk.36.ffn_norm.weight
|
280 |
+
270: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.36.ffn_up_exps.weight
|
281 |
+
271: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.36.ffn_up_shexp.weight
|
282 |
+
272: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.37.attn_kv_a_mqa.weight
|
283 |
+
273: 512 | 512, 1, 1, 1 | F32 | blk.37.attn_kv_a_norm.weight
|
284 |
+
274: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.37.attn_kv_b.weight
|
285 |
+
275: 5120 | 5120, 1, 1, 1 | F32 | blk.37.attn_norm.weight
|
286 |
+
276: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.37.attn_output.weight
|
287 |
+
277: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.37.attn_q_a.weight
|
288 |
+
278: 1536 | 1536, 1, 1, 1 | F32 | blk.37.attn_q_a_norm.weight
|
289 |
+
279: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.37.attn_q_b.weight
|
290 |
+
280: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.37.ffn_down_exps.weight
|
291 |
+
281: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.37.ffn_down_shexp.weight
|
292 |
+
282: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.37.ffn_gate_exps.weight
|
293 |
+
283: 819200 | 5120, 160, 1, 1 | F32 | blk.37.ffn_gate_inp.weight
|
294 |
+
284: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.37.ffn_gate_shexp.weight
|
295 |
+
285: 5120 | 5120, 1, 1, 1 | F32 | blk.37.ffn_norm.weight
|
296 |
+
286: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.37.ffn_up_exps.weight
|
297 |
+
287: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.37.ffn_up_shexp.weight
|
298 |
+
288: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.38.attn_kv_a_mqa.weight
|
299 |
+
289: 512 | 512, 1, 1, 1 | F32 | blk.38.attn_kv_a_norm.weight
|
300 |
+
290: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.38.attn_kv_b.weight
|
301 |
+
291: 5120 | 5120, 1, 1, 1 | F32 | blk.38.attn_norm.weight
|
302 |
+
292: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.38.attn_output.weight
|
303 |
+
293: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.38.attn_q_a.weight
|
304 |
+
294: 1536 | 1536, 1, 1, 1 | F32 | blk.38.attn_q_a_norm.weight
|
305 |
+
295: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.38.attn_q_b.weight
|
306 |
+
296: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.38.ffn_down_exps.weight
|
307 |
+
297: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.38.ffn_down_shexp.weight
|
308 |
+
298: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.38.ffn_gate_exps.weight
|
309 |
+
299: 819200 | 5120, 160, 1, 1 | F32 | blk.38.ffn_gate_inp.weight
|
310 |
+
300: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.38.ffn_gate_shexp.weight
|
311 |
+
301: 5120 | 5120, 1, 1, 1 | F32 | blk.38.ffn_norm.weight
|
312 |
+
302: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.38.ffn_up_exps.weight
|
313 |
+
303: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.38.ffn_up_shexp.weight
|
314 |
+
304: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.39.attn_kv_a_mqa.weight
|
315 |
+
305: 512 | 512, 1, 1, 1 | F32 | blk.39.attn_kv_a_norm.weight
|
316 |
+
306: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.39.attn_kv_b.weight
|
317 |
+
307: 5120 | 5120, 1, 1, 1 | F32 | blk.39.attn_norm.weight
|
318 |
+
308: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.39.attn_output.weight
|
319 |
+
309: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.39.attn_q_a.weight
|
320 |
+
310: 1536 | 1536, 1, 1, 1 | F32 | blk.39.attn_q_a_norm.weight
|
321 |
+
311: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.39.attn_q_b.weight
|
322 |
+
312: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.39.ffn_down_exps.weight
|
323 |
+
313: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.39.ffn_down_shexp.weight
|
324 |
+
314: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.39.ffn_gate_exps.weight
|
325 |
+
315: 819200 | 5120, 160, 1, 1 | F32 | blk.39.ffn_gate_inp.weight
|
326 |
+
316: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.39.ffn_gate_shexp.weight
|
327 |
+
317: 5120 | 5120, 1, 1, 1 | F32 | blk.39.ffn_norm.weight
|
328 |
+
318: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.39.ffn_up_exps.weight
|
329 |
+
319: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.39.ffn_up_shexp.weight
|
330 |
+
320: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.40.attn_kv_a_mqa.weight
|
DeepSeek-v2.5-1210-UD-iq3_m-00003-of-00003.gguf.tensors.txt
ADDED
@@ -0,0 +1,329 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
INFO:gguf-dump:* Loading: DeepSeek-v2.5-1210-UD-iq3_m-00003-of-00003.gguf
|
2 |
+
* File is LITTLE endian, script is running on a LITTLE endian host.
|
3 |
+
* Dumping 6 key/value pair(s)
|
4 |
+
1: UINT32 | 1 | GGUF.version = 3
|
5 |
+
2: UINT64 | 1 | GGUF.tensor_count = 319
|
6 |
+
3: UINT64 | 1 | GGUF.kv_count = 3
|
7 |
+
4: UINT16 | 1 | split.no = 2
|
8 |
+
5: INT32 | 1 | split.tensors.count = 959
|
9 |
+
6: UINT16 | 1 | split.count = 3
|
10 |
+
* Dumping 319 tensor(s)
|
11 |
+
1: 512 | 512, 1, 1, 1 | F32 | blk.40.attn_kv_a_norm.weight
|
12 |
+
2: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.40.attn_kv_b.weight
|
13 |
+
3: 5120 | 5120, 1, 1, 1 | F32 | blk.40.attn_norm.weight
|
14 |
+
4: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.40.attn_output.weight
|
15 |
+
5: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.40.attn_q_a.weight
|
16 |
+
6: 1536 | 1536, 1, 1, 1 | F32 | blk.40.attn_q_a_norm.weight
|
17 |
+
7: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.40.attn_q_b.weight
|
18 |
+
8: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.40.ffn_down_exps.weight
|
19 |
+
9: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.40.ffn_down_shexp.weight
|
20 |
+
10: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.40.ffn_gate_exps.weight
|
21 |
+
11: 819200 | 5120, 160, 1, 1 | F32 | blk.40.ffn_gate_inp.weight
|
22 |
+
12: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.40.ffn_gate_shexp.weight
|
23 |
+
13: 5120 | 5120, 1, 1, 1 | F32 | blk.40.ffn_norm.weight
|
24 |
+
14: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.40.ffn_up_exps.weight
|
25 |
+
15: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.40.ffn_up_shexp.weight
|
26 |
+
16: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.41.attn_kv_a_mqa.weight
|
27 |
+
17: 512 | 512, 1, 1, 1 | F32 | blk.41.attn_kv_a_norm.weight
|
28 |
+
18: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.41.attn_kv_b.weight
|
29 |
+
19: 5120 | 5120, 1, 1, 1 | F32 | blk.41.attn_norm.weight
|
30 |
+
20: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.41.attn_output.weight
|
31 |
+
21: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.41.attn_q_a.weight
|
32 |
+
22: 1536 | 1536, 1, 1, 1 | F32 | blk.41.attn_q_a_norm.weight
|
33 |
+
23: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.41.attn_q_b.weight
|
34 |
+
24: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.41.ffn_down_exps.weight
|
35 |
+
25: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.41.ffn_down_shexp.weight
|
36 |
+
26: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.41.ffn_gate_exps.weight
|
37 |
+
27: 819200 | 5120, 160, 1, 1 | F32 | blk.41.ffn_gate_inp.weight
|
38 |
+
28: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.41.ffn_gate_shexp.weight
|
39 |
+
29: 5120 | 5120, 1, 1, 1 | F32 | blk.41.ffn_norm.weight
|
40 |
+
30: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.41.ffn_up_exps.weight
|
41 |
+
31: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.41.ffn_up_shexp.weight
|
42 |
+
32: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.42.attn_kv_a_mqa.weight
|
43 |
+
33: 512 | 512, 1, 1, 1 | F32 | blk.42.attn_kv_a_norm.weight
|
44 |
+
34: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.42.attn_kv_b.weight
|
45 |
+
35: 5120 | 5120, 1, 1, 1 | F32 | blk.42.attn_norm.weight
|
46 |
+
36: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.42.attn_output.weight
|
47 |
+
37: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.42.attn_q_a.weight
|
48 |
+
38: 1536 | 1536, 1, 1, 1 | F32 | blk.42.attn_q_a_norm.weight
|
49 |
+
39: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.42.attn_q_b.weight
|
50 |
+
40: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.42.ffn_down_exps.weight
|
51 |
+
41: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.42.ffn_down_shexp.weight
|
52 |
+
42: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.42.ffn_gate_exps.weight
|
53 |
+
43: 819200 | 5120, 160, 1, 1 | F32 | blk.42.ffn_gate_inp.weight
|
54 |
+
44: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.42.ffn_gate_shexp.weight
|
55 |
+
45: 5120 | 5120, 1, 1, 1 | F32 | blk.42.ffn_norm.weight
|
56 |
+
46: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.42.ffn_up_exps.weight
|
57 |
+
47: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.42.ffn_up_shexp.weight
|
58 |
+
48: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.43.attn_kv_a_mqa.weight
|
59 |
+
49: 512 | 512, 1, 1, 1 | F32 | blk.43.attn_kv_a_norm.weight
|
60 |
+
50: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.43.attn_kv_b.weight
|
61 |
+
51: 5120 | 5120, 1, 1, 1 | F32 | blk.43.attn_norm.weight
|
62 |
+
52: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.43.attn_output.weight
|
63 |
+
53: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.43.attn_q_a.weight
|
64 |
+
54: 1536 | 1536, 1, 1, 1 | F32 | blk.43.attn_q_a_norm.weight
|
65 |
+
55: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.43.attn_q_b.weight
|
66 |
+
56: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.43.ffn_down_exps.weight
|
67 |
+
57: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.43.ffn_down_shexp.weight
|
68 |
+
58: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.43.ffn_gate_exps.weight
|
69 |
+
59: 819200 | 5120, 160, 1, 1 | F32 | blk.43.ffn_gate_inp.weight
|
70 |
+
60: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.43.ffn_gate_shexp.weight
|
71 |
+
61: 5120 | 5120, 1, 1, 1 | F32 | blk.43.ffn_norm.weight
|
72 |
+
62: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.43.ffn_up_exps.weight
|
73 |
+
63: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.43.ffn_up_shexp.weight
|
74 |
+
64: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.44.attn_kv_a_mqa.weight
|
75 |
+
65: 512 | 512, 1, 1, 1 | F32 | blk.44.attn_kv_a_norm.weight
|
76 |
+
66: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.44.attn_kv_b.weight
|
77 |
+
67: 5120 | 5120, 1, 1, 1 | F32 | blk.44.attn_norm.weight
|
78 |
+
68: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.44.attn_output.weight
|
79 |
+
69: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.44.attn_q_a.weight
|
80 |
+
70: 1536 | 1536, 1, 1, 1 | F32 | blk.44.attn_q_a_norm.weight
|
81 |
+
71: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.44.attn_q_b.weight
|
82 |
+
72: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.44.ffn_down_exps.weight
|
83 |
+
73: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.44.ffn_down_shexp.weight
|
84 |
+
74: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.44.ffn_gate_exps.weight
|
85 |
+
75: 819200 | 5120, 160, 1, 1 | F32 | blk.44.ffn_gate_inp.weight
|
86 |
+
76: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.44.ffn_gate_shexp.weight
|
87 |
+
77: 5120 | 5120, 1, 1, 1 | F32 | blk.44.ffn_norm.weight
|
88 |
+
78: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.44.ffn_up_exps.weight
|
89 |
+
79: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.44.ffn_up_shexp.weight
|
90 |
+
80: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.45.attn_kv_a_mqa.weight
|
91 |
+
81: 512 | 512, 1, 1, 1 | F32 | blk.45.attn_kv_a_norm.weight
|
92 |
+
82: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.45.attn_kv_b.weight
|
93 |
+
83: 5120 | 5120, 1, 1, 1 | F32 | blk.45.attn_norm.weight
|
94 |
+
84: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.45.attn_output.weight
|
95 |
+
85: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.45.attn_q_a.weight
|
96 |
+
86: 1536 | 1536, 1, 1, 1 | F32 | blk.45.attn_q_a_norm.weight
|
97 |
+
87: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.45.attn_q_b.weight
|
98 |
+
88: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.45.ffn_down_exps.weight
|
99 |
+
89: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.45.ffn_down_shexp.weight
|
100 |
+
90: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.45.ffn_gate_exps.weight
|
101 |
+
91: 819200 | 5120, 160, 1, 1 | F32 | blk.45.ffn_gate_inp.weight
|
102 |
+
92: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.45.ffn_gate_shexp.weight
|
103 |
+
93: 5120 | 5120, 1, 1, 1 | F32 | blk.45.ffn_norm.weight
|
104 |
+
94: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.45.ffn_up_exps.weight
|
105 |
+
95: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.45.ffn_up_shexp.weight
|
106 |
+
96: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.46.attn_kv_a_mqa.weight
|
107 |
+
97: 512 | 512, 1, 1, 1 | F32 | blk.46.attn_kv_a_norm.weight
|
108 |
+
98: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.46.attn_kv_b.weight
|
109 |
+
99: 5120 | 5120, 1, 1, 1 | F32 | blk.46.attn_norm.weight
|
110 |
+
100: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.46.attn_output.weight
|
111 |
+
101: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.46.attn_q_a.weight
|
112 |
+
102: 1536 | 1536, 1, 1, 1 | F32 | blk.46.attn_q_a_norm.weight
|
113 |
+
103: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.46.attn_q_b.weight
|
114 |
+
104: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.46.ffn_down_exps.weight
|
115 |
+
105: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.46.ffn_down_shexp.weight
|
116 |
+
106: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.46.ffn_gate_exps.weight
|
117 |
+
107: 819200 | 5120, 160, 1, 1 | F32 | blk.46.ffn_gate_inp.weight
|
118 |
+
108: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.46.ffn_gate_shexp.weight
|
119 |
+
109: 5120 | 5120, 1, 1, 1 | F32 | blk.46.ffn_norm.weight
|
120 |
+
110: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.46.ffn_up_exps.weight
|
121 |
+
111: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.46.ffn_up_shexp.weight
|
122 |
+
112: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.47.attn_kv_a_mqa.weight
|
123 |
+
113: 512 | 512, 1, 1, 1 | F32 | blk.47.attn_kv_a_norm.weight
|
124 |
+
114: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.47.attn_kv_b.weight
|
125 |
+
115: 5120 | 5120, 1, 1, 1 | F32 | blk.47.attn_norm.weight
|
126 |
+
116: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.47.attn_output.weight
|
127 |
+
117: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.47.attn_q_a.weight
|
128 |
+
118: 1536 | 1536, 1, 1, 1 | F32 | blk.47.attn_q_a_norm.weight
|
129 |
+
119: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.47.attn_q_b.weight
|
130 |
+
120: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.47.ffn_down_exps.weight
|
131 |
+
121: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.47.ffn_down_shexp.weight
|
132 |
+
122: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.47.ffn_gate_exps.weight
|
133 |
+
123: 819200 | 5120, 160, 1, 1 | F32 | blk.47.ffn_gate_inp.weight
|
134 |
+
124: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.47.ffn_gate_shexp.weight
|
135 |
+
125: 5120 | 5120, 1, 1, 1 | F32 | blk.47.ffn_norm.weight
|
136 |
+
126: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.47.ffn_up_exps.weight
|
137 |
+
127: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.47.ffn_up_shexp.weight
|
138 |
+
128: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.48.attn_kv_a_mqa.weight
|
139 |
+
129: 512 | 512, 1, 1, 1 | F32 | blk.48.attn_kv_a_norm.weight
|
140 |
+
130: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.48.attn_kv_b.weight
|
141 |
+
131: 5120 | 5120, 1, 1, 1 | F32 | blk.48.attn_norm.weight
|
142 |
+
132: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.48.attn_output.weight
|
143 |
+
133: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.48.attn_q_a.weight
|
144 |
+
134: 1536 | 1536, 1, 1, 1 | F32 | blk.48.attn_q_a_norm.weight
|
145 |
+
135: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.48.attn_q_b.weight
|
146 |
+
136: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.48.ffn_down_exps.weight
|
147 |
+
137: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.48.ffn_down_shexp.weight
|
148 |
+
138: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.48.ffn_gate_exps.weight
|
149 |
+
139: 819200 | 5120, 160, 1, 1 | F32 | blk.48.ffn_gate_inp.weight
|
150 |
+
140: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.48.ffn_gate_shexp.weight
|
151 |
+
141: 5120 | 5120, 1, 1, 1 | F32 | blk.48.ffn_norm.weight
|
152 |
+
142: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.48.ffn_up_exps.weight
|
153 |
+
143: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.48.ffn_up_shexp.weight
|
154 |
+
144: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.49.attn_kv_a_mqa.weight
|
155 |
+
145: 512 | 512, 1, 1, 1 | F32 | blk.49.attn_kv_a_norm.weight
|
156 |
+
146: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.49.attn_kv_b.weight
|
157 |
+
147: 5120 | 5120, 1, 1, 1 | F32 | blk.49.attn_norm.weight
|
158 |
+
148: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.49.attn_output.weight
|
159 |
+
149: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.49.attn_q_a.weight
|
160 |
+
150: 1536 | 1536, 1, 1, 1 | F32 | blk.49.attn_q_a_norm.weight
|
161 |
+
151: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.49.attn_q_b.weight
|
162 |
+
152: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.49.ffn_down_exps.weight
|
163 |
+
153: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.49.ffn_down_shexp.weight
|
164 |
+
154: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.49.ffn_gate_exps.weight
|
165 |
+
155: 819200 | 5120, 160, 1, 1 | F32 | blk.49.ffn_gate_inp.weight
|
166 |
+
156: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.49.ffn_gate_shexp.weight
|
167 |
+
157: 5120 | 5120, 1, 1, 1 | F32 | blk.49.ffn_norm.weight
|
168 |
+
158: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.49.ffn_up_exps.weight
|
169 |
+
159: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.49.ffn_up_shexp.weight
|
170 |
+
160: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.50.attn_kv_a_mqa.weight
|
171 |
+
161: 512 | 512, 1, 1, 1 | F32 | blk.50.attn_kv_a_norm.weight
|
172 |
+
162: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.50.attn_kv_b.weight
|
173 |
+
163: 5120 | 5120, 1, 1, 1 | F32 | blk.50.attn_norm.weight
|
174 |
+
164: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.50.attn_output.weight
|
175 |
+
165: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.50.attn_q_a.weight
|
176 |
+
166: 1536 | 1536, 1, 1, 1 | F32 | blk.50.attn_q_a_norm.weight
|
177 |
+
167: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.50.attn_q_b.weight
|
178 |
+
168: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.50.ffn_down_exps.weight
|
179 |
+
169: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.50.ffn_down_shexp.weight
|
180 |
+
170: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.50.ffn_gate_exps.weight
|
181 |
+
171: 819200 | 5120, 160, 1, 1 | F32 | blk.50.ffn_gate_inp.weight
|
182 |
+
172: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.50.ffn_gate_shexp.weight
|
183 |
+
173: 5120 | 5120, 1, 1, 1 | F32 | blk.50.ffn_norm.weight
|
184 |
+
174: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.50.ffn_up_exps.weight
|
185 |
+
175: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.50.ffn_up_shexp.weight
|
186 |
+
176: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.51.attn_kv_a_mqa.weight
|
187 |
+
177: 512 | 512, 1, 1, 1 | F32 | blk.51.attn_kv_a_norm.weight
|
188 |
+
178: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.51.attn_kv_b.weight
|
189 |
+
179: 5120 | 5120, 1, 1, 1 | F32 | blk.51.attn_norm.weight
|
190 |
+
180: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.51.attn_output.weight
|
191 |
+
181: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.51.attn_q_a.weight
|
192 |
+
182: 1536 | 1536, 1, 1, 1 | F32 | blk.51.attn_q_a_norm.weight
|
193 |
+
183: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.51.attn_q_b.weight
|
194 |
+
184: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.51.ffn_down_exps.weight
|
195 |
+
185: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.51.ffn_down_shexp.weight
|
196 |
+
186: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.51.ffn_gate_exps.weight
|
197 |
+
187: 819200 | 5120, 160, 1, 1 | F32 | blk.51.ffn_gate_inp.weight
|
198 |
+
188: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.51.ffn_gate_shexp.weight
|
199 |
+
189: 5120 | 5120, 1, 1, 1 | F32 | blk.51.ffn_norm.weight
|
200 |
+
190: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.51.ffn_up_exps.weight
|
201 |
+
191: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.51.ffn_up_shexp.weight
|
202 |
+
192: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.52.attn_kv_a_mqa.weight
|
203 |
+
193: 512 | 512, 1, 1, 1 | F32 | blk.52.attn_kv_a_norm.weight
|
204 |
+
194: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.52.attn_kv_b.weight
|
205 |
+
195: 5120 | 5120, 1, 1, 1 | F32 | blk.52.attn_norm.weight
|
206 |
+
196: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.52.attn_output.weight
|
207 |
+
197: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.52.attn_q_a.weight
|
208 |
+
198: 1536 | 1536, 1, 1, 1 | F32 | blk.52.attn_q_a_norm.weight
|
209 |
+
199: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.52.attn_q_b.weight
|
210 |
+
200: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.52.ffn_down_exps.weight
|
211 |
+
201: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.52.ffn_down_shexp.weight
|
212 |
+
202: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.52.ffn_gate_exps.weight
|
213 |
+
203: 819200 | 5120, 160, 1, 1 | F32 | blk.52.ffn_gate_inp.weight
|
214 |
+
204: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.52.ffn_gate_shexp.weight
|
215 |
+
205: 5120 | 5120, 1, 1, 1 | F32 | blk.52.ffn_norm.weight
|
216 |
+
206: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.52.ffn_up_exps.weight
|
217 |
+
207: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.52.ffn_up_shexp.weight
|
218 |
+
208: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.53.attn_kv_a_mqa.weight
|
219 |
+
209: 512 | 512, 1, 1, 1 | F32 | blk.53.attn_kv_a_norm.weight
|
220 |
+
210: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.53.attn_kv_b.weight
|
221 |
+
211: 5120 | 5120, 1, 1, 1 | F32 | blk.53.attn_norm.weight
|
222 |
+
212: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.53.attn_output.weight
|
223 |
+
213: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.53.attn_q_a.weight
|
224 |
+
214: 1536 | 1536, 1, 1, 1 | F32 | blk.53.attn_q_a_norm.weight
|
225 |
+
215: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.53.attn_q_b.weight
|
226 |
+
216: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.53.ffn_down_exps.weight
|
227 |
+
217: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.53.ffn_down_shexp.weight
|
228 |
+
218: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.53.ffn_gate_exps.weight
|
229 |
+
219: 819200 | 5120, 160, 1, 1 | F32 | blk.53.ffn_gate_inp.weight
|
230 |
+
220: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.53.ffn_gate_shexp.weight
|
231 |
+
221: 5120 | 5120, 1, 1, 1 | F32 | blk.53.ffn_norm.weight
|
232 |
+
222: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.53.ffn_up_exps.weight
|
233 |
+
223: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.53.ffn_up_shexp.weight
|
234 |
+
224: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.54.attn_kv_a_mqa.weight
|
235 |
+
225: 512 | 512, 1, 1, 1 | F32 | blk.54.attn_kv_a_norm.weight
|
236 |
+
226: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.54.attn_kv_b.weight
|
237 |
+
227: 5120 | 5120, 1, 1, 1 | F32 | blk.54.attn_norm.weight
|
238 |
+
228: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.54.attn_output.weight
|
239 |
+
229: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.54.attn_q_a.weight
|
240 |
+
230: 1536 | 1536, 1, 1, 1 | F32 | blk.54.attn_q_a_norm.weight
|
241 |
+
231: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.54.attn_q_b.weight
|
242 |
+
232: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.54.ffn_down_exps.weight
|
243 |
+
233: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.54.ffn_down_shexp.weight
|
244 |
+
234: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.54.ffn_gate_exps.weight
|
245 |
+
235: 819200 | 5120, 160, 1, 1 | F32 | blk.54.ffn_gate_inp.weight
|
246 |
+
236: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.54.ffn_gate_shexp.weight
|
247 |
+
237: 5120 | 5120, 1, 1, 1 | F32 | blk.54.ffn_norm.weight
|
248 |
+
238: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.54.ffn_up_exps.weight
|
249 |
+
239: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.54.ffn_up_shexp.weight
|
250 |
+
240: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.55.attn_kv_a_mqa.weight
|
251 |
+
241: 512 | 512, 1, 1, 1 | F32 | blk.55.attn_kv_a_norm.weight
|
252 |
+
242: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.55.attn_kv_b.weight
|
253 |
+
243: 5120 | 5120, 1, 1, 1 | F32 | blk.55.attn_norm.weight
|
254 |
+
244: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.55.attn_output.weight
|
255 |
+
245: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.55.attn_q_a.weight
|
256 |
+
246: 1536 | 1536, 1, 1, 1 | F32 | blk.55.attn_q_a_norm.weight
|
257 |
+
247: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.55.attn_q_b.weight
|
258 |
+
248: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.55.ffn_down_exps.weight
|
259 |
+
249: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.55.ffn_down_shexp.weight
|
260 |
+
250: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.55.ffn_gate_exps.weight
|
261 |
+
251: 819200 | 5120, 160, 1, 1 | F32 | blk.55.ffn_gate_inp.weight
|
262 |
+
252: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.55.ffn_gate_shexp.weight
|
263 |
+
253: 5120 | 5120, 1, 1, 1 | F32 | blk.55.ffn_norm.weight
|
264 |
+
254: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.55.ffn_up_exps.weight
|
265 |
+
255: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.55.ffn_up_shexp.weight
|
266 |
+
256: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.56.attn_kv_a_mqa.weight
|
267 |
+
257: 512 | 512, 1, 1, 1 | F32 | blk.56.attn_kv_a_norm.weight
|
268 |
+
258: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.56.attn_kv_b.weight
|
269 |
+
259: 5120 | 5120, 1, 1, 1 | F32 | blk.56.attn_norm.weight
|
270 |
+
260: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.56.attn_output.weight
|
271 |
+
261: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.56.attn_q_a.weight
|
272 |
+
262: 1536 | 1536, 1, 1, 1 | F32 | blk.56.attn_q_a_norm.weight
|
273 |
+
263: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.56.attn_q_b.weight
|
274 |
+
264: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.56.ffn_down_exps.weight
|
275 |
+
265: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.56.ffn_down_shexp.weight
|
276 |
+
266: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.56.ffn_gate_exps.weight
|
277 |
+
267: 819200 | 5120, 160, 1, 1 | F32 | blk.56.ffn_gate_inp.weight
|
278 |
+
268: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.56.ffn_gate_shexp.weight
|
279 |
+
269: 5120 | 5120, 1, 1, 1 | F32 | blk.56.ffn_norm.weight
|
280 |
+
270: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.56.ffn_up_exps.weight
|
281 |
+
271: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.56.ffn_up_shexp.weight
|
282 |
+
272: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.57.attn_kv_a_mqa.weight
|
283 |
+
273: 512 | 512, 1, 1, 1 | F32 | blk.57.attn_kv_a_norm.weight
|
284 |
+
274: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.57.attn_kv_b.weight
|
285 |
+
275: 5120 | 5120, 1, 1, 1 | F32 | blk.57.attn_norm.weight
|
286 |
+
276: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.57.attn_output.weight
|
287 |
+
277: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.57.attn_q_a.weight
|
288 |
+
278: 1536 | 1536, 1, 1, 1 | F32 | blk.57.attn_q_a_norm.weight
|
289 |
+
279: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.57.attn_q_b.weight
|
290 |
+
280: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.57.ffn_down_exps.weight
|
291 |
+
281: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.57.ffn_down_shexp.weight
|
292 |
+
282: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.57.ffn_gate_exps.weight
|
293 |
+
283: 819200 | 5120, 160, 1, 1 | F32 | blk.57.ffn_gate_inp.weight
|
294 |
+
284: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.57.ffn_gate_shexp.weight
|
295 |
+
285: 5120 | 5120, 1, 1, 1 | F32 | blk.57.ffn_norm.weight
|
296 |
+
286: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.57.ffn_up_exps.weight
|
297 |
+
287: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.57.ffn_up_shexp.weight
|
298 |
+
288: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.58.attn_kv_a_mqa.weight
|
299 |
+
289: 512 | 512, 1, 1, 1 | F32 | blk.58.attn_kv_a_norm.weight
|
300 |
+
290: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.58.attn_kv_b.weight
|
301 |
+
291: 5120 | 5120, 1, 1, 1 | F32 | blk.58.attn_norm.weight
|
302 |
+
292: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.58.attn_output.weight
|
303 |
+
293: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.58.attn_q_a.weight
|
304 |
+
294: 1536 | 1536, 1, 1, 1 | F32 | blk.58.attn_q_a_norm.weight
|
305 |
+
295: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.58.attn_q_b.weight
|
306 |
+
296: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.58.ffn_down_exps.weight
|
307 |
+
297: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.58.ffn_down_shexp.weight
|
308 |
+
298: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.58.ffn_gate_exps.weight
|
309 |
+
299: 819200 | 5120, 160, 1, 1 | F32 | blk.58.ffn_gate_inp.weight
|
310 |
+
300: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.58.ffn_gate_shexp.weight
|
311 |
+
301: 5120 | 5120, 1, 1, 1 | F32 | blk.58.ffn_norm.weight
|
312 |
+
302: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.58.ffn_up_exps.weight
|
313 |
+
303: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.58.ffn_up_shexp.weight
|
314 |
+
304: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.59.attn_kv_a_mqa.weight
|
315 |
+
305: 512 | 512, 1, 1, 1 | F32 | blk.59.attn_kv_a_norm.weight
|
316 |
+
306: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.59.attn_kv_b.weight
|
317 |
+
307: 5120 | 5120, 1, 1, 1 | F32 | blk.59.attn_norm.weight
|
318 |
+
308: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.59.attn_output.weight
|
319 |
+
309: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.59.attn_q_a.weight
|
320 |
+
310: 1536 | 1536, 1, 1, 1 | F32 | blk.59.attn_q_a_norm.weight
|
321 |
+
311: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.59.attn_q_b.weight
|
322 |
+
312: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.59.ffn_down_exps.weight
|
323 |
+
313: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.59.ffn_down_shexp.weight
|
324 |
+
314: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.59.ffn_gate_exps.weight
|
325 |
+
315: 819200 | 5120, 160, 1, 1 | F32 | blk.59.ffn_gate_inp.weight
|
326 |
+
316: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.59.ffn_gate_shexp.weight
|
327 |
+
317: 5120 | 5120, 1, 1, 1 | F32 | blk.59.ffn_norm.weight
|
328 |
+
318: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.59.ffn_up_exps.weight
|
329 |
+
319: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.59.ffn_up_shexp.weight
|