DeepSeek-v2.5-1210-UD-gguf / DeepSeek-v2.5-1210-UD-iq3_m-00001-of-00003.gguf.tensors.txt
gnisho's picture
Upload 11 files
0746586 verified
raw
history blame
31.9 kB
INFO:gguf-dump:* Loading: DeepSeek-v2.5-1210-UD-iq3_m-00001-of-00003.gguf
* File is LITTLE endian, script is running on a LITTLE endian host.
* Dumping 56 key/value pair(s)
1: UINT32 | 1 | GGUF.version = 3
2: UINT64 | 1 | GGUF.tensor_count = 320
3: UINT64 | 1 | GGUF.kv_count = 53
4: STRING | 1 | general.architecture = 'deepseek2'
5: STRING | 1 | general.type = 'model'
6: STRING | 1 | general.name = 'Dsv25'
7: STRING | 1 | general.size_label = '160x14B'
8: STRING | 1 | general.license = 'other'
9: STRING | 1 | general.license.name = 'deepseek'
10: STRING | 1 | general.license.link = 'https://github.com/deepseek-ai/DeepSeek-V2/blob/main/LICENSE'
11: UINT32 | 1 | deepseek2.block_count = 60
12: UINT32 | 1 | deepseek2.context_length = 163840
13: UINT32 | 1 | deepseek2.embedding_length = 5120
14: UINT32 | 1 | deepseek2.feed_forward_length = 12288
15: UINT32 | 1 | deepseek2.attention.head_count = 128
16: UINT32 | 1 | deepseek2.attention.head_count_kv = 128
17: FLOAT32 | 1 | deepseek2.rope.freq_base = 10000.0
18: FLOAT32 | 1 | deepseek2.attention.layer_norm_rms_epsilon = 9.999999974752427e-07
19: UINT32 | 1 | deepseek2.expert_used_count = 6
20: UINT32 | 1 | deepseek2.leading_dense_block_count = 1
21: UINT32 | 1 | deepseek2.vocab_size = 102400
22: UINT32 | 1 | deepseek2.attention.q_lora_rank = 1536
23: UINT32 | 1 | deepseek2.attention.kv_lora_rank = 512
24: UINT32 | 1 | deepseek2.attention.key_length = 192
25: UINT32 | 1 | deepseek2.attention.value_length = 128
26: UINT32 | 1 | deepseek2.expert_feed_forward_length = 1536
27: UINT32 | 1 | deepseek2.expert_count = 160
28: UINT32 | 1 | deepseek2.expert_shared_count = 2
29: FLOAT32 | 1 | deepseek2.expert_weights_scale = 16.0
30: BOOL | 1 | deepseek2.expert_weights_norm = False
31: UINT32 | 1 | deepseek2.expert_gating_func = 1
32: UINT32 | 1 | deepseek2.rope.dimension_count = 64
33: STRING | 1 | deepseek2.rope.scaling.type = 'yarn'
34: FLOAT32 | 1 | deepseek2.rope.scaling.factor = 40.0
35: UINT32 | 1 | deepseek2.rope.scaling.original_context_length = 4096
36: FLOAT32 | 1 | deepseek2.rope.scaling.yarn_log_multiplier = 0.10000000149011612
37: STRING | 1 | tokenizer.ggml.model = 'gpt2'
38: STRING | 1 | tokenizer.ggml.pre = 'deepseek-llm'
39: [STRING] | 102400 | tokenizer.ggml.tokens
40: [INT32] | 102400 | tokenizer.ggml.token_type
41: [STRING] | 99757 | tokenizer.ggml.merges
42: UINT32 | 1 | tokenizer.ggml.bos_token_id = 100000
43: UINT32 | 1 | tokenizer.ggml.eos_token_id = 100001
44: UINT32 | 1 | tokenizer.ggml.padding_token_id = 100001
45: BOOL | 1 | tokenizer.ggml.add_bos_token = True
46: BOOL | 1 | tokenizer.ggml.add_eos_token = False
47: STRING | 1 | tokenizer.chat_template = '{% if not add_generation_prompt is defined %}{% set add_gene'
48: UINT32 | 1 | general.quantization_version = 2
49: UINT32 | 1 | general.file_type = 27
50: STRING | 1 | quantize.imatrix.file = '/archive/nuc/LLM/raw/imatrix-DeepSeek-V2.5-1210-bartowski.da'
51: STRING | 1 | quantize.imatrix.dataset = '/training_dir/calibration_datav3.txt'
52: INT32 | 1 | quantize.imatrix.entries_count = 716
53: INT32 | 1 | quantize.imatrix.chunks_count = 139
54: UINT16 | 1 | split.no = 0
55: INT32 | 1 | split.tensors.count = 959
56: UINT16 | 1 | split.count = 3
* Dumping 320 tensor(s)
1: 524288000 | 5120, 102400, 1, 1 | Q6_K | output.weight
2: 5120 | 5120, 1, 1, 1 | F32 | output_norm.weight
3: 524288000 | 5120, 102400, 1, 1 | Q6_K | token_embd.weight
4: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.0.attn_kv_a_mqa.weight
5: 512 | 512, 1, 1, 1 | F32 | blk.0.attn_kv_a_norm.weight
6: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.0.attn_kv_b.weight
7: 5120 | 5120, 1, 1, 1 | F32 | blk.0.attn_norm.weight
8: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.0.attn_output.weight
9: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.0.attn_q_a.weight
10: 1536 | 1536, 1, 1, 1 | F32 | blk.0.attn_q_a_norm.weight
11: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.0.attn_q_b.weight
12: 62914560 | 12288, 5120, 1, 1 | Q6_K | blk.0.ffn_down.weight
13: 62914560 | 5120, 12288, 1, 1 | Q4_K | blk.0.ffn_gate.weight
14: 5120 | 5120, 1, 1, 1 | F32 | blk.0.ffn_norm.weight
15: 62914560 | 5120, 12288, 1, 1 | Q4_K | blk.0.ffn_up.weight
16: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.1.attn_kv_a_mqa.weight
17: 512 | 512, 1, 1, 1 | F32 | blk.1.attn_kv_a_norm.weight
18: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.1.attn_kv_b.weight
19: 5120 | 5120, 1, 1, 1 | F32 | blk.1.attn_norm.weight
20: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.1.attn_output.weight
21: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.1.attn_q_a.weight
22: 1536 | 1536, 1, 1, 1 | F32 | blk.1.attn_q_a_norm.weight
23: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.1.attn_q_b.weight
24: 1258291200 | 1536, 5120, 160, 1 | Q4_K | blk.1.ffn_down_exps.weight
25: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.1.ffn_down_shexp.weight
26: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.1.ffn_gate_exps.weight
27: 819200 | 5120, 160, 1, 1 | F32 | blk.1.ffn_gate_inp.weight
28: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.1.ffn_gate_shexp.weight
29: 5120 | 5120, 1, 1, 1 | F32 | blk.1.ffn_norm.weight
30: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.1.ffn_up_exps.weight
31: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.1.ffn_up_shexp.weight
32: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.2.attn_kv_a_mqa.weight
33: 512 | 512, 1, 1, 1 | F32 | blk.2.attn_kv_a_norm.weight
34: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.2.attn_kv_b.weight
35: 5120 | 5120, 1, 1, 1 | F32 | blk.2.attn_norm.weight
36: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.2.attn_output.weight
37: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.2.attn_q_a.weight
38: 1536 | 1536, 1, 1, 1 | F32 | blk.2.attn_q_a_norm.weight
39: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.2.attn_q_b.weight
40: 1258291200 | 1536, 5120, 160, 1 | Q4_K | blk.2.ffn_down_exps.weight
41: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.2.ffn_down_shexp.weight
42: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.2.ffn_gate_exps.weight
43: 819200 | 5120, 160, 1, 1 | F32 | blk.2.ffn_gate_inp.weight
44: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.2.ffn_gate_shexp.weight
45: 5120 | 5120, 1, 1, 1 | F32 | blk.2.ffn_norm.weight
46: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.2.ffn_up_exps.weight
47: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.2.ffn_up_shexp.weight
48: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.3.attn_kv_a_mqa.weight
49: 512 | 512, 1, 1, 1 | F32 | blk.3.attn_kv_a_norm.weight
50: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.3.attn_kv_b.weight
51: 5120 | 5120, 1, 1, 1 | F32 | blk.3.attn_norm.weight
52: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.3.attn_output.weight
53: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.3.attn_q_a.weight
54: 1536 | 1536, 1, 1, 1 | F32 | blk.3.attn_q_a_norm.weight
55: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.3.attn_q_b.weight
56: 1258291200 | 1536, 5120, 160, 1 | Q4_K | blk.3.ffn_down_exps.weight
57: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.3.ffn_down_shexp.weight
58: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.3.ffn_gate_exps.weight
59: 819200 | 5120, 160, 1, 1 | F32 | blk.3.ffn_gate_inp.weight
60: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.3.ffn_gate_shexp.weight
61: 5120 | 5120, 1, 1, 1 | F32 | blk.3.ffn_norm.weight
62: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.3.ffn_up_exps.weight
63: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.3.ffn_up_shexp.weight
64: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.4.attn_kv_a_mqa.weight
65: 512 | 512, 1, 1, 1 | F32 | blk.4.attn_kv_a_norm.weight
66: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.4.attn_kv_b.weight
67: 5120 | 5120, 1, 1, 1 | F32 | blk.4.attn_norm.weight
68: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.4.attn_output.weight
69: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.4.attn_q_a.weight
70: 1536 | 1536, 1, 1, 1 | F32 | blk.4.attn_q_a_norm.weight
71: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.4.attn_q_b.weight
72: 1258291200 | 1536, 5120, 160, 1 | Q4_K | blk.4.ffn_down_exps.weight
73: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.4.ffn_down_shexp.weight
74: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.4.ffn_gate_exps.weight
75: 819200 | 5120, 160, 1, 1 | F32 | blk.4.ffn_gate_inp.weight
76: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.4.ffn_gate_shexp.weight
77: 5120 | 5120, 1, 1, 1 | F32 | blk.4.ffn_norm.weight
78: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.4.ffn_up_exps.weight
79: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.4.ffn_up_shexp.weight
80: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.5.attn_kv_a_mqa.weight
81: 512 | 512, 1, 1, 1 | F32 | blk.5.attn_kv_a_norm.weight
82: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.5.attn_kv_b.weight
83: 5120 | 5120, 1, 1, 1 | F32 | blk.5.attn_norm.weight
84: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.5.attn_output.weight
85: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.5.attn_q_a.weight
86: 1536 | 1536, 1, 1, 1 | F32 | blk.5.attn_q_a_norm.weight
87: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.5.attn_q_b.weight
88: 1258291200 | 1536, 5120, 160, 1 | Q4_K | blk.5.ffn_down_exps.weight
89: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.5.ffn_down_shexp.weight
90: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.5.ffn_gate_exps.weight
91: 819200 | 5120, 160, 1, 1 | F32 | blk.5.ffn_gate_inp.weight
92: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.5.ffn_gate_shexp.weight
93: 5120 | 5120, 1, 1, 1 | F32 | blk.5.ffn_norm.weight
94: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.5.ffn_up_exps.weight
95: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.5.ffn_up_shexp.weight
96: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.6.attn_kv_a_mqa.weight
97: 512 | 512, 1, 1, 1 | F32 | blk.6.attn_kv_a_norm.weight
98: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.6.attn_kv_b.weight
99: 5120 | 5120, 1, 1, 1 | F32 | blk.6.attn_norm.weight
100: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.6.attn_output.weight
101: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.6.attn_q_a.weight
102: 1536 | 1536, 1, 1, 1 | F32 | blk.6.attn_q_a_norm.weight
103: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.6.attn_q_b.weight
104: 1258291200 | 1536, 5120, 160, 1 | Q4_K | blk.6.ffn_down_exps.weight
105: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.6.ffn_down_shexp.weight
106: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.6.ffn_gate_exps.weight
107: 819200 | 5120, 160, 1, 1 | F32 | blk.6.ffn_gate_inp.weight
108: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.6.ffn_gate_shexp.weight
109: 5120 | 5120, 1, 1, 1 | F32 | blk.6.ffn_norm.weight
110: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.6.ffn_up_exps.weight
111: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.6.ffn_up_shexp.weight
112: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.7.attn_kv_a_mqa.weight
113: 512 | 512, 1, 1, 1 | F32 | blk.7.attn_kv_a_norm.weight
114: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.7.attn_kv_b.weight
115: 5120 | 5120, 1, 1, 1 | F32 | blk.7.attn_norm.weight
116: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.7.attn_output.weight
117: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.7.attn_q_a.weight
118: 1536 | 1536, 1, 1, 1 | F32 | blk.7.attn_q_a_norm.weight
119: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.7.attn_q_b.weight
120: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.7.ffn_down_exps.weight
121: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.7.ffn_down_shexp.weight
122: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.7.ffn_gate_exps.weight
123: 819200 | 5120, 160, 1, 1 | F32 | blk.7.ffn_gate_inp.weight
124: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.7.ffn_gate_shexp.weight
125: 5120 | 5120, 1, 1, 1 | F32 | blk.7.ffn_norm.weight
126: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.7.ffn_up_exps.weight
127: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.7.ffn_up_shexp.weight
128: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.8.attn_kv_a_mqa.weight
129: 512 | 512, 1, 1, 1 | F32 | blk.8.attn_kv_a_norm.weight
130: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.8.attn_kv_b.weight
131: 5120 | 5120, 1, 1, 1 | F32 | blk.8.attn_norm.weight
132: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.8.attn_output.weight
133: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.8.attn_q_a.weight
134: 1536 | 1536, 1, 1, 1 | F32 | blk.8.attn_q_a_norm.weight
135: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.8.attn_q_b.weight
136: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.8.ffn_down_exps.weight
137: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.8.ffn_down_shexp.weight
138: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.8.ffn_gate_exps.weight
139: 819200 | 5120, 160, 1, 1 | F32 | blk.8.ffn_gate_inp.weight
140: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.8.ffn_gate_shexp.weight
141: 5120 | 5120, 1, 1, 1 | F32 | blk.8.ffn_norm.weight
142: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.8.ffn_up_exps.weight
143: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.8.ffn_up_shexp.weight
144: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.9.attn_kv_a_mqa.weight
145: 512 | 512, 1, 1, 1 | F32 | blk.9.attn_kv_a_norm.weight
146: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.9.attn_kv_b.weight
147: 5120 | 5120, 1, 1, 1 | F32 | blk.9.attn_norm.weight
148: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.9.attn_output.weight
149: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.9.attn_q_a.weight
150: 1536 | 1536, 1, 1, 1 | F32 | blk.9.attn_q_a_norm.weight
151: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.9.attn_q_b.weight
152: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.9.ffn_down_exps.weight
153: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.9.ffn_down_shexp.weight
154: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.9.ffn_gate_exps.weight
155: 819200 | 5120, 160, 1, 1 | F32 | blk.9.ffn_gate_inp.weight
156: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.9.ffn_gate_shexp.weight
157: 5120 | 5120, 1, 1, 1 | F32 | blk.9.ffn_norm.weight
158: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.9.ffn_up_exps.weight
159: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.9.ffn_up_shexp.weight
160: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.10.attn_kv_a_mqa.weight
161: 512 | 512, 1, 1, 1 | F32 | blk.10.attn_kv_a_norm.weight
162: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.10.attn_kv_b.weight
163: 5120 | 5120, 1, 1, 1 | F32 | blk.10.attn_norm.weight
164: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.10.attn_output.weight
165: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.10.attn_q_a.weight
166: 1536 | 1536, 1, 1, 1 | F32 | blk.10.attn_q_a_norm.weight
167: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.10.attn_q_b.weight
168: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.10.ffn_down_exps.weight
169: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.10.ffn_down_shexp.weight
170: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.10.ffn_gate_exps.weight
171: 819200 | 5120, 160, 1, 1 | F32 | blk.10.ffn_gate_inp.weight
172: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.10.ffn_gate_shexp.weight
173: 5120 | 5120, 1, 1, 1 | F32 | blk.10.ffn_norm.weight
174: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.10.ffn_up_exps.weight
175: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.10.ffn_up_shexp.weight
176: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.11.attn_kv_a_mqa.weight
177: 512 | 512, 1, 1, 1 | F32 | blk.11.attn_kv_a_norm.weight
178: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.11.attn_kv_b.weight
179: 5120 | 5120, 1, 1, 1 | F32 | blk.11.attn_norm.weight
180: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.11.attn_output.weight
181: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.11.attn_q_a.weight
182: 1536 | 1536, 1, 1, 1 | F32 | blk.11.attn_q_a_norm.weight
183: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.11.attn_q_b.weight
184: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.11.ffn_down_exps.weight
185: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.11.ffn_down_shexp.weight
186: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.11.ffn_gate_exps.weight
187: 819200 | 5120, 160, 1, 1 | F32 | blk.11.ffn_gate_inp.weight
188: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.11.ffn_gate_shexp.weight
189: 5120 | 5120, 1, 1, 1 | F32 | blk.11.ffn_norm.weight
190: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.11.ffn_up_exps.weight
191: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.11.ffn_up_shexp.weight
192: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.12.attn_kv_a_mqa.weight
193: 512 | 512, 1, 1, 1 | F32 | blk.12.attn_kv_a_norm.weight
194: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.12.attn_kv_b.weight
195: 5120 | 5120, 1, 1, 1 | F32 | blk.12.attn_norm.weight
196: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.12.attn_output.weight
197: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.12.attn_q_a.weight
198: 1536 | 1536, 1, 1, 1 | F32 | blk.12.attn_q_a_norm.weight
199: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.12.attn_q_b.weight
200: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.12.ffn_down_exps.weight
201: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.12.ffn_down_shexp.weight
202: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.12.ffn_gate_exps.weight
203: 819200 | 5120, 160, 1, 1 | F32 | blk.12.ffn_gate_inp.weight
204: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.12.ffn_gate_shexp.weight
205: 5120 | 5120, 1, 1, 1 | F32 | blk.12.ffn_norm.weight
206: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.12.ffn_up_exps.weight
207: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.12.ffn_up_shexp.weight
208: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.13.attn_kv_a_mqa.weight
209: 512 | 512, 1, 1, 1 | F32 | blk.13.attn_kv_a_norm.weight
210: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.13.attn_kv_b.weight
211: 5120 | 5120, 1, 1, 1 | F32 | blk.13.attn_norm.weight
212: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.13.attn_output.weight
213: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.13.attn_q_a.weight
214: 1536 | 1536, 1, 1, 1 | F32 | blk.13.attn_q_a_norm.weight
215: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.13.attn_q_b.weight
216: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.13.ffn_down_exps.weight
217: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.13.ffn_down_shexp.weight
218: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.13.ffn_gate_exps.weight
219: 819200 | 5120, 160, 1, 1 | F32 | blk.13.ffn_gate_inp.weight
220: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.13.ffn_gate_shexp.weight
221: 5120 | 5120, 1, 1, 1 | F32 | blk.13.ffn_norm.weight
222: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.13.ffn_up_exps.weight
223: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.13.ffn_up_shexp.weight
224: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.14.attn_kv_a_mqa.weight
225: 512 | 512, 1, 1, 1 | F32 | blk.14.attn_kv_a_norm.weight
226: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.14.attn_kv_b.weight
227: 5120 | 5120, 1, 1, 1 | F32 | blk.14.attn_norm.weight
228: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.14.attn_output.weight
229: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.14.attn_q_a.weight
230: 1536 | 1536, 1, 1, 1 | F32 | blk.14.attn_q_a_norm.weight
231: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.14.attn_q_b.weight
232: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.14.ffn_down_exps.weight
233: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.14.ffn_down_shexp.weight
234: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.14.ffn_gate_exps.weight
235: 819200 | 5120, 160, 1, 1 | F32 | blk.14.ffn_gate_inp.weight
236: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.14.ffn_gate_shexp.weight
237: 5120 | 5120, 1, 1, 1 | F32 | blk.14.ffn_norm.weight
238: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.14.ffn_up_exps.weight
239: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.14.ffn_up_shexp.weight
240: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.15.attn_kv_a_mqa.weight
241: 512 | 512, 1, 1, 1 | F32 | blk.15.attn_kv_a_norm.weight
242: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.15.attn_kv_b.weight
243: 5120 | 5120, 1, 1, 1 | F32 | blk.15.attn_norm.weight
244: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.15.attn_output.weight
245: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.15.attn_q_a.weight
246: 1536 | 1536, 1, 1, 1 | F32 | blk.15.attn_q_a_norm.weight
247: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.15.attn_q_b.weight
248: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.15.ffn_down_exps.weight
249: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.15.ffn_down_shexp.weight
250: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.15.ffn_gate_exps.weight
251: 819200 | 5120, 160, 1, 1 | F32 | blk.15.ffn_gate_inp.weight
252: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.15.ffn_gate_shexp.weight
253: 5120 | 5120, 1, 1, 1 | F32 | blk.15.ffn_norm.weight
254: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.15.ffn_up_exps.weight
255: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.15.ffn_up_shexp.weight
256: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.16.attn_kv_a_mqa.weight
257: 512 | 512, 1, 1, 1 | F32 | blk.16.attn_kv_a_norm.weight
258: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.16.attn_kv_b.weight
259: 5120 | 5120, 1, 1, 1 | F32 | blk.16.attn_norm.weight
260: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.16.attn_output.weight
261: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.16.attn_q_a.weight
262: 1536 | 1536, 1, 1, 1 | F32 | blk.16.attn_q_a_norm.weight
263: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.16.attn_q_b.weight
264: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.16.ffn_down_exps.weight
265: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.16.ffn_down_shexp.weight
266: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.16.ffn_gate_exps.weight
267: 819200 | 5120, 160, 1, 1 | F32 | blk.16.ffn_gate_inp.weight
268: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.16.ffn_gate_shexp.weight
269: 5120 | 5120, 1, 1, 1 | F32 | blk.16.ffn_norm.weight
270: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.16.ffn_up_exps.weight
271: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.16.ffn_up_shexp.weight
272: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.17.attn_kv_a_mqa.weight
273: 512 | 512, 1, 1, 1 | F32 | blk.17.attn_kv_a_norm.weight
274: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.17.attn_kv_b.weight
275: 5120 | 5120, 1, 1, 1 | F32 | blk.17.attn_norm.weight
276: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.17.attn_output.weight
277: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.17.attn_q_a.weight
278: 1536 | 1536, 1, 1, 1 | F32 | blk.17.attn_q_a_norm.weight
279: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.17.attn_q_b.weight
280: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.17.ffn_down_exps.weight
281: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.17.ffn_down_shexp.weight
282: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.17.ffn_gate_exps.weight
283: 819200 | 5120, 160, 1, 1 | F32 | blk.17.ffn_gate_inp.weight
284: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.17.ffn_gate_shexp.weight
285: 5120 | 5120, 1, 1, 1 | F32 | blk.17.ffn_norm.weight
286: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.17.ffn_up_exps.weight
287: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.17.ffn_up_shexp.weight
288: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.18.attn_kv_a_mqa.weight
289: 512 | 512, 1, 1, 1 | F32 | blk.18.attn_kv_a_norm.weight
290: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.18.attn_kv_b.weight
291: 5120 | 5120, 1, 1, 1 | F32 | blk.18.attn_norm.weight
292: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.18.attn_output.weight
293: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.18.attn_q_a.weight
294: 1536 | 1536, 1, 1, 1 | F32 | blk.18.attn_q_a_norm.weight
295: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.18.attn_q_b.weight
296: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.18.ffn_down_exps.weight
297: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.18.ffn_down_shexp.weight
298: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.18.ffn_gate_exps.weight
299: 819200 | 5120, 160, 1, 1 | F32 | blk.18.ffn_gate_inp.weight
300: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.18.ffn_gate_shexp.weight
301: 5120 | 5120, 1, 1, 1 | F32 | blk.18.ffn_norm.weight
302: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.18.ffn_up_exps.weight
303: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.18.ffn_up_shexp.weight
304: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.19.attn_kv_a_mqa.weight
305: 512 | 512, 1, 1, 1 | F32 | blk.19.attn_kv_a_norm.weight
306: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.19.attn_kv_b.weight
307: 5120 | 5120, 1, 1, 1 | F32 | blk.19.attn_norm.weight
308: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.19.attn_output.weight
309: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.19.attn_q_a.weight
310: 1536 | 1536, 1, 1, 1 | F32 | blk.19.attn_q_a_norm.weight
311: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.19.attn_q_b.weight
312: 1258291200 | 1536, 5120, 160, 1 | IQ3_S | blk.19.ffn_down_exps.weight
313: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.19.ffn_down_shexp.weight
314: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.19.ffn_gate_exps.weight
315: 819200 | 5120, 160, 1, 1 | F32 | blk.19.ffn_gate_inp.weight
316: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.19.ffn_gate_shexp.weight
317: 5120 | 5120, 1, 1, 1 | F32 | blk.19.ffn_norm.weight
318: 1258291200 | 5120, 1536, 160, 1 | IQ3_S | blk.19.ffn_up_exps.weight
319: 15728640 | 5120, 3072, 1, 1 | Q4_K | blk.19.ffn_up_shexp.weight
320: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.20.attn_kv_a_mqa.weight