File size: 45,864 Bytes
0746586
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
INFO:gguf-dump:* Loading: DeepSeek-v2.5-1210-UD-iq2_s-00001-of-00002.gguf
* File is LITTLE endian, script is running on a LITTLE endian host.
* Dumping 56 key/value pair(s)
      1: UINT32     |        1 | GGUF.version = 3
      2: UINT64     |        1 | GGUF.tensor_count = 480
      3: UINT64     |        1 | GGUF.kv_count = 53
      4: STRING     |        1 | general.architecture = 'deepseek2'
      5: STRING     |        1 | general.type = 'model'
      6: STRING     |        1 | general.name = 'Dsv25'
      7: STRING     |        1 | general.size_label = '160x14B'
      8: STRING     |        1 | general.license = 'other'
      9: STRING     |        1 | general.license.name = 'deepseek'
     10: STRING     |        1 | general.license.link = 'https://github.com/deepseek-ai/DeepSeek-V2/blob/main/LICENSE'
     11: UINT32     |        1 | deepseek2.block_count = 60
     12: UINT32     |        1 | deepseek2.context_length = 163840
     13: UINT32     |        1 | deepseek2.embedding_length = 5120
     14: UINT32     |        1 | deepseek2.feed_forward_length = 12288
     15: UINT32     |        1 | deepseek2.attention.head_count = 128
     16: UINT32     |        1 | deepseek2.attention.head_count_kv = 128
     17: FLOAT32    |        1 | deepseek2.rope.freq_base = 10000.0
     18: FLOAT32    |        1 | deepseek2.attention.layer_norm_rms_epsilon = 9.999999974752427e-07
     19: UINT32     |        1 | deepseek2.expert_used_count = 6
     20: UINT32     |        1 | deepseek2.leading_dense_block_count = 1
     21: UINT32     |        1 | deepseek2.vocab_size = 102400
     22: UINT32     |        1 | deepseek2.attention.q_lora_rank = 1536
     23: UINT32     |        1 | deepseek2.attention.kv_lora_rank = 512
     24: UINT32     |        1 | deepseek2.attention.key_length = 192
     25: UINT32     |        1 | deepseek2.attention.value_length = 128
     26: UINT32     |        1 | deepseek2.expert_feed_forward_length = 1536
     27: UINT32     |        1 | deepseek2.expert_count = 160
     28: UINT32     |        1 | deepseek2.expert_shared_count = 2
     29: FLOAT32    |        1 | deepseek2.expert_weights_scale = 16.0
     30: BOOL       |        1 | deepseek2.expert_weights_norm = False
     31: UINT32     |        1 | deepseek2.expert_gating_func = 1
     32: UINT32     |        1 | deepseek2.rope.dimension_count = 64
     33: STRING     |        1 | deepseek2.rope.scaling.type = 'yarn'
     34: FLOAT32    |        1 | deepseek2.rope.scaling.factor = 40.0
     35: UINT32     |        1 | deepseek2.rope.scaling.original_context_length = 4096
     36: FLOAT32    |        1 | deepseek2.rope.scaling.yarn_log_multiplier = 0.10000000149011612
     37: STRING     |        1 | tokenizer.ggml.model = 'gpt2'
     38: STRING     |        1 | tokenizer.ggml.pre = 'deepseek-llm'
     39: [STRING]   |   102400 | tokenizer.ggml.tokens
     40: [INT32]    |   102400 | tokenizer.ggml.token_type
     41: [STRING]   |    99757 | tokenizer.ggml.merges
     42: UINT32     |        1 | tokenizer.ggml.bos_token_id = 100000
     43: UINT32     |        1 | tokenizer.ggml.eos_token_id = 100001
     44: UINT32     |        1 | tokenizer.ggml.padding_token_id = 100001
     45: BOOL       |        1 | tokenizer.ggml.add_bos_token = True
     46: BOOL       |        1 | tokenizer.ggml.add_eos_token = False
     47: STRING     |        1 | tokenizer.chat_template = '{% if not add_generation_prompt is defined %}{% set add_gene'
     48: UINT32     |        1 | general.quantization_version = 2
     49: UINT32     |        1 | general.file_type = 28
     50: STRING     |        1 | quantize.imatrix.file = '/archive/nuc/LLM/raw/imatrix-DeepSeek-V2.5-1210-bartowski.da'
     51: STRING     |        1 | quantize.imatrix.dataset = '/training_dir/calibration_datav3.txt'
     52: INT32      |        1 | quantize.imatrix.entries_count = 716
     53: INT32      |        1 | quantize.imatrix.chunks_count = 139
     54: UINT16     |        1 | split.no = 0
     55: INT32      |        1 | split.tensors.count = 959
     56: UINT16     |        1 | split.count = 2
* Dumping 480 tensor(s)
      1:  524288000 |  5120, 102400,     1,     1 | Q6_K    | output.weight
      2:       5120 |  5120,     1,     1,     1 | F32     | output_norm.weight
      3:  524288000 |  5120, 102400,     1,     1 | Q6_K    | token_embd.weight
      4:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.0.attn_kv_a_mqa.weight
      5:        512 |   512,     1,     1,     1 | F32     | blk.0.attn_kv_a_norm.weight
      6:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.0.attn_kv_b.weight
      7:       5120 |  5120,     1,     1,     1 | F32     | blk.0.attn_norm.weight
      8:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.0.attn_output.weight
      9:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.0.attn_q_a.weight
     10:       1536 |  1536,     1,     1,     1 | F32     | blk.0.attn_q_a_norm.weight
     11:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.0.attn_q_b.weight
     12:   62914560 | 12288,  5120,     1,     1 | Q6_K    | blk.0.ffn_down.weight
     13:   62914560 |  5120, 12288,     1,     1 | Q4_K    | blk.0.ffn_gate.weight
     14:       5120 |  5120,     1,     1,     1 | F32     | blk.0.ffn_norm.weight
     15:   62914560 |  5120, 12288,     1,     1 | Q4_K    | blk.0.ffn_up.weight
     16:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.1.attn_kv_a_mqa.weight
     17:        512 |   512,     1,     1,     1 | F32     | blk.1.attn_kv_a_norm.weight
     18:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.1.attn_kv_b.weight
     19:       5120 |  5120,     1,     1,     1 | F32     | blk.1.attn_norm.weight
     20:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.1.attn_output.weight
     21:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.1.attn_q_a.weight
     22:       1536 |  1536,     1,     1,     1 | F32     | blk.1.attn_q_a_norm.weight
     23:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.1.attn_q_b.weight
     24: 1258291200 |  1536,  5120,   160,     1 | Q3_K    | blk.1.ffn_down_exps.weight
     25:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.1.ffn_down_shexp.weight
     26: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.1.ffn_gate_exps.weight
     27:     819200 |  5120,   160,     1,     1 | F32     | blk.1.ffn_gate_inp.weight
     28:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.1.ffn_gate_shexp.weight
     29:       5120 |  5120,     1,     1,     1 | F32     | blk.1.ffn_norm.weight
     30: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.1.ffn_up_exps.weight
     31:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.1.ffn_up_shexp.weight
     32:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.2.attn_kv_a_mqa.weight
     33:        512 |   512,     1,     1,     1 | F32     | blk.2.attn_kv_a_norm.weight
     34:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.2.attn_kv_b.weight
     35:       5120 |  5120,     1,     1,     1 | F32     | blk.2.attn_norm.weight
     36:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.2.attn_output.weight
     37:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.2.attn_q_a.weight
     38:       1536 |  1536,     1,     1,     1 | F32     | blk.2.attn_q_a_norm.weight
     39:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.2.attn_q_b.weight
     40: 1258291200 |  1536,  5120,   160,     1 | Q3_K    | blk.2.ffn_down_exps.weight
     41:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.2.ffn_down_shexp.weight
     42: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.2.ffn_gate_exps.weight
     43:     819200 |  5120,   160,     1,     1 | F32     | blk.2.ffn_gate_inp.weight
     44:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.2.ffn_gate_shexp.weight
     45:       5120 |  5120,     1,     1,     1 | F32     | blk.2.ffn_norm.weight
     46: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.2.ffn_up_exps.weight
     47:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.2.ffn_up_shexp.weight
     48:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.3.attn_kv_a_mqa.weight
     49:        512 |   512,     1,     1,     1 | F32     | blk.3.attn_kv_a_norm.weight
     50:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.3.attn_kv_b.weight
     51:       5120 |  5120,     1,     1,     1 | F32     | blk.3.attn_norm.weight
     52:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.3.attn_output.weight
     53:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.3.attn_q_a.weight
     54:       1536 |  1536,     1,     1,     1 | F32     | blk.3.attn_q_a_norm.weight
     55:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.3.attn_q_b.weight
     56: 1258291200 |  1536,  5120,   160,     1 | Q3_K    | blk.3.ffn_down_exps.weight
     57:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.3.ffn_down_shexp.weight
     58: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.3.ffn_gate_exps.weight
     59:     819200 |  5120,   160,     1,     1 | F32     | blk.3.ffn_gate_inp.weight
     60:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.3.ffn_gate_shexp.weight
     61:       5120 |  5120,     1,     1,     1 | F32     | blk.3.ffn_norm.weight
     62: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.3.ffn_up_exps.weight
     63:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.3.ffn_up_shexp.weight
     64:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.4.attn_kv_a_mqa.weight
     65:        512 |   512,     1,     1,     1 | F32     | blk.4.attn_kv_a_norm.weight
     66:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.4.attn_kv_b.weight
     67:       5120 |  5120,     1,     1,     1 | F32     | blk.4.attn_norm.weight
     68:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.4.attn_output.weight
     69:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.4.attn_q_a.weight
     70:       1536 |  1536,     1,     1,     1 | F32     | blk.4.attn_q_a_norm.weight
     71:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.4.attn_q_b.weight
     72: 1258291200 |  1536,  5120,   160,     1 | Q3_K    | blk.4.ffn_down_exps.weight
     73:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.4.ffn_down_shexp.weight
     74: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.4.ffn_gate_exps.weight
     75:     819200 |  5120,   160,     1,     1 | F32     | blk.4.ffn_gate_inp.weight
     76:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.4.ffn_gate_shexp.weight
     77:       5120 |  5120,     1,     1,     1 | F32     | blk.4.ffn_norm.weight
     78: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.4.ffn_up_exps.weight
     79:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.4.ffn_up_shexp.weight
     80:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.5.attn_kv_a_mqa.weight
     81:        512 |   512,     1,     1,     1 | F32     | blk.5.attn_kv_a_norm.weight
     82:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.5.attn_kv_b.weight
     83:       5120 |  5120,     1,     1,     1 | F32     | blk.5.attn_norm.weight
     84:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.5.attn_output.weight
     85:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.5.attn_q_a.weight
     86:       1536 |  1536,     1,     1,     1 | F32     | blk.5.attn_q_a_norm.weight
     87:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.5.attn_q_b.weight
     88: 1258291200 |  1536,  5120,   160,     1 | Q3_K    | blk.5.ffn_down_exps.weight
     89:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.5.ffn_down_shexp.weight
     90: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.5.ffn_gate_exps.weight
     91:     819200 |  5120,   160,     1,     1 | F32     | blk.5.ffn_gate_inp.weight
     92:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.5.ffn_gate_shexp.weight
     93:       5120 |  5120,     1,     1,     1 | F32     | blk.5.ffn_norm.weight
     94: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.5.ffn_up_exps.weight
     95:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.5.ffn_up_shexp.weight
     96:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.6.attn_kv_a_mqa.weight
     97:        512 |   512,     1,     1,     1 | F32     | blk.6.attn_kv_a_norm.weight
     98:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.6.attn_kv_b.weight
     99:       5120 |  5120,     1,     1,     1 | F32     | blk.6.attn_norm.weight
    100:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.6.attn_output.weight
    101:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.6.attn_q_a.weight
    102:       1536 |  1536,     1,     1,     1 | F32     | blk.6.attn_q_a_norm.weight
    103:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.6.attn_q_b.weight
    104: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.6.ffn_down_exps.weight
    105:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.6.ffn_down_shexp.weight
    106: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.6.ffn_gate_exps.weight
    107:     819200 |  5120,   160,     1,     1 | F32     | blk.6.ffn_gate_inp.weight
    108:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.6.ffn_gate_shexp.weight
    109:       5120 |  5120,     1,     1,     1 | F32     | blk.6.ffn_norm.weight
    110: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.6.ffn_up_exps.weight
    111:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.6.ffn_up_shexp.weight
    112:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.7.attn_kv_a_mqa.weight
    113:        512 |   512,     1,     1,     1 | F32     | blk.7.attn_kv_a_norm.weight
    114:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.7.attn_kv_b.weight
    115:       5120 |  5120,     1,     1,     1 | F32     | blk.7.attn_norm.weight
    116:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.7.attn_output.weight
    117:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.7.attn_q_a.weight
    118:       1536 |  1536,     1,     1,     1 | F32     | blk.7.attn_q_a_norm.weight
    119:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.7.attn_q_b.weight
    120: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.7.ffn_down_exps.weight
    121:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.7.ffn_down_shexp.weight
    122: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.7.ffn_gate_exps.weight
    123:     819200 |  5120,   160,     1,     1 | F32     | blk.7.ffn_gate_inp.weight
    124:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.7.ffn_gate_shexp.weight
    125:       5120 |  5120,     1,     1,     1 | F32     | blk.7.ffn_norm.weight
    126: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.7.ffn_up_exps.weight
    127:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.7.ffn_up_shexp.weight
    128:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.8.attn_kv_a_mqa.weight
    129:        512 |   512,     1,     1,     1 | F32     | blk.8.attn_kv_a_norm.weight
    130:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.8.attn_kv_b.weight
    131:       5120 |  5120,     1,     1,     1 | F32     | blk.8.attn_norm.weight
    132:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.8.attn_output.weight
    133:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.8.attn_q_a.weight
    134:       1536 |  1536,     1,     1,     1 | F32     | blk.8.attn_q_a_norm.weight
    135:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.8.attn_q_b.weight
    136: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.8.ffn_down_exps.weight
    137:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.8.ffn_down_shexp.weight
    138: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.8.ffn_gate_exps.weight
    139:     819200 |  5120,   160,     1,     1 | F32     | blk.8.ffn_gate_inp.weight
    140:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.8.ffn_gate_shexp.weight
    141:       5120 |  5120,     1,     1,     1 | F32     | blk.8.ffn_norm.weight
    142: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.8.ffn_up_exps.weight
    143:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.8.ffn_up_shexp.weight
    144:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.9.attn_kv_a_mqa.weight
    145:        512 |   512,     1,     1,     1 | F32     | blk.9.attn_kv_a_norm.weight
    146:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.9.attn_kv_b.weight
    147:       5120 |  5120,     1,     1,     1 | F32     | blk.9.attn_norm.weight
    148:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.9.attn_output.weight
    149:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.9.attn_q_a.weight
    150:       1536 |  1536,     1,     1,     1 | F32     | blk.9.attn_q_a_norm.weight
    151:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.9.attn_q_b.weight
    152: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.9.ffn_down_exps.weight
    153:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.9.ffn_down_shexp.weight
    154: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.9.ffn_gate_exps.weight
    155:     819200 |  5120,   160,     1,     1 | F32     | blk.9.ffn_gate_inp.weight
    156:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.9.ffn_gate_shexp.weight
    157:       5120 |  5120,     1,     1,     1 | F32     | blk.9.ffn_norm.weight
    158: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.9.ffn_up_exps.weight
    159:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.9.ffn_up_shexp.weight
    160:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.10.attn_kv_a_mqa.weight
    161:        512 |   512,     1,     1,     1 | F32     | blk.10.attn_kv_a_norm.weight
    162:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.10.attn_kv_b.weight
    163:       5120 |  5120,     1,     1,     1 | F32     | blk.10.attn_norm.weight
    164:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.10.attn_output.weight
    165:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.10.attn_q_a.weight
    166:       1536 |  1536,     1,     1,     1 | F32     | blk.10.attn_q_a_norm.weight
    167:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.10.attn_q_b.weight
    168: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.10.ffn_down_exps.weight
    169:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.10.ffn_down_shexp.weight
    170: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.10.ffn_gate_exps.weight
    171:     819200 |  5120,   160,     1,     1 | F32     | blk.10.ffn_gate_inp.weight
    172:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.10.ffn_gate_shexp.weight
    173:       5120 |  5120,     1,     1,     1 | F32     | blk.10.ffn_norm.weight
    174: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.10.ffn_up_exps.weight
    175:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.10.ffn_up_shexp.weight
    176:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.11.attn_kv_a_mqa.weight
    177:        512 |   512,     1,     1,     1 | F32     | blk.11.attn_kv_a_norm.weight
    178:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.11.attn_kv_b.weight
    179:       5120 |  5120,     1,     1,     1 | F32     | blk.11.attn_norm.weight
    180:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.11.attn_output.weight
    181:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.11.attn_q_a.weight
    182:       1536 |  1536,     1,     1,     1 | F32     | blk.11.attn_q_a_norm.weight
    183:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.11.attn_q_b.weight
    184: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.11.ffn_down_exps.weight
    185:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.11.ffn_down_shexp.weight
    186: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.11.ffn_gate_exps.weight
    187:     819200 |  5120,   160,     1,     1 | F32     | blk.11.ffn_gate_inp.weight
    188:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.11.ffn_gate_shexp.weight
    189:       5120 |  5120,     1,     1,     1 | F32     | blk.11.ffn_norm.weight
    190: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.11.ffn_up_exps.weight
    191:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.11.ffn_up_shexp.weight
    192:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.12.attn_kv_a_mqa.weight
    193:        512 |   512,     1,     1,     1 | F32     | blk.12.attn_kv_a_norm.weight
    194:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.12.attn_kv_b.weight
    195:       5120 |  5120,     1,     1,     1 | F32     | blk.12.attn_norm.weight
    196:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.12.attn_output.weight
    197:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.12.attn_q_a.weight
    198:       1536 |  1536,     1,     1,     1 | F32     | blk.12.attn_q_a_norm.weight
    199:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.12.attn_q_b.weight
    200: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.12.ffn_down_exps.weight
    201:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.12.ffn_down_shexp.weight
    202: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.12.ffn_gate_exps.weight
    203:     819200 |  5120,   160,     1,     1 | F32     | blk.12.ffn_gate_inp.weight
    204:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.12.ffn_gate_shexp.weight
    205:       5120 |  5120,     1,     1,     1 | F32     | blk.12.ffn_norm.weight
    206: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.12.ffn_up_exps.weight
    207:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.12.ffn_up_shexp.weight
    208:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.13.attn_kv_a_mqa.weight
    209:        512 |   512,     1,     1,     1 | F32     | blk.13.attn_kv_a_norm.weight
    210:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.13.attn_kv_b.weight
    211:       5120 |  5120,     1,     1,     1 | F32     | blk.13.attn_norm.weight
    212:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.13.attn_output.weight
    213:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.13.attn_q_a.weight
    214:       1536 |  1536,     1,     1,     1 | F32     | blk.13.attn_q_a_norm.weight
    215:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.13.attn_q_b.weight
    216: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.13.ffn_down_exps.weight
    217:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.13.ffn_down_shexp.weight
    218: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.13.ffn_gate_exps.weight
    219:     819200 |  5120,   160,     1,     1 | F32     | blk.13.ffn_gate_inp.weight
    220:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.13.ffn_gate_shexp.weight
    221:       5120 |  5120,     1,     1,     1 | F32     | blk.13.ffn_norm.weight
    222: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.13.ffn_up_exps.weight
    223:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.13.ffn_up_shexp.weight
    224:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.14.attn_kv_a_mqa.weight
    225:        512 |   512,     1,     1,     1 | F32     | blk.14.attn_kv_a_norm.weight
    226:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.14.attn_kv_b.weight
    227:       5120 |  5120,     1,     1,     1 | F32     | blk.14.attn_norm.weight
    228:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.14.attn_output.weight
    229:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.14.attn_q_a.weight
    230:       1536 |  1536,     1,     1,     1 | F32     | blk.14.attn_q_a_norm.weight
    231:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.14.attn_q_b.weight
    232: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.14.ffn_down_exps.weight
    233:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.14.ffn_down_shexp.weight
    234: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.14.ffn_gate_exps.weight
    235:     819200 |  5120,   160,     1,     1 | F32     | blk.14.ffn_gate_inp.weight
    236:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.14.ffn_gate_shexp.weight
    237:       5120 |  5120,     1,     1,     1 | F32     | blk.14.ffn_norm.weight
    238: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.14.ffn_up_exps.weight
    239:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.14.ffn_up_shexp.weight
    240:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.15.attn_kv_a_mqa.weight
    241:        512 |   512,     1,     1,     1 | F32     | blk.15.attn_kv_a_norm.weight
    242:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.15.attn_kv_b.weight
    243:       5120 |  5120,     1,     1,     1 | F32     | blk.15.attn_norm.weight
    244:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.15.attn_output.weight
    245:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.15.attn_q_a.weight
    246:       1536 |  1536,     1,     1,     1 | F32     | blk.15.attn_q_a_norm.weight
    247:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.15.attn_q_b.weight
    248: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.15.ffn_down_exps.weight
    249:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.15.ffn_down_shexp.weight
    250: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.15.ffn_gate_exps.weight
    251:     819200 |  5120,   160,     1,     1 | F32     | blk.15.ffn_gate_inp.weight
    252:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.15.ffn_gate_shexp.weight
    253:       5120 |  5120,     1,     1,     1 | F32     | blk.15.ffn_norm.weight
    254: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.15.ffn_up_exps.weight
    255:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.15.ffn_up_shexp.weight
    256:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.16.attn_kv_a_mqa.weight
    257:        512 |   512,     1,     1,     1 | F32     | blk.16.attn_kv_a_norm.weight
    258:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.16.attn_kv_b.weight
    259:       5120 |  5120,     1,     1,     1 | F32     | blk.16.attn_norm.weight
    260:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.16.attn_output.weight
    261:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.16.attn_q_a.weight
    262:       1536 |  1536,     1,     1,     1 | F32     | blk.16.attn_q_a_norm.weight
    263:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.16.attn_q_b.weight
    264: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.16.ffn_down_exps.weight
    265:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.16.ffn_down_shexp.weight
    266: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.16.ffn_gate_exps.weight
    267:     819200 |  5120,   160,     1,     1 | F32     | blk.16.ffn_gate_inp.weight
    268:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.16.ffn_gate_shexp.weight
    269:       5120 |  5120,     1,     1,     1 | F32     | blk.16.ffn_norm.weight
    270: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.16.ffn_up_exps.weight
    271:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.16.ffn_up_shexp.weight
    272:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.17.attn_kv_a_mqa.weight
    273:        512 |   512,     1,     1,     1 | F32     | blk.17.attn_kv_a_norm.weight
    274:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.17.attn_kv_b.weight
    275:       5120 |  5120,     1,     1,     1 | F32     | blk.17.attn_norm.weight
    276:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.17.attn_output.weight
    277:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.17.attn_q_a.weight
    278:       1536 |  1536,     1,     1,     1 | F32     | blk.17.attn_q_a_norm.weight
    279:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.17.attn_q_b.weight
    280: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.17.ffn_down_exps.weight
    281:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.17.ffn_down_shexp.weight
    282: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.17.ffn_gate_exps.weight
    283:     819200 |  5120,   160,     1,     1 | F32     | blk.17.ffn_gate_inp.weight
    284:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.17.ffn_gate_shexp.weight
    285:       5120 |  5120,     1,     1,     1 | F32     | blk.17.ffn_norm.weight
    286: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.17.ffn_up_exps.weight
    287:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.17.ffn_up_shexp.weight
    288:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.18.attn_kv_a_mqa.weight
    289:        512 |   512,     1,     1,     1 | F32     | blk.18.attn_kv_a_norm.weight
    290:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.18.attn_kv_b.weight
    291:       5120 |  5120,     1,     1,     1 | F32     | blk.18.attn_norm.weight
    292:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.18.attn_output.weight
    293:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.18.attn_q_a.weight
    294:       1536 |  1536,     1,     1,     1 | F32     | blk.18.attn_q_a_norm.weight
    295:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.18.attn_q_b.weight
    296: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.18.ffn_down_exps.weight
    297:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.18.ffn_down_shexp.weight
    298: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.18.ffn_gate_exps.weight
    299:     819200 |  5120,   160,     1,     1 | F32     | blk.18.ffn_gate_inp.weight
    300:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.18.ffn_gate_shexp.weight
    301:       5120 |  5120,     1,     1,     1 | F32     | blk.18.ffn_norm.weight
    302: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.18.ffn_up_exps.weight
    303:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.18.ffn_up_shexp.weight
    304:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.19.attn_kv_a_mqa.weight
    305:        512 |   512,     1,     1,     1 | F32     | blk.19.attn_kv_a_norm.weight
    306:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.19.attn_kv_b.weight
    307:       5120 |  5120,     1,     1,     1 | F32     | blk.19.attn_norm.weight
    308:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.19.attn_output.weight
    309:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.19.attn_q_a.weight
    310:       1536 |  1536,     1,     1,     1 | F32     | blk.19.attn_q_a_norm.weight
    311:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.19.attn_q_b.weight
    312: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.19.ffn_down_exps.weight
    313:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.19.ffn_down_shexp.weight
    314: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.19.ffn_gate_exps.weight
    315:     819200 |  5120,   160,     1,     1 | F32     | blk.19.ffn_gate_inp.weight
    316:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.19.ffn_gate_shexp.weight
    317:       5120 |  5120,     1,     1,     1 | F32     | blk.19.ffn_norm.weight
    318: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.19.ffn_up_exps.weight
    319:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.19.ffn_up_shexp.weight
    320:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.20.attn_kv_a_mqa.weight
    321:        512 |   512,     1,     1,     1 | F32     | blk.20.attn_kv_a_norm.weight
    322:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.20.attn_kv_b.weight
    323:       5120 |  5120,     1,     1,     1 | F32     | blk.20.attn_norm.weight
    324:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.20.attn_output.weight
    325:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.20.attn_q_a.weight
    326:       1536 |  1536,     1,     1,     1 | F32     | blk.20.attn_q_a_norm.weight
    327:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.20.attn_q_b.weight
    328: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.20.ffn_down_exps.weight
    329:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.20.ffn_down_shexp.weight
    330: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.20.ffn_gate_exps.weight
    331:     819200 |  5120,   160,     1,     1 | F32     | blk.20.ffn_gate_inp.weight
    332:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.20.ffn_gate_shexp.weight
    333:       5120 |  5120,     1,     1,     1 | F32     | blk.20.ffn_norm.weight
    334: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.20.ffn_up_exps.weight
    335:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.20.ffn_up_shexp.weight
    336:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.21.attn_kv_a_mqa.weight
    337:        512 |   512,     1,     1,     1 | F32     | blk.21.attn_kv_a_norm.weight
    338:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.21.attn_kv_b.weight
    339:       5120 |  5120,     1,     1,     1 | F32     | blk.21.attn_norm.weight
    340:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.21.attn_output.weight
    341:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.21.attn_q_a.weight
    342:       1536 |  1536,     1,     1,     1 | F32     | blk.21.attn_q_a_norm.weight
    343:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.21.attn_q_b.weight
    344: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.21.ffn_down_exps.weight
    345:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.21.ffn_down_shexp.weight
    346: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.21.ffn_gate_exps.weight
    347:     819200 |  5120,   160,     1,     1 | F32     | blk.21.ffn_gate_inp.weight
    348:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.21.ffn_gate_shexp.weight
    349:       5120 |  5120,     1,     1,     1 | F32     | blk.21.ffn_norm.weight
    350: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.21.ffn_up_exps.weight
    351:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.21.ffn_up_shexp.weight
    352:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.22.attn_kv_a_mqa.weight
    353:        512 |   512,     1,     1,     1 | F32     | blk.22.attn_kv_a_norm.weight
    354:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.22.attn_kv_b.weight
    355:       5120 |  5120,     1,     1,     1 | F32     | blk.22.attn_norm.weight
    356:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.22.attn_output.weight
    357:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.22.attn_q_a.weight
    358:       1536 |  1536,     1,     1,     1 | F32     | blk.22.attn_q_a_norm.weight
    359:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.22.attn_q_b.weight
    360: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.22.ffn_down_exps.weight
    361:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.22.ffn_down_shexp.weight
    362: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.22.ffn_gate_exps.weight
    363:     819200 |  5120,   160,     1,     1 | F32     | blk.22.ffn_gate_inp.weight
    364:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.22.ffn_gate_shexp.weight
    365:       5120 |  5120,     1,     1,     1 | F32     | blk.22.ffn_norm.weight
    366: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.22.ffn_up_exps.weight
    367:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.22.ffn_up_shexp.weight
    368:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.23.attn_kv_a_mqa.weight
    369:        512 |   512,     1,     1,     1 | F32     | blk.23.attn_kv_a_norm.weight
    370:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.23.attn_kv_b.weight
    371:       5120 |  5120,     1,     1,     1 | F32     | blk.23.attn_norm.weight
    372:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.23.attn_output.weight
    373:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.23.attn_q_a.weight
    374:       1536 |  1536,     1,     1,     1 | F32     | blk.23.attn_q_a_norm.weight
    375:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.23.attn_q_b.weight
    376: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.23.ffn_down_exps.weight
    377:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.23.ffn_down_shexp.weight
    378: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.23.ffn_gate_exps.weight
    379:     819200 |  5120,   160,     1,     1 | F32     | blk.23.ffn_gate_inp.weight
    380:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.23.ffn_gate_shexp.weight
    381:       5120 |  5120,     1,     1,     1 | F32     | blk.23.ffn_norm.weight
    382: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.23.ffn_up_exps.weight
    383:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.23.ffn_up_shexp.weight
    384:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.24.attn_kv_a_mqa.weight
    385:        512 |   512,     1,     1,     1 | F32     | blk.24.attn_kv_a_norm.weight
    386:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.24.attn_kv_b.weight
    387:       5120 |  5120,     1,     1,     1 | F32     | blk.24.attn_norm.weight
    388:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.24.attn_output.weight
    389:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.24.attn_q_a.weight
    390:       1536 |  1536,     1,     1,     1 | F32     | blk.24.attn_q_a_norm.weight
    391:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.24.attn_q_b.weight
    392: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.24.ffn_down_exps.weight
    393:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.24.ffn_down_shexp.weight
    394: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.24.ffn_gate_exps.weight
    395:     819200 |  5120,   160,     1,     1 | F32     | blk.24.ffn_gate_inp.weight
    396:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.24.ffn_gate_shexp.weight
    397:       5120 |  5120,     1,     1,     1 | F32     | blk.24.ffn_norm.weight
    398: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.24.ffn_up_exps.weight
    399:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.24.ffn_up_shexp.weight
    400:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.25.attn_kv_a_mqa.weight
    401:        512 |   512,     1,     1,     1 | F32     | blk.25.attn_kv_a_norm.weight
    402:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.25.attn_kv_b.weight
    403:       5120 |  5120,     1,     1,     1 | F32     | blk.25.attn_norm.weight
    404:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.25.attn_output.weight
    405:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.25.attn_q_a.weight
    406:       1536 |  1536,     1,     1,     1 | F32     | blk.25.attn_q_a_norm.weight
    407:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.25.attn_q_b.weight
    408: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.25.ffn_down_exps.weight
    409:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.25.ffn_down_shexp.weight
    410: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.25.ffn_gate_exps.weight
    411:     819200 |  5120,   160,     1,     1 | F32     | blk.25.ffn_gate_inp.weight
    412:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.25.ffn_gate_shexp.weight
    413:       5120 |  5120,     1,     1,     1 | F32     | blk.25.ffn_norm.weight
    414: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.25.ffn_up_exps.weight
    415:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.25.ffn_up_shexp.weight
    416:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.26.attn_kv_a_mqa.weight
    417:        512 |   512,     1,     1,     1 | F32     | blk.26.attn_kv_a_norm.weight
    418:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.26.attn_kv_b.weight
    419:       5120 |  5120,     1,     1,     1 | F32     | blk.26.attn_norm.weight
    420:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.26.attn_output.weight
    421:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.26.attn_q_a.weight
    422:       1536 |  1536,     1,     1,     1 | F32     | blk.26.attn_q_a_norm.weight
    423:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.26.attn_q_b.weight
    424: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.26.ffn_down_exps.weight
    425:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.26.ffn_down_shexp.weight
    426: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.26.ffn_gate_exps.weight
    427:     819200 |  5120,   160,     1,     1 | F32     | blk.26.ffn_gate_inp.weight
    428:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.26.ffn_gate_shexp.weight
    429:       5120 |  5120,     1,     1,     1 | F32     | blk.26.ffn_norm.weight
    430: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.26.ffn_up_exps.weight
    431:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.26.ffn_up_shexp.weight
    432:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.27.attn_kv_a_mqa.weight
    433:        512 |   512,     1,     1,     1 | F32     | blk.27.attn_kv_a_norm.weight
    434:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.27.attn_kv_b.weight
    435:       5120 |  5120,     1,     1,     1 | F32     | blk.27.attn_norm.weight
    436:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.27.attn_output.weight
    437:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.27.attn_q_a.weight
    438:       1536 |  1536,     1,     1,     1 | F32     | blk.27.attn_q_a_norm.weight
    439:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.27.attn_q_b.weight
    440: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.27.ffn_down_exps.weight
    441:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.27.ffn_down_shexp.weight
    442: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.27.ffn_gate_exps.weight
    443:     819200 |  5120,   160,     1,     1 | F32     | blk.27.ffn_gate_inp.weight
    444:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.27.ffn_gate_shexp.weight
    445:       5120 |  5120,     1,     1,     1 | F32     | blk.27.ffn_norm.weight
    446: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.27.ffn_up_exps.weight
    447:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.27.ffn_up_shexp.weight
    448:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.28.attn_kv_a_mqa.weight
    449:        512 |   512,     1,     1,     1 | F32     | blk.28.attn_kv_a_norm.weight
    450:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.28.attn_kv_b.weight
    451:       5120 |  5120,     1,     1,     1 | F32     | blk.28.attn_norm.weight
    452:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.28.attn_output.weight
    453:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.28.attn_q_a.weight
    454:       1536 |  1536,     1,     1,     1 | F32     | blk.28.attn_q_a_norm.weight
    455:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.28.attn_q_b.weight
    456: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.28.ffn_down_exps.weight
    457:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.28.ffn_down_shexp.weight
    458: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.28.ffn_gate_exps.weight
    459:     819200 |  5120,   160,     1,     1 | F32     | blk.28.ffn_gate_inp.weight
    460:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.28.ffn_gate_shexp.weight
    461:       5120 |  5120,     1,     1,     1 | F32     | blk.28.ffn_norm.weight
    462: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.28.ffn_up_exps.weight
    463:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.28.ffn_up_shexp.weight
    464:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.29.attn_kv_a_mqa.weight
    465:        512 |   512,     1,     1,     1 | F32     | blk.29.attn_kv_a_norm.weight
    466:   16777216 |   512, 32768,     1,     1 | Q6_K    | blk.29.attn_kv_b.weight
    467:       5120 |  5120,     1,     1,     1 | F32     | blk.29.attn_norm.weight
    468:   83886080 | 16384,  5120,     1,     1 | Q4_K    | blk.29.attn_output.weight
    469:    7864320 |  5120,  1536,     1,     1 | Q4_K    | blk.29.attn_q_a.weight
    470:       1536 |  1536,     1,     1,     1 | F32     | blk.29.attn_q_a_norm.weight
    471:   37748736 |  1536, 24576,     1,     1 | Q4_K    | blk.29.attn_q_b.weight
    472: 1258291200 |  1536,  5120,   160,     1 | Q2_K    | blk.29.ffn_down_exps.weight
    473:   15728640 |  3072,  5120,     1,     1 | Q6_K    | blk.29.ffn_down_shexp.weight
    474: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.29.ffn_gate_exps.weight
    475:     819200 |  5120,   160,     1,     1 | F32     | blk.29.ffn_gate_inp.weight
    476:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.29.ffn_gate_shexp.weight
    477:       5120 |  5120,     1,     1,     1 | F32     | blk.29.ffn_norm.weight
    478: 1258291200 |  5120,  1536,   160,     1 | IQ2_XS  | blk.29.ffn_up_exps.weight
    479:   15728640 |  5120,  3072,     1,     1 | Q5_K    | blk.29.ffn_up_shexp.weight
    480:    2949120 |  5120,   576,     1,     1 | Q6_K    | blk.30.attn_kv_a_mqa.weight