|
INFO:gguf-dump:* Loading: DeepSeek-v2.5-1210-UD-iq1_m-00001-of-00002.gguf |
|
* File is LITTLE endian, script is running on a LITTLE endian host. |
|
* Dumping 56 key/value pair(s) |
|
1: UINT32 | 1 | GGUF.version = 3 |
|
2: UINT64 | 1 | GGUF.tensor_count = 480 |
|
3: UINT64 | 1 | GGUF.kv_count = 53 |
|
4: STRING | 1 | general.architecture = 'deepseek2' |
|
5: STRING | 1 | general.type = 'model' |
|
6: STRING | 1 | general.name = 'Dsv25' |
|
7: STRING | 1 | general.size_label = '160x14B' |
|
8: STRING | 1 | general.license = 'other' |
|
9: STRING | 1 | general.license.name = 'deepseek' |
|
10: STRING | 1 | general.license.link = 'https://github.com/deepseek-ai/DeepSeek-V2/blob/main/LICENSE' |
|
11: UINT32 | 1 | deepseek2.block_count = 60 |
|
12: UINT32 | 1 | deepseek2.context_length = 163840 |
|
13: UINT32 | 1 | deepseek2.embedding_length = 5120 |
|
14: UINT32 | 1 | deepseek2.feed_forward_length = 12288 |
|
15: UINT32 | 1 | deepseek2.attention.head_count = 128 |
|
16: UINT32 | 1 | deepseek2.attention.head_count_kv = 128 |
|
17: FLOAT32 | 1 | deepseek2.rope.freq_base = 10000.0 |
|
18: FLOAT32 | 1 | deepseek2.attention.layer_norm_rms_epsilon = 9.999999974752427e-07 |
|
19: UINT32 | 1 | deepseek2.expert_used_count = 6 |
|
20: UINT32 | 1 | deepseek2.leading_dense_block_count = 1 |
|
21: UINT32 | 1 | deepseek2.vocab_size = 102400 |
|
22: UINT32 | 1 | deepseek2.attention.q_lora_rank = 1536 |
|
23: UINT32 | 1 | deepseek2.attention.kv_lora_rank = 512 |
|
24: UINT32 | 1 | deepseek2.attention.key_length = 192 |
|
25: UINT32 | 1 | deepseek2.attention.value_length = 128 |
|
26: UINT32 | 1 | deepseek2.expert_feed_forward_length = 1536 |
|
27: UINT32 | 1 | deepseek2.expert_count = 160 |
|
28: UINT32 | 1 | deepseek2.expert_shared_count = 2 |
|
29: FLOAT32 | 1 | deepseek2.expert_weights_scale = 16.0 |
|
30: BOOL | 1 | deepseek2.expert_weights_norm = False |
|
31: UINT32 | 1 | deepseek2.expert_gating_func = 1 |
|
32: UINT32 | 1 | deepseek2.rope.dimension_count = 64 |
|
33: STRING | 1 | deepseek2.rope.scaling.type = 'yarn' |
|
34: FLOAT32 | 1 | deepseek2.rope.scaling.factor = 40.0 |
|
35: UINT32 | 1 | deepseek2.rope.scaling.original_context_length = 4096 |
|
36: FLOAT32 | 1 | deepseek2.rope.scaling.yarn_log_multiplier = 0.10000000149011612 |
|
37: STRING | 1 | tokenizer.ggml.model = 'gpt2' |
|
38: STRING | 1 | tokenizer.ggml.pre = 'deepseek-llm' |
|
39: [STRING] | 102400 | tokenizer.ggml.tokens |
|
40: [INT32] | 102400 | tokenizer.ggml.token_type |
|
41: [STRING] | 99757 | tokenizer.ggml.merges |
|
42: UINT32 | 1 | tokenizer.ggml.bos_token_id = 100000 |
|
43: UINT32 | 1 | tokenizer.ggml.eos_token_id = 100001 |
|
44: UINT32 | 1 | tokenizer.ggml.padding_token_id = 100001 |
|
45: BOOL | 1 | tokenizer.ggml.add_bos_token = True |
|
46: BOOL | 1 | tokenizer.ggml.add_eos_token = False |
|
47: STRING | 1 | tokenizer.chat_template = '{% if not add_generation_prompt is defined %}{% set add_gene' |
|
48: UINT32 | 1 | general.quantization_version = 2 |
|
49: UINT32 | 1 | general.file_type = 31 |
|
50: STRING | 1 | quantize.imatrix.file = '/archive/nuc/LLM/raw/imatrix-DeepSeek-V2.5-1210-bartowski.da' |
|
51: STRING | 1 | quantize.imatrix.dataset = '/training_dir/calibration_datav3.txt' |
|
52: INT32 | 1 | quantize.imatrix.entries_count = 716 |
|
53: INT32 | 1 | quantize.imatrix.chunks_count = 139 |
|
54: UINT16 | 1 | split.no = 0 |
|
55: INT32 | 1 | split.tensors.count = 959 |
|
56: UINT16 | 1 | split.count = 2 |
|
* Dumping 480 tensor(s) |
|
1: 524288000 | 5120, 102400, 1, 1 | Q6_K | output.weight |
|
2: 5120 | 5120, 1, 1, 1 | F32 | output_norm.weight |
|
3: 524288000 | 5120, 102400, 1, 1 | Q6_K | token_embd.weight |
|
4: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.0.attn_kv_a_mqa.weight |
|
5: 512 | 512, 1, 1, 1 | F32 | blk.0.attn_kv_a_norm.weight |
|
6: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.0.attn_kv_b.weight |
|
7: 5120 | 5120, 1, 1, 1 | F32 | blk.0.attn_norm.weight |
|
8: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.0.attn_output.weight |
|
9: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.0.attn_q_a.weight |
|
10: 1536 | 1536, 1, 1, 1 | F32 | blk.0.attn_q_a_norm.weight |
|
11: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.0.attn_q_b.weight |
|
12: 62914560 | 12288, 5120, 1, 1 | Q6_K | blk.0.ffn_down.weight |
|
13: 62914560 | 5120, 12288, 1, 1 | Q4_K | blk.0.ffn_gate.weight |
|
14: 5120 | 5120, 1, 1, 1 | F32 | blk.0.ffn_norm.weight |
|
15: 62914560 | 5120, 12288, 1, 1 | Q4_K | blk.0.ffn_up.weight |
|
16: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.1.attn_kv_a_mqa.weight |
|
17: 512 | 512, 1, 1, 1 | F32 | blk.1.attn_kv_a_norm.weight |
|
18: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.1.attn_kv_b.weight |
|
19: 5120 | 5120, 1, 1, 1 | F32 | blk.1.attn_norm.weight |
|
20: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.1.attn_output.weight |
|
21: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.1.attn_q_a.weight |
|
22: 1536 | 1536, 1, 1, 1 | F32 | blk.1.attn_q_a_norm.weight |
|
23: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.1.attn_q_b.weight |
|
24: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.1.ffn_down_exps.weight |
|
25: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.1.ffn_down_shexp.weight |
|
26: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.1.ffn_gate_exps.weight |
|
27: 819200 | 5120, 160, 1, 1 | F32 | blk.1.ffn_gate_inp.weight |
|
28: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.1.ffn_gate_shexp.weight |
|
29: 5120 | 5120, 1, 1, 1 | F32 | blk.1.ffn_norm.weight |
|
30: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.1.ffn_up_exps.weight |
|
31: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.1.ffn_up_shexp.weight |
|
32: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.2.attn_kv_a_mqa.weight |
|
33: 512 | 512, 1, 1, 1 | F32 | blk.2.attn_kv_a_norm.weight |
|
34: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.2.attn_kv_b.weight |
|
35: 5120 | 5120, 1, 1, 1 | F32 | blk.2.attn_norm.weight |
|
36: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.2.attn_output.weight |
|
37: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.2.attn_q_a.weight |
|
38: 1536 | 1536, 1, 1, 1 | F32 | blk.2.attn_q_a_norm.weight |
|
39: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.2.attn_q_b.weight |
|
40: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.2.ffn_down_exps.weight |
|
41: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.2.ffn_down_shexp.weight |
|
42: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.2.ffn_gate_exps.weight |
|
43: 819200 | 5120, 160, 1, 1 | F32 | blk.2.ffn_gate_inp.weight |
|
44: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.2.ffn_gate_shexp.weight |
|
45: 5120 | 5120, 1, 1, 1 | F32 | blk.2.ffn_norm.weight |
|
46: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.2.ffn_up_exps.weight |
|
47: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.2.ffn_up_shexp.weight |
|
48: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.3.attn_kv_a_mqa.weight |
|
49: 512 | 512, 1, 1, 1 | F32 | blk.3.attn_kv_a_norm.weight |
|
50: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.3.attn_kv_b.weight |
|
51: 5120 | 5120, 1, 1, 1 | F32 | blk.3.attn_norm.weight |
|
52: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.3.attn_output.weight |
|
53: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.3.attn_q_a.weight |
|
54: 1536 | 1536, 1, 1, 1 | F32 | blk.3.attn_q_a_norm.weight |
|
55: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.3.attn_q_b.weight |
|
56: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.3.ffn_down_exps.weight |
|
57: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.3.ffn_down_shexp.weight |
|
58: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.3.ffn_gate_exps.weight |
|
59: 819200 | 5120, 160, 1, 1 | F32 | blk.3.ffn_gate_inp.weight |
|
60: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.3.ffn_gate_shexp.weight |
|
61: 5120 | 5120, 1, 1, 1 | F32 | blk.3.ffn_norm.weight |
|
62: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.3.ffn_up_exps.weight |
|
63: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.3.ffn_up_shexp.weight |
|
64: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.4.attn_kv_a_mqa.weight |
|
65: 512 | 512, 1, 1, 1 | F32 | blk.4.attn_kv_a_norm.weight |
|
66: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.4.attn_kv_b.weight |
|
67: 5120 | 5120, 1, 1, 1 | F32 | blk.4.attn_norm.weight |
|
68: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.4.attn_output.weight |
|
69: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.4.attn_q_a.weight |
|
70: 1536 | 1536, 1, 1, 1 | F32 | blk.4.attn_q_a_norm.weight |
|
71: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.4.attn_q_b.weight |
|
72: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.4.ffn_down_exps.weight |
|
73: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.4.ffn_down_shexp.weight |
|
74: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.4.ffn_gate_exps.weight |
|
75: 819200 | 5120, 160, 1, 1 | F32 | blk.4.ffn_gate_inp.weight |
|
76: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.4.ffn_gate_shexp.weight |
|
77: 5120 | 5120, 1, 1, 1 | F32 | blk.4.ffn_norm.weight |
|
78: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.4.ffn_up_exps.weight |
|
79: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.4.ffn_up_shexp.weight |
|
80: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.5.attn_kv_a_mqa.weight |
|
81: 512 | 512, 1, 1, 1 | F32 | blk.5.attn_kv_a_norm.weight |
|
82: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.5.attn_kv_b.weight |
|
83: 5120 | 5120, 1, 1, 1 | F32 | blk.5.attn_norm.weight |
|
84: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.5.attn_output.weight |
|
85: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.5.attn_q_a.weight |
|
86: 1536 | 1536, 1, 1, 1 | F32 | blk.5.attn_q_a_norm.weight |
|
87: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.5.attn_q_b.weight |
|
88: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.5.ffn_down_exps.weight |
|
89: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.5.ffn_down_shexp.weight |
|
90: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.5.ffn_gate_exps.weight |
|
91: 819200 | 5120, 160, 1, 1 | F32 | blk.5.ffn_gate_inp.weight |
|
92: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.5.ffn_gate_shexp.weight |
|
93: 5120 | 5120, 1, 1, 1 | F32 | blk.5.ffn_norm.weight |
|
94: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.5.ffn_up_exps.weight |
|
95: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.5.ffn_up_shexp.weight |
|
96: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.6.attn_kv_a_mqa.weight |
|
97: 512 | 512, 1, 1, 1 | F32 | blk.6.attn_kv_a_norm.weight |
|
98: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.6.attn_kv_b.weight |
|
99: 5120 | 5120, 1, 1, 1 | F32 | blk.6.attn_norm.weight |
|
100: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.6.attn_output.weight |
|
101: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.6.attn_q_a.weight |
|
102: 1536 | 1536, 1, 1, 1 | F32 | blk.6.attn_q_a_norm.weight |
|
103: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.6.attn_q_b.weight |
|
104: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.6.ffn_down_exps.weight |
|
105: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.6.ffn_down_shexp.weight |
|
106: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.6.ffn_gate_exps.weight |
|
107: 819200 | 5120, 160, 1, 1 | F32 | blk.6.ffn_gate_inp.weight |
|
108: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.6.ffn_gate_shexp.weight |
|
109: 5120 | 5120, 1, 1, 1 | F32 | blk.6.ffn_norm.weight |
|
110: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.6.ffn_up_exps.weight |
|
111: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.6.ffn_up_shexp.weight |
|
112: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.7.attn_kv_a_mqa.weight |
|
113: 512 | 512, 1, 1, 1 | F32 | blk.7.attn_kv_a_norm.weight |
|
114: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.7.attn_kv_b.weight |
|
115: 5120 | 5120, 1, 1, 1 | F32 | blk.7.attn_norm.weight |
|
116: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.7.attn_output.weight |
|
117: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.7.attn_q_a.weight |
|
118: 1536 | 1536, 1, 1, 1 | F32 | blk.7.attn_q_a_norm.weight |
|
119: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.7.attn_q_b.weight |
|
120: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.7.ffn_down_exps.weight |
|
121: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.7.ffn_down_shexp.weight |
|
122: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.7.ffn_gate_exps.weight |
|
123: 819200 | 5120, 160, 1, 1 | F32 | blk.7.ffn_gate_inp.weight |
|
124: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.7.ffn_gate_shexp.weight |
|
125: 5120 | 5120, 1, 1, 1 | F32 | blk.7.ffn_norm.weight |
|
126: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.7.ffn_up_exps.weight |
|
127: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.7.ffn_up_shexp.weight |
|
128: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.8.attn_kv_a_mqa.weight |
|
129: 512 | 512, 1, 1, 1 | F32 | blk.8.attn_kv_a_norm.weight |
|
130: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.8.attn_kv_b.weight |
|
131: 5120 | 5120, 1, 1, 1 | F32 | blk.8.attn_norm.weight |
|
132: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.8.attn_output.weight |
|
133: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.8.attn_q_a.weight |
|
134: 1536 | 1536, 1, 1, 1 | F32 | blk.8.attn_q_a_norm.weight |
|
135: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.8.attn_q_b.weight |
|
136: 1258291200 | 1536, 5120, 160, 1 | IQ2_XXS | blk.8.ffn_down_exps.weight |
|
137: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.8.ffn_down_shexp.weight |
|
138: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.8.ffn_gate_exps.weight |
|
139: 819200 | 5120, 160, 1, 1 | F32 | blk.8.ffn_gate_inp.weight |
|
140: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.8.ffn_gate_shexp.weight |
|
141: 5120 | 5120, 1, 1, 1 | F32 | blk.8.ffn_norm.weight |
|
142: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.8.ffn_up_exps.weight |
|
143: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.8.ffn_up_shexp.weight |
|
144: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.9.attn_kv_a_mqa.weight |
|
145: 512 | 512, 1, 1, 1 | F32 | blk.9.attn_kv_a_norm.weight |
|
146: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.9.attn_kv_b.weight |
|
147: 5120 | 5120, 1, 1, 1 | F32 | blk.9.attn_norm.weight |
|
148: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.9.attn_output.weight |
|
149: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.9.attn_q_a.weight |
|
150: 1536 | 1536, 1, 1, 1 | F32 | blk.9.attn_q_a_norm.weight |
|
151: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.9.attn_q_b.weight |
|
152: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.9.ffn_down_exps.weight |
|
153: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.9.ffn_down_shexp.weight |
|
154: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.9.ffn_gate_exps.weight |
|
155: 819200 | 5120, 160, 1, 1 | F32 | blk.9.ffn_gate_inp.weight |
|
156: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.9.ffn_gate_shexp.weight |
|
157: 5120 | 5120, 1, 1, 1 | F32 | blk.9.ffn_norm.weight |
|
158: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.9.ffn_up_exps.weight |
|
159: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.9.ffn_up_shexp.weight |
|
160: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.10.attn_kv_a_mqa.weight |
|
161: 512 | 512, 1, 1, 1 | F32 | blk.10.attn_kv_a_norm.weight |
|
162: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.10.attn_kv_b.weight |
|
163: 5120 | 5120, 1, 1, 1 | F32 | blk.10.attn_norm.weight |
|
164: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.10.attn_output.weight |
|
165: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.10.attn_q_a.weight |
|
166: 1536 | 1536, 1, 1, 1 | F32 | blk.10.attn_q_a_norm.weight |
|
167: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.10.attn_q_b.weight |
|
168: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.10.ffn_down_exps.weight |
|
169: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.10.ffn_down_shexp.weight |
|
170: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.10.ffn_gate_exps.weight |
|
171: 819200 | 5120, 160, 1, 1 | F32 | blk.10.ffn_gate_inp.weight |
|
172: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.10.ffn_gate_shexp.weight |
|
173: 5120 | 5120, 1, 1, 1 | F32 | blk.10.ffn_norm.weight |
|
174: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.10.ffn_up_exps.weight |
|
175: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.10.ffn_up_shexp.weight |
|
176: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.11.attn_kv_a_mqa.weight |
|
177: 512 | 512, 1, 1, 1 | F32 | blk.11.attn_kv_a_norm.weight |
|
178: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.11.attn_kv_b.weight |
|
179: 5120 | 5120, 1, 1, 1 | F32 | blk.11.attn_norm.weight |
|
180: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.11.attn_output.weight |
|
181: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.11.attn_q_a.weight |
|
182: 1536 | 1536, 1, 1, 1 | F32 | blk.11.attn_q_a_norm.weight |
|
183: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.11.attn_q_b.weight |
|
184: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.11.ffn_down_exps.weight |
|
185: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.11.ffn_down_shexp.weight |
|
186: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.11.ffn_gate_exps.weight |
|
187: 819200 | 5120, 160, 1, 1 | F32 | blk.11.ffn_gate_inp.weight |
|
188: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.11.ffn_gate_shexp.weight |
|
189: 5120 | 5120, 1, 1, 1 | F32 | blk.11.ffn_norm.weight |
|
190: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.11.ffn_up_exps.weight |
|
191: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.11.ffn_up_shexp.weight |
|
192: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.12.attn_kv_a_mqa.weight |
|
193: 512 | 512, 1, 1, 1 | F32 | blk.12.attn_kv_a_norm.weight |
|
194: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.12.attn_kv_b.weight |
|
195: 5120 | 5120, 1, 1, 1 | F32 | blk.12.attn_norm.weight |
|
196: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.12.attn_output.weight |
|
197: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.12.attn_q_a.weight |
|
198: 1536 | 1536, 1, 1, 1 | F32 | blk.12.attn_q_a_norm.weight |
|
199: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.12.attn_q_b.weight |
|
200: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.12.ffn_down_exps.weight |
|
201: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.12.ffn_down_shexp.weight |
|
202: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.12.ffn_gate_exps.weight |
|
203: 819200 | 5120, 160, 1, 1 | F32 | blk.12.ffn_gate_inp.weight |
|
204: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.12.ffn_gate_shexp.weight |
|
205: 5120 | 5120, 1, 1, 1 | F32 | blk.12.ffn_norm.weight |
|
206: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.12.ffn_up_exps.weight |
|
207: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.12.ffn_up_shexp.weight |
|
208: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.13.attn_kv_a_mqa.weight |
|
209: 512 | 512, 1, 1, 1 | F32 | blk.13.attn_kv_a_norm.weight |
|
210: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.13.attn_kv_b.weight |
|
211: 5120 | 5120, 1, 1, 1 | F32 | blk.13.attn_norm.weight |
|
212: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.13.attn_output.weight |
|
213: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.13.attn_q_a.weight |
|
214: 1536 | 1536, 1, 1, 1 | F32 | blk.13.attn_q_a_norm.weight |
|
215: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.13.attn_q_b.weight |
|
216: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.13.ffn_down_exps.weight |
|
217: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.13.ffn_down_shexp.weight |
|
218: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.13.ffn_gate_exps.weight |
|
219: 819200 | 5120, 160, 1, 1 | F32 | blk.13.ffn_gate_inp.weight |
|
220: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.13.ffn_gate_shexp.weight |
|
221: 5120 | 5120, 1, 1, 1 | F32 | blk.13.ffn_norm.weight |
|
222: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.13.ffn_up_exps.weight |
|
223: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.13.ffn_up_shexp.weight |
|
224: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.14.attn_kv_a_mqa.weight |
|
225: 512 | 512, 1, 1, 1 | F32 | blk.14.attn_kv_a_norm.weight |
|
226: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.14.attn_kv_b.weight |
|
227: 5120 | 5120, 1, 1, 1 | F32 | blk.14.attn_norm.weight |
|
228: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.14.attn_output.weight |
|
229: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.14.attn_q_a.weight |
|
230: 1536 | 1536, 1, 1, 1 | F32 | blk.14.attn_q_a_norm.weight |
|
231: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.14.attn_q_b.weight |
|
232: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.14.ffn_down_exps.weight |
|
233: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.14.ffn_down_shexp.weight |
|
234: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.14.ffn_gate_exps.weight |
|
235: 819200 | 5120, 160, 1, 1 | F32 | blk.14.ffn_gate_inp.weight |
|
236: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.14.ffn_gate_shexp.weight |
|
237: 5120 | 5120, 1, 1, 1 | F32 | blk.14.ffn_norm.weight |
|
238: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.14.ffn_up_exps.weight |
|
239: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.14.ffn_up_shexp.weight |
|
240: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.15.attn_kv_a_mqa.weight |
|
241: 512 | 512, 1, 1, 1 | F32 | blk.15.attn_kv_a_norm.weight |
|
242: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.15.attn_kv_b.weight |
|
243: 5120 | 5120, 1, 1, 1 | F32 | blk.15.attn_norm.weight |
|
244: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.15.attn_output.weight |
|
245: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.15.attn_q_a.weight |
|
246: 1536 | 1536, 1, 1, 1 | F32 | blk.15.attn_q_a_norm.weight |
|
247: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.15.attn_q_b.weight |
|
248: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.15.ffn_down_exps.weight |
|
249: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.15.ffn_down_shexp.weight |
|
250: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.15.ffn_gate_exps.weight |
|
251: 819200 | 5120, 160, 1, 1 | F32 | blk.15.ffn_gate_inp.weight |
|
252: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.15.ffn_gate_shexp.weight |
|
253: 5120 | 5120, 1, 1, 1 | F32 | blk.15.ffn_norm.weight |
|
254: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.15.ffn_up_exps.weight |
|
255: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.15.ffn_up_shexp.weight |
|
256: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.16.attn_kv_a_mqa.weight |
|
257: 512 | 512, 1, 1, 1 | F32 | blk.16.attn_kv_a_norm.weight |
|
258: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.16.attn_kv_b.weight |
|
259: 5120 | 5120, 1, 1, 1 | F32 | blk.16.attn_norm.weight |
|
260: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.16.attn_output.weight |
|
261: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.16.attn_q_a.weight |
|
262: 1536 | 1536, 1, 1, 1 | F32 | blk.16.attn_q_a_norm.weight |
|
263: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.16.attn_q_b.weight |
|
264: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.16.ffn_down_exps.weight |
|
265: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.16.ffn_down_shexp.weight |
|
266: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.16.ffn_gate_exps.weight |
|
267: 819200 | 5120, 160, 1, 1 | F32 | blk.16.ffn_gate_inp.weight |
|
268: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.16.ffn_gate_shexp.weight |
|
269: 5120 | 5120, 1, 1, 1 | F32 | blk.16.ffn_norm.weight |
|
270: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.16.ffn_up_exps.weight |
|
271: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.16.ffn_up_shexp.weight |
|
272: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.17.attn_kv_a_mqa.weight |
|
273: 512 | 512, 1, 1, 1 | F32 | blk.17.attn_kv_a_norm.weight |
|
274: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.17.attn_kv_b.weight |
|
275: 5120 | 5120, 1, 1, 1 | F32 | blk.17.attn_norm.weight |
|
276: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.17.attn_output.weight |
|
277: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.17.attn_q_a.weight |
|
278: 1536 | 1536, 1, 1, 1 | F32 | blk.17.attn_q_a_norm.weight |
|
279: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.17.attn_q_b.weight |
|
280: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.17.ffn_down_exps.weight |
|
281: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.17.ffn_down_shexp.weight |
|
282: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.17.ffn_gate_exps.weight |
|
283: 819200 | 5120, 160, 1, 1 | F32 | blk.17.ffn_gate_inp.weight |
|
284: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.17.ffn_gate_shexp.weight |
|
285: 5120 | 5120, 1, 1, 1 | F32 | blk.17.ffn_norm.weight |
|
286: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.17.ffn_up_exps.weight |
|
287: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.17.ffn_up_shexp.weight |
|
288: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.18.attn_kv_a_mqa.weight |
|
289: 512 | 512, 1, 1, 1 | F32 | blk.18.attn_kv_a_norm.weight |
|
290: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.18.attn_kv_b.weight |
|
291: 5120 | 5120, 1, 1, 1 | F32 | blk.18.attn_norm.weight |
|
292: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.18.attn_output.weight |
|
293: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.18.attn_q_a.weight |
|
294: 1536 | 1536, 1, 1, 1 | F32 | blk.18.attn_q_a_norm.weight |
|
295: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.18.attn_q_b.weight |
|
296: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.18.ffn_down_exps.weight |
|
297: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.18.ffn_down_shexp.weight |
|
298: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.18.ffn_gate_exps.weight |
|
299: 819200 | 5120, 160, 1, 1 | F32 | blk.18.ffn_gate_inp.weight |
|
300: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.18.ffn_gate_shexp.weight |
|
301: 5120 | 5120, 1, 1, 1 | F32 | blk.18.ffn_norm.weight |
|
302: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.18.ffn_up_exps.weight |
|
303: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.18.ffn_up_shexp.weight |
|
304: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.19.attn_kv_a_mqa.weight |
|
305: 512 | 512, 1, 1, 1 | F32 | blk.19.attn_kv_a_norm.weight |
|
306: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.19.attn_kv_b.weight |
|
307: 5120 | 5120, 1, 1, 1 | F32 | blk.19.attn_norm.weight |
|
308: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.19.attn_output.weight |
|
309: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.19.attn_q_a.weight |
|
310: 1536 | 1536, 1, 1, 1 | F32 | blk.19.attn_q_a_norm.weight |
|
311: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.19.attn_q_b.weight |
|
312: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.19.ffn_down_exps.weight |
|
313: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.19.ffn_down_shexp.weight |
|
314: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.19.ffn_gate_exps.weight |
|
315: 819200 | 5120, 160, 1, 1 | F32 | blk.19.ffn_gate_inp.weight |
|
316: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.19.ffn_gate_shexp.weight |
|
317: 5120 | 5120, 1, 1, 1 | F32 | blk.19.ffn_norm.weight |
|
318: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.19.ffn_up_exps.weight |
|
319: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.19.ffn_up_shexp.weight |
|
320: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.20.attn_kv_a_mqa.weight |
|
321: 512 | 512, 1, 1, 1 | F32 | blk.20.attn_kv_a_norm.weight |
|
322: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.20.attn_kv_b.weight |
|
323: 5120 | 5120, 1, 1, 1 | F32 | blk.20.attn_norm.weight |
|
324: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.20.attn_output.weight |
|
325: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.20.attn_q_a.weight |
|
326: 1536 | 1536, 1, 1, 1 | F32 | blk.20.attn_q_a_norm.weight |
|
327: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.20.attn_q_b.weight |
|
328: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.20.ffn_down_exps.weight |
|
329: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.20.ffn_down_shexp.weight |
|
330: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.20.ffn_gate_exps.weight |
|
331: 819200 | 5120, 160, 1, 1 | F32 | blk.20.ffn_gate_inp.weight |
|
332: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.20.ffn_gate_shexp.weight |
|
333: 5120 | 5120, 1, 1, 1 | F32 | blk.20.ffn_norm.weight |
|
334: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.20.ffn_up_exps.weight |
|
335: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.20.ffn_up_shexp.weight |
|
336: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.21.attn_kv_a_mqa.weight |
|
337: 512 | 512, 1, 1, 1 | F32 | blk.21.attn_kv_a_norm.weight |
|
338: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.21.attn_kv_b.weight |
|
339: 5120 | 5120, 1, 1, 1 | F32 | blk.21.attn_norm.weight |
|
340: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.21.attn_output.weight |
|
341: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.21.attn_q_a.weight |
|
342: 1536 | 1536, 1, 1, 1 | F32 | blk.21.attn_q_a_norm.weight |
|
343: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.21.attn_q_b.weight |
|
344: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.21.ffn_down_exps.weight |
|
345: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.21.ffn_down_shexp.weight |
|
346: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.21.ffn_gate_exps.weight |
|
347: 819200 | 5120, 160, 1, 1 | F32 | blk.21.ffn_gate_inp.weight |
|
348: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.21.ffn_gate_shexp.weight |
|
349: 5120 | 5120, 1, 1, 1 | F32 | blk.21.ffn_norm.weight |
|
350: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.21.ffn_up_exps.weight |
|
351: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.21.ffn_up_shexp.weight |
|
352: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.22.attn_kv_a_mqa.weight |
|
353: 512 | 512, 1, 1, 1 | F32 | blk.22.attn_kv_a_norm.weight |
|
354: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.22.attn_kv_b.weight |
|
355: 5120 | 5120, 1, 1, 1 | F32 | blk.22.attn_norm.weight |
|
356: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.22.attn_output.weight |
|
357: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.22.attn_q_a.weight |
|
358: 1536 | 1536, 1, 1, 1 | F32 | blk.22.attn_q_a_norm.weight |
|
359: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.22.attn_q_b.weight |
|
360: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.22.ffn_down_exps.weight |
|
361: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.22.ffn_down_shexp.weight |
|
362: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.22.ffn_gate_exps.weight |
|
363: 819200 | 5120, 160, 1, 1 | F32 | blk.22.ffn_gate_inp.weight |
|
364: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.22.ffn_gate_shexp.weight |
|
365: 5120 | 5120, 1, 1, 1 | F32 | blk.22.ffn_norm.weight |
|
366: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.22.ffn_up_exps.weight |
|
367: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.22.ffn_up_shexp.weight |
|
368: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.23.attn_kv_a_mqa.weight |
|
369: 512 | 512, 1, 1, 1 | F32 | blk.23.attn_kv_a_norm.weight |
|
370: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.23.attn_kv_b.weight |
|
371: 5120 | 5120, 1, 1, 1 | F32 | blk.23.attn_norm.weight |
|
372: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.23.attn_output.weight |
|
373: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.23.attn_q_a.weight |
|
374: 1536 | 1536, 1, 1, 1 | F32 | blk.23.attn_q_a_norm.weight |
|
375: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.23.attn_q_b.weight |
|
376: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.23.ffn_down_exps.weight |
|
377: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.23.ffn_down_shexp.weight |
|
378: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.23.ffn_gate_exps.weight |
|
379: 819200 | 5120, 160, 1, 1 | F32 | blk.23.ffn_gate_inp.weight |
|
380: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.23.ffn_gate_shexp.weight |
|
381: 5120 | 5120, 1, 1, 1 | F32 | blk.23.ffn_norm.weight |
|
382: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.23.ffn_up_exps.weight |
|
383: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.23.ffn_up_shexp.weight |
|
384: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.24.attn_kv_a_mqa.weight |
|
385: 512 | 512, 1, 1, 1 | F32 | blk.24.attn_kv_a_norm.weight |
|
386: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.24.attn_kv_b.weight |
|
387: 5120 | 5120, 1, 1, 1 | F32 | blk.24.attn_norm.weight |
|
388: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.24.attn_output.weight |
|
389: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.24.attn_q_a.weight |
|
390: 1536 | 1536, 1, 1, 1 | F32 | blk.24.attn_q_a_norm.weight |
|
391: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.24.attn_q_b.weight |
|
392: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.24.ffn_down_exps.weight |
|
393: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.24.ffn_down_shexp.weight |
|
394: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.24.ffn_gate_exps.weight |
|
395: 819200 | 5120, 160, 1, 1 | F32 | blk.24.ffn_gate_inp.weight |
|
396: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.24.ffn_gate_shexp.weight |
|
397: 5120 | 5120, 1, 1, 1 | F32 | blk.24.ffn_norm.weight |
|
398: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.24.ffn_up_exps.weight |
|
399: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.24.ffn_up_shexp.weight |
|
400: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.25.attn_kv_a_mqa.weight |
|
401: 512 | 512, 1, 1, 1 | F32 | blk.25.attn_kv_a_norm.weight |
|
402: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.25.attn_kv_b.weight |
|
403: 5120 | 5120, 1, 1, 1 | F32 | blk.25.attn_norm.weight |
|
404: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.25.attn_output.weight |
|
405: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.25.attn_q_a.weight |
|
406: 1536 | 1536, 1, 1, 1 | F32 | blk.25.attn_q_a_norm.weight |
|
407: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.25.attn_q_b.weight |
|
408: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.25.ffn_down_exps.weight |
|
409: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.25.ffn_down_shexp.weight |
|
410: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.25.ffn_gate_exps.weight |
|
411: 819200 | 5120, 160, 1, 1 | F32 | blk.25.ffn_gate_inp.weight |
|
412: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.25.ffn_gate_shexp.weight |
|
413: 5120 | 5120, 1, 1, 1 | F32 | blk.25.ffn_norm.weight |
|
414: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.25.ffn_up_exps.weight |
|
415: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.25.ffn_up_shexp.weight |
|
416: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.26.attn_kv_a_mqa.weight |
|
417: 512 | 512, 1, 1, 1 | F32 | blk.26.attn_kv_a_norm.weight |
|
418: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.26.attn_kv_b.weight |
|
419: 5120 | 5120, 1, 1, 1 | F32 | blk.26.attn_norm.weight |
|
420: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.26.attn_output.weight |
|
421: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.26.attn_q_a.weight |
|
422: 1536 | 1536, 1, 1, 1 | F32 | blk.26.attn_q_a_norm.weight |
|
423: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.26.attn_q_b.weight |
|
424: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.26.ffn_down_exps.weight |
|
425: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.26.ffn_down_shexp.weight |
|
426: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.26.ffn_gate_exps.weight |
|
427: 819200 | 5120, 160, 1, 1 | F32 | blk.26.ffn_gate_inp.weight |
|
428: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.26.ffn_gate_shexp.weight |
|
429: 5120 | 5120, 1, 1, 1 | F32 | blk.26.ffn_norm.weight |
|
430: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.26.ffn_up_exps.weight |
|
431: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.26.ffn_up_shexp.weight |
|
432: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.27.attn_kv_a_mqa.weight |
|
433: 512 | 512, 1, 1, 1 | F32 | blk.27.attn_kv_a_norm.weight |
|
434: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.27.attn_kv_b.weight |
|
435: 5120 | 5120, 1, 1, 1 | F32 | blk.27.attn_norm.weight |
|
436: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.27.attn_output.weight |
|
437: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.27.attn_q_a.weight |
|
438: 1536 | 1536, 1, 1, 1 | F32 | blk.27.attn_q_a_norm.weight |
|
439: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.27.attn_q_b.weight |
|
440: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.27.ffn_down_exps.weight |
|
441: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.27.ffn_down_shexp.weight |
|
442: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.27.ffn_gate_exps.weight |
|
443: 819200 | 5120, 160, 1, 1 | F32 | blk.27.ffn_gate_inp.weight |
|
444: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.27.ffn_gate_shexp.weight |
|
445: 5120 | 5120, 1, 1, 1 | F32 | blk.27.ffn_norm.weight |
|
446: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.27.ffn_up_exps.weight |
|
447: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.27.ffn_up_shexp.weight |
|
448: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.28.attn_kv_a_mqa.weight |
|
449: 512 | 512, 1, 1, 1 | F32 | blk.28.attn_kv_a_norm.weight |
|
450: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.28.attn_kv_b.weight |
|
451: 5120 | 5120, 1, 1, 1 | F32 | blk.28.attn_norm.weight |
|
452: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.28.attn_output.weight |
|
453: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.28.attn_q_a.weight |
|
454: 1536 | 1536, 1, 1, 1 | F32 | blk.28.attn_q_a_norm.weight |
|
455: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.28.attn_q_b.weight |
|
456: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.28.ffn_down_exps.weight |
|
457: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.28.ffn_down_shexp.weight |
|
458: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.28.ffn_gate_exps.weight |
|
459: 819200 | 5120, 160, 1, 1 | F32 | blk.28.ffn_gate_inp.weight |
|
460: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.28.ffn_gate_shexp.weight |
|
461: 5120 | 5120, 1, 1, 1 | F32 | blk.28.ffn_norm.weight |
|
462: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.28.ffn_up_exps.weight |
|
463: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.28.ffn_up_shexp.weight |
|
464: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.29.attn_kv_a_mqa.weight |
|
465: 512 | 512, 1, 1, 1 | F32 | blk.29.attn_kv_a_norm.weight |
|
466: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.29.attn_kv_b.weight |
|
467: 5120 | 5120, 1, 1, 1 | F32 | blk.29.attn_norm.weight |
|
468: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.29.attn_output.weight |
|
469: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.29.attn_q_a.weight |
|
470: 1536 | 1536, 1, 1, 1 | F32 | blk.29.attn_q_a_norm.weight |
|
471: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.29.attn_q_b.weight |
|
472: 1258291200 | 1536, 5120, 160, 1 | IQ1_M | blk.29.ffn_down_exps.weight |
|
473: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.29.ffn_down_shexp.weight |
|
474: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.29.ffn_gate_exps.weight |
|
475: 819200 | 5120, 160, 1, 1 | F32 | blk.29.ffn_gate_inp.weight |
|
476: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.29.ffn_gate_shexp.weight |
|
477: 5120 | 5120, 1, 1, 1 | F32 | blk.29.ffn_norm.weight |
|
478: 1258291200 | 5120, 1536, 160, 1 | IQ1_M | blk.29.ffn_up_exps.weight |
|
479: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.29.ffn_up_shexp.weight |
|
480: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.30.attn_kv_a_mqa.weight |
|
|