|
INFO:gguf-dump:* Loading: DeepSeek-v2.5-1210-UD-iq2_s-00002-of-00002.gguf |
|
* File is LITTLE endian, script is running on a LITTLE endian host. |
|
* Dumping 6 key/value pair(s) |
|
1: UINT32 | 1 | GGUF.version = 3 |
|
2: UINT64 | 1 | GGUF.tensor_count = 479 |
|
3: UINT64 | 1 | GGUF.kv_count = 3 |
|
4: UINT16 | 1 | split.no = 1 |
|
5: INT32 | 1 | split.tensors.count = 959 |
|
6: UINT16 | 1 | split.count = 2 |
|
* Dumping 479 tensor(s) |
|
1: 512 | 512, 1, 1, 1 | F32 | blk.30.attn_kv_a_norm.weight |
|
2: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.30.attn_kv_b.weight |
|
3: 5120 | 5120, 1, 1, 1 | F32 | blk.30.attn_norm.weight |
|
4: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.30.attn_output.weight |
|
5: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.30.attn_q_a.weight |
|
6: 1536 | 1536, 1, 1, 1 | F32 | blk.30.attn_q_a_norm.weight |
|
7: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.30.attn_q_b.weight |
|
8: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.30.ffn_down_exps.weight |
|
9: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.30.ffn_down_shexp.weight |
|
10: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.30.ffn_gate_exps.weight |
|
11: 819200 | 5120, 160, 1, 1 | F32 | blk.30.ffn_gate_inp.weight |
|
12: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.30.ffn_gate_shexp.weight |
|
13: 5120 | 5120, 1, 1, 1 | F32 | blk.30.ffn_norm.weight |
|
14: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.30.ffn_up_exps.weight |
|
15: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.30.ffn_up_shexp.weight |
|
16: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.31.attn_kv_a_mqa.weight |
|
17: 512 | 512, 1, 1, 1 | F32 | blk.31.attn_kv_a_norm.weight |
|
18: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.31.attn_kv_b.weight |
|
19: 5120 | 5120, 1, 1, 1 | F32 | blk.31.attn_norm.weight |
|
20: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.31.attn_output.weight |
|
21: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.31.attn_q_a.weight |
|
22: 1536 | 1536, 1, 1, 1 | F32 | blk.31.attn_q_a_norm.weight |
|
23: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.31.attn_q_b.weight |
|
24: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.31.ffn_down_exps.weight |
|
25: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.31.ffn_down_shexp.weight |
|
26: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.31.ffn_gate_exps.weight |
|
27: 819200 | 5120, 160, 1, 1 | F32 | blk.31.ffn_gate_inp.weight |
|
28: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.31.ffn_gate_shexp.weight |
|
29: 5120 | 5120, 1, 1, 1 | F32 | blk.31.ffn_norm.weight |
|
30: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.31.ffn_up_exps.weight |
|
31: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.31.ffn_up_shexp.weight |
|
32: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.32.attn_kv_a_mqa.weight |
|
33: 512 | 512, 1, 1, 1 | F32 | blk.32.attn_kv_a_norm.weight |
|
34: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.32.attn_kv_b.weight |
|
35: 5120 | 5120, 1, 1, 1 | F32 | blk.32.attn_norm.weight |
|
36: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.32.attn_output.weight |
|
37: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.32.attn_q_a.weight |
|
38: 1536 | 1536, 1, 1, 1 | F32 | blk.32.attn_q_a_norm.weight |
|
39: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.32.attn_q_b.weight |
|
40: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.32.ffn_down_exps.weight |
|
41: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.32.ffn_down_shexp.weight |
|
42: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.32.ffn_gate_exps.weight |
|
43: 819200 | 5120, 160, 1, 1 | F32 | blk.32.ffn_gate_inp.weight |
|
44: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.32.ffn_gate_shexp.weight |
|
45: 5120 | 5120, 1, 1, 1 | F32 | blk.32.ffn_norm.weight |
|
46: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.32.ffn_up_exps.weight |
|
47: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.32.ffn_up_shexp.weight |
|
48: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.33.attn_kv_a_mqa.weight |
|
49: 512 | 512, 1, 1, 1 | F32 | blk.33.attn_kv_a_norm.weight |
|
50: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.33.attn_kv_b.weight |
|
51: 5120 | 5120, 1, 1, 1 | F32 | blk.33.attn_norm.weight |
|
52: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.33.attn_output.weight |
|
53: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.33.attn_q_a.weight |
|
54: 1536 | 1536, 1, 1, 1 | F32 | blk.33.attn_q_a_norm.weight |
|
55: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.33.attn_q_b.weight |
|
56: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.33.ffn_down_exps.weight |
|
57: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.33.ffn_down_shexp.weight |
|
58: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.33.ffn_gate_exps.weight |
|
59: 819200 | 5120, 160, 1, 1 | F32 | blk.33.ffn_gate_inp.weight |
|
60: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.33.ffn_gate_shexp.weight |
|
61: 5120 | 5120, 1, 1, 1 | F32 | blk.33.ffn_norm.weight |
|
62: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.33.ffn_up_exps.weight |
|
63: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.33.ffn_up_shexp.weight |
|
64: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.34.attn_kv_a_mqa.weight |
|
65: 512 | 512, 1, 1, 1 | F32 | blk.34.attn_kv_a_norm.weight |
|
66: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.34.attn_kv_b.weight |
|
67: 5120 | 5120, 1, 1, 1 | F32 | blk.34.attn_norm.weight |
|
68: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.34.attn_output.weight |
|
69: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.34.attn_q_a.weight |
|
70: 1536 | 1536, 1, 1, 1 | F32 | blk.34.attn_q_a_norm.weight |
|
71: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.34.attn_q_b.weight |
|
72: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.34.ffn_down_exps.weight |
|
73: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.34.ffn_down_shexp.weight |
|
74: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.34.ffn_gate_exps.weight |
|
75: 819200 | 5120, 160, 1, 1 | F32 | blk.34.ffn_gate_inp.weight |
|
76: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.34.ffn_gate_shexp.weight |
|
77: 5120 | 5120, 1, 1, 1 | F32 | blk.34.ffn_norm.weight |
|
78: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.34.ffn_up_exps.weight |
|
79: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.34.ffn_up_shexp.weight |
|
80: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.35.attn_kv_a_mqa.weight |
|
81: 512 | 512, 1, 1, 1 | F32 | blk.35.attn_kv_a_norm.weight |
|
82: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.35.attn_kv_b.weight |
|
83: 5120 | 5120, 1, 1, 1 | F32 | blk.35.attn_norm.weight |
|
84: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.35.attn_output.weight |
|
85: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.35.attn_q_a.weight |
|
86: 1536 | 1536, 1, 1, 1 | F32 | blk.35.attn_q_a_norm.weight |
|
87: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.35.attn_q_b.weight |
|
88: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.35.ffn_down_exps.weight |
|
89: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.35.ffn_down_shexp.weight |
|
90: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.35.ffn_gate_exps.weight |
|
91: 819200 | 5120, 160, 1, 1 | F32 | blk.35.ffn_gate_inp.weight |
|
92: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.35.ffn_gate_shexp.weight |
|
93: 5120 | 5120, 1, 1, 1 | F32 | blk.35.ffn_norm.weight |
|
94: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.35.ffn_up_exps.weight |
|
95: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.35.ffn_up_shexp.weight |
|
96: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.36.attn_kv_a_mqa.weight |
|
97: 512 | 512, 1, 1, 1 | F32 | blk.36.attn_kv_a_norm.weight |
|
98: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.36.attn_kv_b.weight |
|
99: 5120 | 5120, 1, 1, 1 | F32 | blk.36.attn_norm.weight |
|
100: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.36.attn_output.weight |
|
101: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.36.attn_q_a.weight |
|
102: 1536 | 1536, 1, 1, 1 | F32 | blk.36.attn_q_a_norm.weight |
|
103: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.36.attn_q_b.weight |
|
104: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.36.ffn_down_exps.weight |
|
105: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.36.ffn_down_shexp.weight |
|
106: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.36.ffn_gate_exps.weight |
|
107: 819200 | 5120, 160, 1, 1 | F32 | blk.36.ffn_gate_inp.weight |
|
108: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.36.ffn_gate_shexp.weight |
|
109: 5120 | 5120, 1, 1, 1 | F32 | blk.36.ffn_norm.weight |
|
110: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.36.ffn_up_exps.weight |
|
111: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.36.ffn_up_shexp.weight |
|
112: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.37.attn_kv_a_mqa.weight |
|
113: 512 | 512, 1, 1, 1 | F32 | blk.37.attn_kv_a_norm.weight |
|
114: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.37.attn_kv_b.weight |
|
115: 5120 | 5120, 1, 1, 1 | F32 | blk.37.attn_norm.weight |
|
116: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.37.attn_output.weight |
|
117: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.37.attn_q_a.weight |
|
118: 1536 | 1536, 1, 1, 1 | F32 | blk.37.attn_q_a_norm.weight |
|
119: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.37.attn_q_b.weight |
|
120: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.37.ffn_down_exps.weight |
|
121: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.37.ffn_down_shexp.weight |
|
122: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.37.ffn_gate_exps.weight |
|
123: 819200 | 5120, 160, 1, 1 | F32 | blk.37.ffn_gate_inp.weight |
|
124: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.37.ffn_gate_shexp.weight |
|
125: 5120 | 5120, 1, 1, 1 | F32 | blk.37.ffn_norm.weight |
|
126: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.37.ffn_up_exps.weight |
|
127: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.37.ffn_up_shexp.weight |
|
128: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.38.attn_kv_a_mqa.weight |
|
129: 512 | 512, 1, 1, 1 | F32 | blk.38.attn_kv_a_norm.weight |
|
130: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.38.attn_kv_b.weight |
|
131: 5120 | 5120, 1, 1, 1 | F32 | blk.38.attn_norm.weight |
|
132: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.38.attn_output.weight |
|
133: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.38.attn_q_a.weight |
|
134: 1536 | 1536, 1, 1, 1 | F32 | blk.38.attn_q_a_norm.weight |
|
135: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.38.attn_q_b.weight |
|
136: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.38.ffn_down_exps.weight |
|
137: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.38.ffn_down_shexp.weight |
|
138: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.38.ffn_gate_exps.weight |
|
139: 819200 | 5120, 160, 1, 1 | F32 | blk.38.ffn_gate_inp.weight |
|
140: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.38.ffn_gate_shexp.weight |
|
141: 5120 | 5120, 1, 1, 1 | F32 | blk.38.ffn_norm.weight |
|
142: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.38.ffn_up_exps.weight |
|
143: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.38.ffn_up_shexp.weight |
|
144: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.39.attn_kv_a_mqa.weight |
|
145: 512 | 512, 1, 1, 1 | F32 | blk.39.attn_kv_a_norm.weight |
|
146: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.39.attn_kv_b.weight |
|
147: 5120 | 5120, 1, 1, 1 | F32 | blk.39.attn_norm.weight |
|
148: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.39.attn_output.weight |
|
149: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.39.attn_q_a.weight |
|
150: 1536 | 1536, 1, 1, 1 | F32 | blk.39.attn_q_a_norm.weight |
|
151: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.39.attn_q_b.weight |
|
152: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.39.ffn_down_exps.weight |
|
153: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.39.ffn_down_shexp.weight |
|
154: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.39.ffn_gate_exps.weight |
|
155: 819200 | 5120, 160, 1, 1 | F32 | blk.39.ffn_gate_inp.weight |
|
156: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.39.ffn_gate_shexp.weight |
|
157: 5120 | 5120, 1, 1, 1 | F32 | blk.39.ffn_norm.weight |
|
158: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.39.ffn_up_exps.weight |
|
159: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.39.ffn_up_shexp.weight |
|
160: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.40.attn_kv_a_mqa.weight |
|
161: 512 | 512, 1, 1, 1 | F32 | blk.40.attn_kv_a_norm.weight |
|
162: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.40.attn_kv_b.weight |
|
163: 5120 | 5120, 1, 1, 1 | F32 | blk.40.attn_norm.weight |
|
164: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.40.attn_output.weight |
|
165: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.40.attn_q_a.weight |
|
166: 1536 | 1536, 1, 1, 1 | F32 | blk.40.attn_q_a_norm.weight |
|
167: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.40.attn_q_b.weight |
|
168: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.40.ffn_down_exps.weight |
|
169: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.40.ffn_down_shexp.weight |
|
170: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.40.ffn_gate_exps.weight |
|
171: 819200 | 5120, 160, 1, 1 | F32 | blk.40.ffn_gate_inp.weight |
|
172: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.40.ffn_gate_shexp.weight |
|
173: 5120 | 5120, 1, 1, 1 | F32 | blk.40.ffn_norm.weight |
|
174: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.40.ffn_up_exps.weight |
|
175: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.40.ffn_up_shexp.weight |
|
176: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.41.attn_kv_a_mqa.weight |
|
177: 512 | 512, 1, 1, 1 | F32 | blk.41.attn_kv_a_norm.weight |
|
178: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.41.attn_kv_b.weight |
|
179: 5120 | 5120, 1, 1, 1 | F32 | blk.41.attn_norm.weight |
|
180: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.41.attn_output.weight |
|
181: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.41.attn_q_a.weight |
|
182: 1536 | 1536, 1, 1, 1 | F32 | blk.41.attn_q_a_norm.weight |
|
183: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.41.attn_q_b.weight |
|
184: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.41.ffn_down_exps.weight |
|
185: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.41.ffn_down_shexp.weight |
|
186: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.41.ffn_gate_exps.weight |
|
187: 819200 | 5120, 160, 1, 1 | F32 | blk.41.ffn_gate_inp.weight |
|
188: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.41.ffn_gate_shexp.weight |
|
189: 5120 | 5120, 1, 1, 1 | F32 | blk.41.ffn_norm.weight |
|
190: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.41.ffn_up_exps.weight |
|
191: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.41.ffn_up_shexp.weight |
|
192: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.42.attn_kv_a_mqa.weight |
|
193: 512 | 512, 1, 1, 1 | F32 | blk.42.attn_kv_a_norm.weight |
|
194: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.42.attn_kv_b.weight |
|
195: 5120 | 5120, 1, 1, 1 | F32 | blk.42.attn_norm.weight |
|
196: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.42.attn_output.weight |
|
197: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.42.attn_q_a.weight |
|
198: 1536 | 1536, 1, 1, 1 | F32 | blk.42.attn_q_a_norm.weight |
|
199: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.42.attn_q_b.weight |
|
200: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.42.ffn_down_exps.weight |
|
201: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.42.ffn_down_shexp.weight |
|
202: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.42.ffn_gate_exps.weight |
|
203: 819200 | 5120, 160, 1, 1 | F32 | blk.42.ffn_gate_inp.weight |
|
204: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.42.ffn_gate_shexp.weight |
|
205: 5120 | 5120, 1, 1, 1 | F32 | blk.42.ffn_norm.weight |
|
206: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.42.ffn_up_exps.weight |
|
207: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.42.ffn_up_shexp.weight |
|
208: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.43.attn_kv_a_mqa.weight |
|
209: 512 | 512, 1, 1, 1 | F32 | blk.43.attn_kv_a_norm.weight |
|
210: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.43.attn_kv_b.weight |
|
211: 5120 | 5120, 1, 1, 1 | F32 | blk.43.attn_norm.weight |
|
212: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.43.attn_output.weight |
|
213: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.43.attn_q_a.weight |
|
214: 1536 | 1536, 1, 1, 1 | F32 | blk.43.attn_q_a_norm.weight |
|
215: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.43.attn_q_b.weight |
|
216: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.43.ffn_down_exps.weight |
|
217: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.43.ffn_down_shexp.weight |
|
218: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.43.ffn_gate_exps.weight |
|
219: 819200 | 5120, 160, 1, 1 | F32 | blk.43.ffn_gate_inp.weight |
|
220: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.43.ffn_gate_shexp.weight |
|
221: 5120 | 5120, 1, 1, 1 | F32 | blk.43.ffn_norm.weight |
|
222: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.43.ffn_up_exps.weight |
|
223: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.43.ffn_up_shexp.weight |
|
224: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.44.attn_kv_a_mqa.weight |
|
225: 512 | 512, 1, 1, 1 | F32 | blk.44.attn_kv_a_norm.weight |
|
226: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.44.attn_kv_b.weight |
|
227: 5120 | 5120, 1, 1, 1 | F32 | blk.44.attn_norm.weight |
|
228: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.44.attn_output.weight |
|
229: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.44.attn_q_a.weight |
|
230: 1536 | 1536, 1, 1, 1 | F32 | blk.44.attn_q_a_norm.weight |
|
231: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.44.attn_q_b.weight |
|
232: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.44.ffn_down_exps.weight |
|
233: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.44.ffn_down_shexp.weight |
|
234: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.44.ffn_gate_exps.weight |
|
235: 819200 | 5120, 160, 1, 1 | F32 | blk.44.ffn_gate_inp.weight |
|
236: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.44.ffn_gate_shexp.weight |
|
237: 5120 | 5120, 1, 1, 1 | F32 | blk.44.ffn_norm.weight |
|
238: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.44.ffn_up_exps.weight |
|
239: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.44.ffn_up_shexp.weight |
|
240: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.45.attn_kv_a_mqa.weight |
|
241: 512 | 512, 1, 1, 1 | F32 | blk.45.attn_kv_a_norm.weight |
|
242: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.45.attn_kv_b.weight |
|
243: 5120 | 5120, 1, 1, 1 | F32 | blk.45.attn_norm.weight |
|
244: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.45.attn_output.weight |
|
245: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.45.attn_q_a.weight |
|
246: 1536 | 1536, 1, 1, 1 | F32 | blk.45.attn_q_a_norm.weight |
|
247: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.45.attn_q_b.weight |
|
248: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.45.ffn_down_exps.weight |
|
249: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.45.ffn_down_shexp.weight |
|
250: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.45.ffn_gate_exps.weight |
|
251: 819200 | 5120, 160, 1, 1 | F32 | blk.45.ffn_gate_inp.weight |
|
252: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.45.ffn_gate_shexp.weight |
|
253: 5120 | 5120, 1, 1, 1 | F32 | blk.45.ffn_norm.weight |
|
254: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.45.ffn_up_exps.weight |
|
255: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.45.ffn_up_shexp.weight |
|
256: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.46.attn_kv_a_mqa.weight |
|
257: 512 | 512, 1, 1, 1 | F32 | blk.46.attn_kv_a_norm.weight |
|
258: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.46.attn_kv_b.weight |
|
259: 5120 | 5120, 1, 1, 1 | F32 | blk.46.attn_norm.weight |
|
260: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.46.attn_output.weight |
|
261: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.46.attn_q_a.weight |
|
262: 1536 | 1536, 1, 1, 1 | F32 | blk.46.attn_q_a_norm.weight |
|
263: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.46.attn_q_b.weight |
|
264: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.46.ffn_down_exps.weight |
|
265: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.46.ffn_down_shexp.weight |
|
266: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.46.ffn_gate_exps.weight |
|
267: 819200 | 5120, 160, 1, 1 | F32 | blk.46.ffn_gate_inp.weight |
|
268: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.46.ffn_gate_shexp.weight |
|
269: 5120 | 5120, 1, 1, 1 | F32 | blk.46.ffn_norm.weight |
|
270: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.46.ffn_up_exps.weight |
|
271: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.46.ffn_up_shexp.weight |
|
272: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.47.attn_kv_a_mqa.weight |
|
273: 512 | 512, 1, 1, 1 | F32 | blk.47.attn_kv_a_norm.weight |
|
274: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.47.attn_kv_b.weight |
|
275: 5120 | 5120, 1, 1, 1 | F32 | blk.47.attn_norm.weight |
|
276: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.47.attn_output.weight |
|
277: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.47.attn_q_a.weight |
|
278: 1536 | 1536, 1, 1, 1 | F32 | blk.47.attn_q_a_norm.weight |
|
279: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.47.attn_q_b.weight |
|
280: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.47.ffn_down_exps.weight |
|
281: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.47.ffn_down_shexp.weight |
|
282: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.47.ffn_gate_exps.weight |
|
283: 819200 | 5120, 160, 1, 1 | F32 | blk.47.ffn_gate_inp.weight |
|
284: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.47.ffn_gate_shexp.weight |
|
285: 5120 | 5120, 1, 1, 1 | F32 | blk.47.ffn_norm.weight |
|
286: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.47.ffn_up_exps.weight |
|
287: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.47.ffn_up_shexp.weight |
|
288: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.48.attn_kv_a_mqa.weight |
|
289: 512 | 512, 1, 1, 1 | F32 | blk.48.attn_kv_a_norm.weight |
|
290: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.48.attn_kv_b.weight |
|
291: 5120 | 5120, 1, 1, 1 | F32 | blk.48.attn_norm.weight |
|
292: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.48.attn_output.weight |
|
293: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.48.attn_q_a.weight |
|
294: 1536 | 1536, 1, 1, 1 | F32 | blk.48.attn_q_a_norm.weight |
|
295: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.48.attn_q_b.weight |
|
296: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.48.ffn_down_exps.weight |
|
297: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.48.ffn_down_shexp.weight |
|
298: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.48.ffn_gate_exps.weight |
|
299: 819200 | 5120, 160, 1, 1 | F32 | blk.48.ffn_gate_inp.weight |
|
300: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.48.ffn_gate_shexp.weight |
|
301: 5120 | 5120, 1, 1, 1 | F32 | blk.48.ffn_norm.weight |
|
302: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.48.ffn_up_exps.weight |
|
303: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.48.ffn_up_shexp.weight |
|
304: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.49.attn_kv_a_mqa.weight |
|
305: 512 | 512, 1, 1, 1 | F32 | blk.49.attn_kv_a_norm.weight |
|
306: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.49.attn_kv_b.weight |
|
307: 5120 | 5120, 1, 1, 1 | F32 | blk.49.attn_norm.weight |
|
308: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.49.attn_output.weight |
|
309: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.49.attn_q_a.weight |
|
310: 1536 | 1536, 1, 1, 1 | F32 | blk.49.attn_q_a_norm.weight |
|
311: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.49.attn_q_b.weight |
|
312: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.49.ffn_down_exps.weight |
|
313: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.49.ffn_down_shexp.weight |
|
314: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.49.ffn_gate_exps.weight |
|
315: 819200 | 5120, 160, 1, 1 | F32 | blk.49.ffn_gate_inp.weight |
|
316: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.49.ffn_gate_shexp.weight |
|
317: 5120 | 5120, 1, 1, 1 | F32 | blk.49.ffn_norm.weight |
|
318: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.49.ffn_up_exps.weight |
|
319: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.49.ffn_up_shexp.weight |
|
320: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.50.attn_kv_a_mqa.weight |
|
321: 512 | 512, 1, 1, 1 | F32 | blk.50.attn_kv_a_norm.weight |
|
322: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.50.attn_kv_b.weight |
|
323: 5120 | 5120, 1, 1, 1 | F32 | blk.50.attn_norm.weight |
|
324: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.50.attn_output.weight |
|
325: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.50.attn_q_a.weight |
|
326: 1536 | 1536, 1, 1, 1 | F32 | blk.50.attn_q_a_norm.weight |
|
327: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.50.attn_q_b.weight |
|
328: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.50.ffn_down_exps.weight |
|
329: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.50.ffn_down_shexp.weight |
|
330: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.50.ffn_gate_exps.weight |
|
331: 819200 | 5120, 160, 1, 1 | F32 | blk.50.ffn_gate_inp.weight |
|
332: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.50.ffn_gate_shexp.weight |
|
333: 5120 | 5120, 1, 1, 1 | F32 | blk.50.ffn_norm.weight |
|
334: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.50.ffn_up_exps.weight |
|
335: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.50.ffn_up_shexp.weight |
|
336: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.51.attn_kv_a_mqa.weight |
|
337: 512 | 512, 1, 1, 1 | F32 | blk.51.attn_kv_a_norm.weight |
|
338: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.51.attn_kv_b.weight |
|
339: 5120 | 5120, 1, 1, 1 | F32 | blk.51.attn_norm.weight |
|
340: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.51.attn_output.weight |
|
341: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.51.attn_q_a.weight |
|
342: 1536 | 1536, 1, 1, 1 | F32 | blk.51.attn_q_a_norm.weight |
|
343: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.51.attn_q_b.weight |
|
344: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.51.ffn_down_exps.weight |
|
345: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.51.ffn_down_shexp.weight |
|
346: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.51.ffn_gate_exps.weight |
|
347: 819200 | 5120, 160, 1, 1 | F32 | blk.51.ffn_gate_inp.weight |
|
348: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.51.ffn_gate_shexp.weight |
|
349: 5120 | 5120, 1, 1, 1 | F32 | blk.51.ffn_norm.weight |
|
350: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.51.ffn_up_exps.weight |
|
351: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.51.ffn_up_shexp.weight |
|
352: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.52.attn_kv_a_mqa.weight |
|
353: 512 | 512, 1, 1, 1 | F32 | blk.52.attn_kv_a_norm.weight |
|
354: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.52.attn_kv_b.weight |
|
355: 5120 | 5120, 1, 1, 1 | F32 | blk.52.attn_norm.weight |
|
356: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.52.attn_output.weight |
|
357: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.52.attn_q_a.weight |
|
358: 1536 | 1536, 1, 1, 1 | F32 | blk.52.attn_q_a_norm.weight |
|
359: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.52.attn_q_b.weight |
|
360: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.52.ffn_down_exps.weight |
|
361: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.52.ffn_down_shexp.weight |
|
362: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.52.ffn_gate_exps.weight |
|
363: 819200 | 5120, 160, 1, 1 | F32 | blk.52.ffn_gate_inp.weight |
|
364: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.52.ffn_gate_shexp.weight |
|
365: 5120 | 5120, 1, 1, 1 | F32 | blk.52.ffn_norm.weight |
|
366: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.52.ffn_up_exps.weight |
|
367: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.52.ffn_up_shexp.weight |
|
368: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.53.attn_kv_a_mqa.weight |
|
369: 512 | 512, 1, 1, 1 | F32 | blk.53.attn_kv_a_norm.weight |
|
370: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.53.attn_kv_b.weight |
|
371: 5120 | 5120, 1, 1, 1 | F32 | blk.53.attn_norm.weight |
|
372: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.53.attn_output.weight |
|
373: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.53.attn_q_a.weight |
|
374: 1536 | 1536, 1, 1, 1 | F32 | blk.53.attn_q_a_norm.weight |
|
375: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.53.attn_q_b.weight |
|
376: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.53.ffn_down_exps.weight |
|
377: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.53.ffn_down_shexp.weight |
|
378: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.53.ffn_gate_exps.weight |
|
379: 819200 | 5120, 160, 1, 1 | F32 | blk.53.ffn_gate_inp.weight |
|
380: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.53.ffn_gate_shexp.weight |
|
381: 5120 | 5120, 1, 1, 1 | F32 | blk.53.ffn_norm.weight |
|
382: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.53.ffn_up_exps.weight |
|
383: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.53.ffn_up_shexp.weight |
|
384: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.54.attn_kv_a_mqa.weight |
|
385: 512 | 512, 1, 1, 1 | F32 | blk.54.attn_kv_a_norm.weight |
|
386: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.54.attn_kv_b.weight |
|
387: 5120 | 5120, 1, 1, 1 | F32 | blk.54.attn_norm.weight |
|
388: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.54.attn_output.weight |
|
389: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.54.attn_q_a.weight |
|
390: 1536 | 1536, 1, 1, 1 | F32 | blk.54.attn_q_a_norm.weight |
|
391: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.54.attn_q_b.weight |
|
392: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.54.ffn_down_exps.weight |
|
393: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.54.ffn_down_shexp.weight |
|
394: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.54.ffn_gate_exps.weight |
|
395: 819200 | 5120, 160, 1, 1 | F32 | blk.54.ffn_gate_inp.weight |
|
396: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.54.ffn_gate_shexp.weight |
|
397: 5120 | 5120, 1, 1, 1 | F32 | blk.54.ffn_norm.weight |
|
398: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.54.ffn_up_exps.weight |
|
399: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.54.ffn_up_shexp.weight |
|
400: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.55.attn_kv_a_mqa.weight |
|
401: 512 | 512, 1, 1, 1 | F32 | blk.55.attn_kv_a_norm.weight |
|
402: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.55.attn_kv_b.weight |
|
403: 5120 | 5120, 1, 1, 1 | F32 | blk.55.attn_norm.weight |
|
404: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.55.attn_output.weight |
|
405: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.55.attn_q_a.weight |
|
406: 1536 | 1536, 1, 1, 1 | F32 | blk.55.attn_q_a_norm.weight |
|
407: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.55.attn_q_b.weight |
|
408: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.55.ffn_down_exps.weight |
|
409: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.55.ffn_down_shexp.weight |
|
410: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.55.ffn_gate_exps.weight |
|
411: 819200 | 5120, 160, 1, 1 | F32 | blk.55.ffn_gate_inp.weight |
|
412: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.55.ffn_gate_shexp.weight |
|
413: 5120 | 5120, 1, 1, 1 | F32 | blk.55.ffn_norm.weight |
|
414: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.55.ffn_up_exps.weight |
|
415: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.55.ffn_up_shexp.weight |
|
416: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.56.attn_kv_a_mqa.weight |
|
417: 512 | 512, 1, 1, 1 | F32 | blk.56.attn_kv_a_norm.weight |
|
418: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.56.attn_kv_b.weight |
|
419: 5120 | 5120, 1, 1, 1 | F32 | blk.56.attn_norm.weight |
|
420: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.56.attn_output.weight |
|
421: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.56.attn_q_a.weight |
|
422: 1536 | 1536, 1, 1, 1 | F32 | blk.56.attn_q_a_norm.weight |
|
423: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.56.attn_q_b.weight |
|
424: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.56.ffn_down_exps.weight |
|
425: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.56.ffn_down_shexp.weight |
|
426: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.56.ffn_gate_exps.weight |
|
427: 819200 | 5120, 160, 1, 1 | F32 | blk.56.ffn_gate_inp.weight |
|
428: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.56.ffn_gate_shexp.weight |
|
429: 5120 | 5120, 1, 1, 1 | F32 | blk.56.ffn_norm.weight |
|
430: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.56.ffn_up_exps.weight |
|
431: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.56.ffn_up_shexp.weight |
|
432: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.57.attn_kv_a_mqa.weight |
|
433: 512 | 512, 1, 1, 1 | F32 | blk.57.attn_kv_a_norm.weight |
|
434: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.57.attn_kv_b.weight |
|
435: 5120 | 5120, 1, 1, 1 | F32 | blk.57.attn_norm.weight |
|
436: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.57.attn_output.weight |
|
437: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.57.attn_q_a.weight |
|
438: 1536 | 1536, 1, 1, 1 | F32 | blk.57.attn_q_a_norm.weight |
|
439: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.57.attn_q_b.weight |
|
440: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.57.ffn_down_exps.weight |
|
441: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.57.ffn_down_shexp.weight |
|
442: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.57.ffn_gate_exps.weight |
|
443: 819200 | 5120, 160, 1, 1 | F32 | blk.57.ffn_gate_inp.weight |
|
444: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.57.ffn_gate_shexp.weight |
|
445: 5120 | 5120, 1, 1, 1 | F32 | blk.57.ffn_norm.weight |
|
446: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.57.ffn_up_exps.weight |
|
447: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.57.ffn_up_shexp.weight |
|
448: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.58.attn_kv_a_mqa.weight |
|
449: 512 | 512, 1, 1, 1 | F32 | blk.58.attn_kv_a_norm.weight |
|
450: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.58.attn_kv_b.weight |
|
451: 5120 | 5120, 1, 1, 1 | F32 | blk.58.attn_norm.weight |
|
452: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.58.attn_output.weight |
|
453: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.58.attn_q_a.weight |
|
454: 1536 | 1536, 1, 1, 1 | F32 | blk.58.attn_q_a_norm.weight |
|
455: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.58.attn_q_b.weight |
|
456: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.58.ffn_down_exps.weight |
|
457: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.58.ffn_down_shexp.weight |
|
458: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.58.ffn_gate_exps.weight |
|
459: 819200 | 5120, 160, 1, 1 | F32 | blk.58.ffn_gate_inp.weight |
|
460: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.58.ffn_gate_shexp.weight |
|
461: 5120 | 5120, 1, 1, 1 | F32 | blk.58.ffn_norm.weight |
|
462: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.58.ffn_up_exps.weight |
|
463: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.58.ffn_up_shexp.weight |
|
464: 2949120 | 5120, 576, 1, 1 | Q6_K | blk.59.attn_kv_a_mqa.weight |
|
465: 512 | 512, 1, 1, 1 | F32 | blk.59.attn_kv_a_norm.weight |
|
466: 16777216 | 512, 32768, 1, 1 | Q6_K | blk.59.attn_kv_b.weight |
|
467: 5120 | 5120, 1, 1, 1 | F32 | blk.59.attn_norm.weight |
|
468: 83886080 | 16384, 5120, 1, 1 | Q4_K | blk.59.attn_output.weight |
|
469: 7864320 | 5120, 1536, 1, 1 | Q4_K | blk.59.attn_q_a.weight |
|
470: 1536 | 1536, 1, 1, 1 | F32 | blk.59.attn_q_a_norm.weight |
|
471: 37748736 | 1536, 24576, 1, 1 | Q4_K | blk.59.attn_q_b.weight |
|
472: 1258291200 | 1536, 5120, 160, 1 | Q2_K | blk.59.ffn_down_exps.weight |
|
473: 15728640 | 3072, 5120, 1, 1 | Q6_K | blk.59.ffn_down_shexp.weight |
|
474: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.59.ffn_gate_exps.weight |
|
475: 819200 | 5120, 160, 1, 1 | F32 | blk.59.ffn_gate_inp.weight |
|
476: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.59.ffn_gate_shexp.weight |
|
477: 5120 | 5120, 1, 1, 1 | F32 | blk.59.ffn_norm.weight |
|
478: 1258291200 | 5120, 1536, 160, 1 | IQ2_XS | blk.59.ffn_up_exps.weight |
|
479: 15728640 | 5120, 3072, 1, 1 | Q5_K | blk.59.ffn_up_shexp.weight |
|
|