diff --git "a/config.json" "b/config.json" --- "a/config.json" +++ "b/config.json" @@ -1,5 +1,5 @@ { - "_name_or_path": "nvidia/Llama-3.1-Nemotron-70B-Instruct-HF", + "_name_or_path": "/home/aiscuser/yangwang/convert_model/models/VPTQ-community--Llama-3.1-Nemotron-70B-Instruct-HF-v8-k65536-65536-woft", "architectures": [ "LlamaForCausalLM" ], @@ -23,27 +23,12 @@ "num_hidden_layers": 80, "num_key_value_heads": 8, "pretraining_tp": 1, - "rms_norm_eps": 1e-05, - "rope_scaling": { - "factor": 8.0, - "high_freq_factor": 4.0, - "low_freq_factor": 1.0, - "original_max_position_embeddings": 8192, - "rope_type": "llama3" - }, - "rope_theta": 500000.0, - "tie_word_embeddings": false, - "torch_dtype": "bfloat16", - "transformers_version": "4.45.2", - "use_cache": true, - "vocab_size": 128256, "quantization_config": { - "quant_method": "vptq", "config_for_layers": { "model.layers.0.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -67,7 +52,7 @@ "model.layers.0.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -91,7 +76,7 @@ "model.layers.0.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -115,7 +100,7 @@ "model.layers.0.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -139,7 +124,7 @@ "model.layers.0.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -163,7 +148,7 @@ "model.layers.0.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -187,7 +172,7 @@ "model.layers.0.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -211,7 +196,7 @@ "model.layers.1.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -235,7 +220,7 @@ "model.layers.1.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -259,7 +244,7 @@ "model.layers.1.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -283,7 +268,7 @@ "model.layers.1.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -307,7 +292,7 @@ "model.layers.1.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -331,7 +316,7 @@ "model.layers.1.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -355,7 +340,7 @@ "model.layers.1.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -379,7 +364,7 @@ "model.layers.10.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -403,7 +388,7 @@ "model.layers.10.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -427,7 +412,7 @@ "model.layers.10.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -451,7 +436,7 @@ "model.layers.10.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -475,7 +460,7 @@ "model.layers.10.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -499,7 +484,7 @@ "model.layers.10.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -523,7 +508,7 @@ "model.layers.10.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -547,7 +532,7 @@ "model.layers.11.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -571,7 +556,7 @@ "model.layers.11.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -595,7 +580,7 @@ "model.layers.11.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -619,7 +604,7 @@ "model.layers.11.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -643,7 +628,7 @@ "model.layers.11.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -667,7 +652,7 @@ "model.layers.11.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -691,7 +676,7 @@ "model.layers.11.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -715,7 +700,7 @@ "model.layers.12.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -739,7 +724,7 @@ "model.layers.12.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -763,7 +748,7 @@ "model.layers.12.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -787,7 +772,7 @@ "model.layers.12.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -811,7 +796,7 @@ "model.layers.12.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -835,7 +820,7 @@ "model.layers.12.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -859,7 +844,7 @@ "model.layers.12.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -883,7 +868,7 @@ "model.layers.13.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -907,7 +892,7 @@ "model.layers.13.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -931,7 +916,7 @@ "model.layers.13.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -955,7 +940,7 @@ "model.layers.13.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -979,7 +964,7 @@ "model.layers.13.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1003,7 +988,7 @@ "model.layers.13.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1027,7 +1012,7 @@ "model.layers.13.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1051,7 +1036,7 @@ "model.layers.14.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -1075,7 +1060,7 @@ "model.layers.14.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1099,7 +1084,7 @@ "model.layers.14.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1123,7 +1108,7 @@ "model.layers.14.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1147,7 +1132,7 @@ "model.layers.14.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1171,7 +1156,7 @@ "model.layers.14.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1195,7 +1180,7 @@ "model.layers.14.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1219,7 +1204,7 @@ "model.layers.15.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -1243,7 +1228,7 @@ "model.layers.15.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1267,7 +1252,7 @@ "model.layers.15.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1291,7 +1276,7 @@ "model.layers.15.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1315,7 +1300,7 @@ "model.layers.15.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1339,7 +1324,7 @@ "model.layers.15.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1363,7 +1348,7 @@ "model.layers.15.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1387,7 +1372,7 @@ "model.layers.16.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -1411,7 +1396,7 @@ "model.layers.16.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1435,7 +1420,7 @@ "model.layers.16.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1459,7 +1444,7 @@ "model.layers.16.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1483,7 +1468,7 @@ "model.layers.16.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1507,7 +1492,7 @@ "model.layers.16.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1531,7 +1516,7 @@ "model.layers.16.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1555,7 +1540,7 @@ "model.layers.17.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -1579,7 +1564,7 @@ "model.layers.17.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1603,7 +1588,7 @@ "model.layers.17.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1627,7 +1612,7 @@ "model.layers.17.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1651,7 +1636,7 @@ "model.layers.17.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1675,7 +1660,7 @@ "model.layers.17.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1699,7 +1684,7 @@ "model.layers.17.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1723,7 +1708,7 @@ "model.layers.18.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -1747,7 +1732,7 @@ "model.layers.18.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1771,7 +1756,7 @@ "model.layers.18.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1795,7 +1780,7 @@ "model.layers.18.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1819,7 +1804,7 @@ "model.layers.18.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1843,7 +1828,7 @@ "model.layers.18.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1867,7 +1852,7 @@ "model.layers.18.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1891,7 +1876,7 @@ "model.layers.19.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -1915,7 +1900,7 @@ "model.layers.19.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1939,7 +1924,7 @@ "model.layers.19.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1963,7 +1948,7 @@ "model.layers.19.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1987,7 +1972,7 @@ "model.layers.19.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2011,7 +1996,7 @@ "model.layers.19.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2035,7 +2020,7 @@ "model.layers.19.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2059,7 +2044,7 @@ "model.layers.2.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -2083,7 +2068,7 @@ "model.layers.2.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2107,7 +2092,7 @@ "model.layers.2.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2131,7 +2116,7 @@ "model.layers.2.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2155,7 +2140,7 @@ "model.layers.2.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2179,7 +2164,7 @@ "model.layers.2.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2203,7 +2188,7 @@ "model.layers.2.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2227,7 +2212,7 @@ "model.layers.20.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -2251,7 +2236,7 @@ "model.layers.20.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2275,7 +2260,7 @@ "model.layers.20.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2299,7 +2284,7 @@ "model.layers.20.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2323,7 +2308,7 @@ "model.layers.20.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2347,7 +2332,7 @@ "model.layers.20.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2371,7 +2356,7 @@ "model.layers.20.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2395,7 +2380,7 @@ "model.layers.21.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -2419,7 +2404,7 @@ "model.layers.21.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2443,7 +2428,7 @@ "model.layers.21.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2467,7 +2452,7 @@ "model.layers.21.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2491,7 +2476,7 @@ "model.layers.21.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2515,7 +2500,7 @@ "model.layers.21.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2539,7 +2524,7 @@ "model.layers.21.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2563,7 +2548,7 @@ "model.layers.22.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -2587,7 +2572,7 @@ "model.layers.22.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2611,7 +2596,7 @@ "model.layers.22.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2635,7 +2620,7 @@ "model.layers.22.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2659,7 +2644,7 @@ "model.layers.22.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2683,7 +2668,7 @@ "model.layers.22.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2707,7 +2692,7 @@ "model.layers.22.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2731,7 +2716,7 @@ "model.layers.23.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -2755,7 +2740,7 @@ "model.layers.23.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2779,7 +2764,7 @@ "model.layers.23.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2803,7 +2788,7 @@ "model.layers.23.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2827,7 +2812,7 @@ "model.layers.23.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2851,7 +2836,7 @@ "model.layers.23.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2875,7 +2860,7 @@ "model.layers.23.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2899,7 +2884,7 @@ "model.layers.24.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -2923,7 +2908,7 @@ "model.layers.24.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2947,7 +2932,7 @@ "model.layers.24.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2971,7 +2956,7 @@ "model.layers.24.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2995,7 +2980,7 @@ "model.layers.24.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3019,7 +3004,7 @@ "model.layers.24.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3043,7 +3028,7 @@ "model.layers.24.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3067,7 +3052,7 @@ "model.layers.25.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -3091,7 +3076,7 @@ "model.layers.25.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3115,7 +3100,7 @@ "model.layers.25.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3139,7 +3124,7 @@ "model.layers.25.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3163,7 +3148,7 @@ "model.layers.25.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3187,7 +3172,7 @@ "model.layers.25.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3211,7 +3196,7 @@ "model.layers.25.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3235,7 +3220,7 @@ "model.layers.26.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -3259,7 +3244,7 @@ "model.layers.26.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3283,7 +3268,7 @@ "model.layers.26.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3307,7 +3292,7 @@ "model.layers.26.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3331,7 +3316,7 @@ "model.layers.26.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3355,7 +3340,7 @@ "model.layers.26.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3379,7 +3364,7 @@ "model.layers.26.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3403,7 +3388,7 @@ "model.layers.27.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -3427,7 +3412,7 @@ "model.layers.27.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3451,7 +3436,7 @@ "model.layers.27.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3475,7 +3460,7 @@ "model.layers.27.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3499,7 +3484,7 @@ "model.layers.27.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3523,7 +3508,7 @@ "model.layers.27.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3547,7 +3532,7 @@ "model.layers.27.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3571,7 +3556,7 @@ "model.layers.28.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -3595,7 +3580,7 @@ "model.layers.28.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3619,7 +3604,7 @@ "model.layers.28.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3643,7 +3628,7 @@ "model.layers.28.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3667,7 +3652,7 @@ "model.layers.28.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3691,7 +3676,7 @@ "model.layers.28.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3715,7 +3700,7 @@ "model.layers.28.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3739,7 +3724,7 @@ "model.layers.29.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -3763,7 +3748,7 @@ "model.layers.29.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3787,7 +3772,7 @@ "model.layers.29.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3811,7 +3796,7 @@ "model.layers.29.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3835,7 +3820,7 @@ "model.layers.29.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3859,7 +3844,7 @@ "model.layers.29.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3883,7 +3868,7 @@ "model.layers.29.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3907,7 +3892,7 @@ "model.layers.3.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -3931,7 +3916,7 @@ "model.layers.3.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3955,7 +3940,7 @@ "model.layers.3.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3979,7 +3964,7 @@ "model.layers.3.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4003,7 +3988,7 @@ "model.layers.3.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4027,7 +4012,7 @@ "model.layers.3.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4051,7 +4036,7 @@ "model.layers.3.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4075,7 +4060,7 @@ "model.layers.30.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -4099,7 +4084,7 @@ "model.layers.30.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4123,7 +4108,7 @@ "model.layers.30.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4147,7 +4132,7 @@ "model.layers.30.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4171,7 +4156,7 @@ "model.layers.30.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4195,7 +4180,7 @@ "model.layers.30.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4219,7 +4204,7 @@ "model.layers.30.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4243,7 +4228,7 @@ "model.layers.31.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -4267,7 +4252,7 @@ "model.layers.31.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4291,7 +4276,7 @@ "model.layers.31.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4315,7 +4300,7 @@ "model.layers.31.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4339,7 +4324,7 @@ "model.layers.31.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4363,7 +4348,7 @@ "model.layers.31.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4387,7 +4372,7 @@ "model.layers.31.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4411,7 +4396,7 @@ "model.layers.32.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -4435,7 +4420,7 @@ "model.layers.32.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4459,7 +4444,7 @@ "model.layers.32.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4483,7 +4468,7 @@ "model.layers.32.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4507,7 +4492,7 @@ "model.layers.32.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4531,7 +4516,7 @@ "model.layers.32.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4555,7 +4540,7 @@ "model.layers.32.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4579,7 +4564,7 @@ "model.layers.33.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -4603,7 +4588,7 @@ "model.layers.33.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4627,7 +4612,7 @@ "model.layers.33.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4651,7 +4636,7 @@ "model.layers.33.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4675,7 +4660,7 @@ "model.layers.33.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4699,7 +4684,7 @@ "model.layers.33.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4723,7 +4708,7 @@ "model.layers.33.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4747,7 +4732,7 @@ "model.layers.34.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -4771,7 +4756,7 @@ "model.layers.34.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4795,7 +4780,7 @@ "model.layers.34.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4819,7 +4804,7 @@ "model.layers.34.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4843,7 +4828,7 @@ "model.layers.34.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4867,7 +4852,7 @@ "model.layers.34.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4891,7 +4876,7 @@ "model.layers.34.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4915,7 +4900,7 @@ "model.layers.35.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -4939,7 +4924,7 @@ "model.layers.35.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4963,7 +4948,7 @@ "model.layers.35.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4987,7 +4972,7 @@ "model.layers.35.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5011,7 +4996,7 @@ "model.layers.35.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5035,7 +5020,7 @@ "model.layers.35.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5059,7 +5044,7 @@ "model.layers.35.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5083,7 +5068,7 @@ "model.layers.36.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -5107,7 +5092,7 @@ "model.layers.36.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5131,7 +5116,7 @@ "model.layers.36.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5155,7 +5140,7 @@ "model.layers.36.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5179,7 +5164,7 @@ "model.layers.36.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5203,7 +5188,7 @@ "model.layers.36.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5227,7 +5212,7 @@ "model.layers.36.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5251,7 +5236,7 @@ "model.layers.37.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -5275,7 +5260,7 @@ "model.layers.37.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5299,7 +5284,7 @@ "model.layers.37.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5323,7 +5308,7 @@ "model.layers.37.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5347,7 +5332,7 @@ "model.layers.37.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5371,7 +5356,7 @@ "model.layers.37.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5395,7 +5380,7 @@ "model.layers.37.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5419,7 +5404,7 @@ "model.layers.38.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -5443,7 +5428,7 @@ "model.layers.38.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5467,7 +5452,7 @@ "model.layers.38.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5491,7 +5476,7 @@ "model.layers.38.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5515,7 +5500,7 @@ "model.layers.38.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5539,7 +5524,7 @@ "model.layers.38.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5563,7 +5548,7 @@ "model.layers.38.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5587,7 +5572,7 @@ "model.layers.39.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -5611,7 +5596,7 @@ "model.layers.39.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5635,7 +5620,7 @@ "model.layers.39.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5659,7 +5644,7 @@ "model.layers.39.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5683,7 +5668,7 @@ "model.layers.39.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5707,7 +5692,7 @@ "model.layers.39.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5731,7 +5716,7 @@ "model.layers.39.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5755,7 +5740,7 @@ "model.layers.4.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -5779,7 +5764,7 @@ "model.layers.4.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5803,7 +5788,7 @@ "model.layers.4.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5827,7 +5812,7 @@ "model.layers.4.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5851,7 +5836,7 @@ "model.layers.4.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5875,7 +5860,7 @@ "model.layers.4.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5899,7 +5884,7 @@ "model.layers.4.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5923,7 +5908,7 @@ "model.layers.40.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -5947,7 +5932,7 @@ "model.layers.40.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5971,7 +5956,7 @@ "model.layers.40.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5995,7 +5980,7 @@ "model.layers.40.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6019,7 +6004,7 @@ "model.layers.40.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6043,7 +6028,7 @@ "model.layers.40.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6067,7 +6052,7 @@ "model.layers.40.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6091,7 +6076,7 @@ "model.layers.41.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -6115,7 +6100,7 @@ "model.layers.41.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6139,7 +6124,7 @@ "model.layers.41.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6163,7 +6148,7 @@ "model.layers.41.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6187,7 +6172,7 @@ "model.layers.41.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6211,7 +6196,7 @@ "model.layers.41.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6235,7 +6220,7 @@ "model.layers.41.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6259,7 +6244,7 @@ "model.layers.42.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -6283,7 +6268,7 @@ "model.layers.42.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6307,7 +6292,7 @@ "model.layers.42.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6331,7 +6316,7 @@ "model.layers.42.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6355,7 +6340,7 @@ "model.layers.42.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6379,7 +6364,7 @@ "model.layers.42.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6403,7 +6388,7 @@ "model.layers.42.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6427,7 +6412,7 @@ "model.layers.43.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -6451,7 +6436,7 @@ "model.layers.43.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6475,7 +6460,7 @@ "model.layers.43.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6499,7 +6484,7 @@ "model.layers.43.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6523,7 +6508,7 @@ "model.layers.43.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6547,7 +6532,7 @@ "model.layers.43.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6571,7 +6556,7 @@ "model.layers.43.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6595,7 +6580,7 @@ "model.layers.44.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -6619,7 +6604,7 @@ "model.layers.44.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6643,7 +6628,7 @@ "model.layers.44.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6667,7 +6652,7 @@ "model.layers.44.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6691,7 +6676,7 @@ "model.layers.44.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6715,7 +6700,7 @@ "model.layers.44.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6739,7 +6724,7 @@ "model.layers.44.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6763,7 +6748,7 @@ "model.layers.45.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -6787,7 +6772,7 @@ "model.layers.45.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6811,7 +6796,7 @@ "model.layers.45.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6835,7 +6820,7 @@ "model.layers.45.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6859,7 +6844,7 @@ "model.layers.45.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6883,7 +6868,7 @@ "model.layers.45.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6907,7 +6892,7 @@ "model.layers.45.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6931,7 +6916,7 @@ "model.layers.46.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -6955,7 +6940,7 @@ "model.layers.46.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6979,7 +6964,7 @@ "model.layers.46.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7003,7 +6988,7 @@ "model.layers.46.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7027,7 +7012,7 @@ "model.layers.46.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7051,7 +7036,7 @@ "model.layers.46.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7075,7 +7060,7 @@ "model.layers.46.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7099,7 +7084,7 @@ "model.layers.47.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -7123,7 +7108,7 @@ "model.layers.47.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7147,7 +7132,7 @@ "model.layers.47.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7171,7 +7156,7 @@ "model.layers.47.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7195,7 +7180,7 @@ "model.layers.47.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7219,7 +7204,7 @@ "model.layers.47.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7243,7 +7228,7 @@ "model.layers.47.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7267,7 +7252,7 @@ "model.layers.48.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -7291,7 +7276,7 @@ "model.layers.48.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7315,7 +7300,7 @@ "model.layers.48.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7339,7 +7324,7 @@ "model.layers.48.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7363,7 +7348,7 @@ "model.layers.48.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7387,7 +7372,7 @@ "model.layers.48.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7411,7 +7396,7 @@ "model.layers.48.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7435,7 +7420,7 @@ "model.layers.49.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -7459,7 +7444,7 @@ "model.layers.49.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7483,7 +7468,7 @@ "model.layers.49.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7507,7 +7492,7 @@ "model.layers.49.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7531,7 +7516,7 @@ "model.layers.49.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7555,7 +7540,7 @@ "model.layers.49.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7579,7 +7564,7 @@ "model.layers.49.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7603,7 +7588,7 @@ "model.layers.5.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -7627,7 +7612,7 @@ "model.layers.5.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7651,7 +7636,7 @@ "model.layers.5.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7675,7 +7660,7 @@ "model.layers.5.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7699,7 +7684,7 @@ "model.layers.5.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7723,7 +7708,7 @@ "model.layers.5.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7747,7 +7732,7 @@ "model.layers.5.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7771,7 +7756,7 @@ "model.layers.50.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -7795,7 +7780,7 @@ "model.layers.50.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7819,7 +7804,7 @@ "model.layers.50.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7843,7 +7828,7 @@ "model.layers.50.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7867,7 +7852,7 @@ "model.layers.50.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7891,7 +7876,7 @@ "model.layers.50.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7915,7 +7900,7 @@ "model.layers.50.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7939,7 +7924,7 @@ "model.layers.51.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -7963,7 +7948,7 @@ "model.layers.51.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7987,7 +7972,7 @@ "model.layers.51.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8011,7 +7996,7 @@ "model.layers.51.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8035,7 +8020,7 @@ "model.layers.51.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8059,7 +8044,7 @@ "model.layers.51.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8083,7 +8068,7 @@ "model.layers.51.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8107,7 +8092,7 @@ "model.layers.52.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -8131,7 +8116,7 @@ "model.layers.52.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8155,7 +8140,7 @@ "model.layers.52.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8179,7 +8164,7 @@ "model.layers.52.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8203,7 +8188,7 @@ "model.layers.52.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8227,7 +8212,7 @@ "model.layers.52.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8251,7 +8236,7 @@ "model.layers.52.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8275,7 +8260,7 @@ "model.layers.53.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -8299,7 +8284,7 @@ "model.layers.53.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8323,7 +8308,7 @@ "model.layers.53.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8347,7 +8332,7 @@ "model.layers.53.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8371,7 +8356,7 @@ "model.layers.53.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8395,7 +8380,7 @@ "model.layers.53.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8419,7 +8404,7 @@ "model.layers.53.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8443,7 +8428,7 @@ "model.layers.54.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -8467,7 +8452,7 @@ "model.layers.54.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8491,7 +8476,7 @@ "model.layers.54.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8515,7 +8500,7 @@ "model.layers.54.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8539,7 +8524,7 @@ "model.layers.54.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8563,7 +8548,7 @@ "model.layers.54.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8587,7 +8572,7 @@ "model.layers.54.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8611,7 +8596,7 @@ "model.layers.55.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -8635,7 +8620,7 @@ "model.layers.55.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8659,7 +8644,7 @@ "model.layers.55.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8683,7 +8668,7 @@ "model.layers.55.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8707,7 +8692,7 @@ "model.layers.55.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8731,7 +8716,7 @@ "model.layers.55.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8755,7 +8740,7 @@ "model.layers.55.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8779,7 +8764,7 @@ "model.layers.56.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -8803,7 +8788,7 @@ "model.layers.56.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8827,7 +8812,7 @@ "model.layers.56.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8851,7 +8836,7 @@ "model.layers.56.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8875,7 +8860,7 @@ "model.layers.56.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8899,7 +8884,7 @@ "model.layers.56.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8923,7 +8908,7 @@ "model.layers.56.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8947,7 +8932,7 @@ "model.layers.57.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -8971,7 +8956,7 @@ "model.layers.57.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8995,7 +8980,7 @@ "model.layers.57.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9019,7 +9004,7 @@ "model.layers.57.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9043,7 +9028,7 @@ "model.layers.57.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9067,7 +9052,7 @@ "model.layers.57.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9091,7 +9076,7 @@ "model.layers.57.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9115,7 +9100,7 @@ "model.layers.58.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -9139,7 +9124,7 @@ "model.layers.58.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9163,7 +9148,7 @@ "model.layers.58.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9187,7 +9172,7 @@ "model.layers.58.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9211,7 +9196,7 @@ "model.layers.58.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9235,7 +9220,7 @@ "model.layers.58.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9259,7 +9244,7 @@ "model.layers.58.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9283,7 +9268,7 @@ "model.layers.59.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -9307,7 +9292,7 @@ "model.layers.59.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9331,7 +9316,7 @@ "model.layers.59.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9355,7 +9340,7 @@ "model.layers.59.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9379,7 +9364,7 @@ "model.layers.59.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9403,7 +9388,7 @@ "model.layers.59.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9427,7 +9412,7 @@ "model.layers.59.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9451,7 +9436,7 @@ "model.layers.6.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -9475,7 +9460,7 @@ "model.layers.6.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9499,7 +9484,7 @@ "model.layers.6.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9523,7 +9508,7 @@ "model.layers.6.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9547,7 +9532,7 @@ "model.layers.6.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9571,7 +9556,7 @@ "model.layers.6.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9595,7 +9580,7 @@ "model.layers.6.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9619,7 +9604,7 @@ "model.layers.60.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -9643,7 +9628,7 @@ "model.layers.60.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9667,7 +9652,7 @@ "model.layers.60.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9691,7 +9676,7 @@ "model.layers.60.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9715,7 +9700,7 @@ "model.layers.60.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9739,7 +9724,7 @@ "model.layers.60.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9763,7 +9748,7 @@ "model.layers.60.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9787,7 +9772,7 @@ "model.layers.61.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -9811,7 +9796,7 @@ "model.layers.61.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9835,7 +9820,7 @@ "model.layers.61.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9859,7 +9844,7 @@ "model.layers.61.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9883,7 +9868,7 @@ "model.layers.61.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9907,7 +9892,7 @@ "model.layers.61.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9931,7 +9916,7 @@ "model.layers.61.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9955,7 +9940,7 @@ "model.layers.62.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -9979,7 +9964,7 @@ "model.layers.62.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10003,7 +9988,7 @@ "model.layers.62.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10027,7 +10012,7 @@ "model.layers.62.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10051,7 +10036,7 @@ "model.layers.62.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10075,7 +10060,7 @@ "model.layers.62.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10099,7 +10084,7 @@ "model.layers.62.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10123,7 +10108,7 @@ "model.layers.63.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -10147,7 +10132,7 @@ "model.layers.63.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10171,7 +10156,7 @@ "model.layers.63.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10195,7 +10180,7 @@ "model.layers.63.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10219,7 +10204,7 @@ "model.layers.63.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10243,7 +10228,7 @@ "model.layers.63.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10267,7 +10252,7 @@ "model.layers.63.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10291,7 +10276,7 @@ "model.layers.64.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -10315,7 +10300,7 @@ "model.layers.64.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10339,7 +10324,7 @@ "model.layers.64.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10363,7 +10348,7 @@ "model.layers.64.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10387,7 +10372,7 @@ "model.layers.64.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10411,7 +10396,7 @@ "model.layers.64.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10435,7 +10420,7 @@ "model.layers.64.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10459,7 +10444,7 @@ "model.layers.65.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -10483,7 +10468,7 @@ "model.layers.65.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10507,7 +10492,7 @@ "model.layers.65.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10531,7 +10516,7 @@ "model.layers.65.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10555,7 +10540,7 @@ "model.layers.65.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10579,7 +10564,7 @@ "model.layers.65.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10603,7 +10588,7 @@ "model.layers.65.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10627,7 +10612,7 @@ "model.layers.66.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -10651,7 +10636,7 @@ "model.layers.66.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10675,7 +10660,7 @@ "model.layers.66.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10699,7 +10684,7 @@ "model.layers.66.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10723,7 +10708,7 @@ "model.layers.66.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10747,7 +10732,7 @@ "model.layers.66.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10771,7 +10756,7 @@ "model.layers.66.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10795,7 +10780,7 @@ "model.layers.67.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -10819,7 +10804,7 @@ "model.layers.67.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10843,7 +10828,7 @@ "model.layers.67.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10867,7 +10852,7 @@ "model.layers.67.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10891,7 +10876,7 @@ "model.layers.67.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10915,7 +10900,7 @@ "model.layers.67.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10939,7 +10924,7 @@ "model.layers.67.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10963,7 +10948,7 @@ "model.layers.68.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -10987,7 +10972,7 @@ "model.layers.68.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11011,7 +10996,7 @@ "model.layers.68.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11035,7 +11020,7 @@ "model.layers.68.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11059,7 +11044,7 @@ "model.layers.68.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11083,7 +11068,7 @@ "model.layers.68.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11107,7 +11092,7 @@ "model.layers.68.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11131,7 +11116,7 @@ "model.layers.69.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -11155,7 +11140,7 @@ "model.layers.69.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11179,7 +11164,7 @@ "model.layers.69.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11203,7 +11188,7 @@ "model.layers.69.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11227,7 +11212,7 @@ "model.layers.69.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11251,7 +11236,7 @@ "model.layers.69.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11275,7 +11260,7 @@ "model.layers.69.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11299,7 +11284,7 @@ "model.layers.7.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -11323,7 +11308,7 @@ "model.layers.7.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11347,7 +11332,7 @@ "model.layers.7.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11371,7 +11356,7 @@ "model.layers.7.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11395,7 +11380,7 @@ "model.layers.7.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11419,7 +11404,7 @@ "model.layers.7.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11443,7 +11428,7 @@ "model.layers.7.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11467,7 +11452,7 @@ "model.layers.70.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -11491,7 +11476,7 @@ "model.layers.70.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11515,7 +11500,7 @@ "model.layers.70.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11539,7 +11524,7 @@ "model.layers.70.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11563,7 +11548,7 @@ "model.layers.70.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11587,7 +11572,7 @@ "model.layers.70.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11611,7 +11596,7 @@ "model.layers.70.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11635,7 +11620,7 @@ "model.layers.71.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -11659,7 +11644,7 @@ "model.layers.71.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11683,7 +11668,7 @@ "model.layers.71.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11707,7 +11692,7 @@ "model.layers.71.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11731,7 +11716,7 @@ "model.layers.71.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11755,7 +11740,7 @@ "model.layers.71.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11779,7 +11764,7 @@ "model.layers.71.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11803,7 +11788,7 @@ "model.layers.72.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -11827,7 +11812,7 @@ "model.layers.72.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11851,7 +11836,7 @@ "model.layers.72.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11875,7 +11860,7 @@ "model.layers.72.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11899,7 +11884,7 @@ "model.layers.72.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11923,7 +11908,7 @@ "model.layers.72.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11947,7 +11932,7 @@ "model.layers.72.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11971,7 +11956,7 @@ "model.layers.73.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -11995,7 +11980,7 @@ "model.layers.73.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12019,7 +12004,7 @@ "model.layers.73.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12043,7 +12028,7 @@ "model.layers.73.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12067,7 +12052,7 @@ "model.layers.73.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12091,7 +12076,7 @@ "model.layers.73.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12115,7 +12100,7 @@ "model.layers.73.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12139,7 +12124,7 @@ "model.layers.74.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -12163,7 +12148,7 @@ "model.layers.74.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12187,7 +12172,7 @@ "model.layers.74.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12211,7 +12196,7 @@ "model.layers.74.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12235,7 +12220,7 @@ "model.layers.74.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12259,7 +12244,7 @@ "model.layers.74.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12283,7 +12268,7 @@ "model.layers.74.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12307,7 +12292,7 @@ "model.layers.75.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -12331,7 +12316,7 @@ "model.layers.75.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12355,7 +12340,7 @@ "model.layers.75.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12379,7 +12364,7 @@ "model.layers.75.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12403,7 +12388,7 @@ "model.layers.75.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12427,7 +12412,7 @@ "model.layers.75.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12451,7 +12436,7 @@ "model.layers.75.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12475,7 +12460,7 @@ "model.layers.76.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -12499,7 +12484,7 @@ "model.layers.76.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12523,7 +12508,7 @@ "model.layers.76.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12547,7 +12532,7 @@ "model.layers.76.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12571,7 +12556,7 @@ "model.layers.76.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12595,7 +12580,7 @@ "model.layers.76.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12619,7 +12604,7 @@ "model.layers.76.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12643,7 +12628,7 @@ "model.layers.77.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -12667,7 +12652,7 @@ "model.layers.77.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12691,7 +12676,7 @@ "model.layers.77.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12715,7 +12700,7 @@ "model.layers.77.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12739,7 +12724,7 @@ "model.layers.77.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12763,7 +12748,7 @@ "model.layers.77.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12787,7 +12772,7 @@ "model.layers.77.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12811,7 +12796,7 @@ "model.layers.78.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -12835,7 +12820,7 @@ "model.layers.78.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12859,7 +12844,7 @@ "model.layers.78.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12883,7 +12868,7 @@ "model.layers.78.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12907,7 +12892,7 @@ "model.layers.78.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12931,7 +12916,7 @@ "model.layers.78.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12955,7 +12940,7 @@ "model.layers.78.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12979,7 +12964,7 @@ "model.layers.79.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -13003,7 +12988,7 @@ "model.layers.79.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13027,7 +13012,7 @@ "model.layers.79.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13051,7 +13036,7 @@ "model.layers.79.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13075,7 +13060,7 @@ "model.layers.79.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13099,7 +13084,7 @@ "model.layers.79.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13123,7 +13108,7 @@ "model.layers.79.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13147,7 +13132,7 @@ "model.layers.8.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -13171,7 +13156,7 @@ "model.layers.8.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13195,7 +13180,7 @@ "model.layers.8.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13219,7 +13204,7 @@ "model.layers.8.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13243,7 +13228,7 @@ "model.layers.8.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13267,7 +13252,7 @@ "model.layers.8.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13291,7 +13276,7 @@ "model.layers.8.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13315,7 +13300,7 @@ "model.layers.9.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -13339,7 +13324,7 @@ "model.layers.9.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13363,7 +13348,7 @@ "model.layers.9.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13387,7 +13372,7 @@ "model.layers.9.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13411,7 +13396,7 @@ "model.layers.9.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13435,7 +13420,7 @@ "model.layers.9.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13459,7 +13444,7 @@ "model.layers.9.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13480,6 +13465,21 @@ 8 ] } - } - } -} \ No newline at end of file + }, + "quant_method": "vptq" + }, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "torch_dtype": "bfloat16", + "transformers_version": "4.49.0", + "use_cache": true, + "vocab_size": 128256 +}