diff --git "a/config.json" "b/config.json" --- "a/config.json" +++ "b/config.json" @@ -1,5 +1,5 @@ { - "_name_or_path": "meta-llama/Meta-Llama-3.1-70B-Instruct", + "_name_or_path": "/home/aiscuser/yangwang/convert_model/models/VPTQ-community--Meta-Llama-3.1-70B-Instruct-v16-k65536-32768-woft", "architectures": [ "LlamaForCausalLM" ], @@ -11,6 +11,7 @@ 128008, 128009 ], + "head_dim": 128, "hidden_act": "silu", "hidden_size": 8192, "initializer_range": 0.02, @@ -22,27 +23,12 @@ "num_hidden_layers": 80, "num_key_value_heads": 8, "pretraining_tp": 1, - "rms_norm_eps": 1e-05, - "rope_scaling": { - "factor": 8.0, - "high_freq_factor": 4.0, - "low_freq_factor": 1.0, - "original_max_position_embeddings": 8192, - "rope_type": "llama3" - }, - "rope_theta": 500000.0, - "tie_word_embeddings": false, - "torch_dtype": "bfloat16", - "transformers_version": "4.44.2", - "use_cache": true, - "vocab_size": 128256, "quantization_config": { - "quant_method": "vptq", "config_for_layers": { "model.layers.0.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -66,7 +52,7 @@ "model.layers.0.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -90,7 +76,7 @@ "model.layers.0.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -114,7 +100,7 @@ "model.layers.0.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -138,7 +124,7 @@ "model.layers.0.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -162,7 +148,7 @@ "model.layers.0.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -186,7 +172,7 @@ "model.layers.0.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -210,7 +196,7 @@ "model.layers.1.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -234,7 +220,7 @@ "model.layers.1.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -258,7 +244,7 @@ "model.layers.1.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -282,7 +268,7 @@ "model.layers.1.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -306,7 +292,7 @@ "model.layers.1.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -330,7 +316,7 @@ "model.layers.1.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -354,7 +340,7 @@ "model.layers.1.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -378,7 +364,7 @@ "model.layers.10.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -402,7 +388,7 @@ "model.layers.10.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -426,7 +412,7 @@ "model.layers.10.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -450,7 +436,7 @@ "model.layers.10.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -474,7 +460,7 @@ "model.layers.10.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -498,7 +484,7 @@ "model.layers.10.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -522,7 +508,7 @@ "model.layers.10.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -546,7 +532,7 @@ "model.layers.11.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -570,7 +556,7 @@ "model.layers.11.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -594,7 +580,7 @@ "model.layers.11.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -618,7 +604,7 @@ "model.layers.11.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -642,7 +628,7 @@ "model.layers.11.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -666,7 +652,7 @@ "model.layers.11.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -690,7 +676,7 @@ "model.layers.11.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -714,7 +700,7 @@ "model.layers.12.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -738,7 +724,7 @@ "model.layers.12.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -762,7 +748,7 @@ "model.layers.12.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -786,7 +772,7 @@ "model.layers.12.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -810,7 +796,7 @@ "model.layers.12.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -834,7 +820,7 @@ "model.layers.12.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -858,7 +844,7 @@ "model.layers.12.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -882,7 +868,7 @@ "model.layers.13.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -906,7 +892,7 @@ "model.layers.13.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -930,7 +916,7 @@ "model.layers.13.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -954,7 +940,7 @@ "model.layers.13.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -978,7 +964,7 @@ "model.layers.13.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1002,7 +988,7 @@ "model.layers.13.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1026,7 +1012,7 @@ "model.layers.13.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1050,7 +1036,7 @@ "model.layers.14.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -1074,7 +1060,7 @@ "model.layers.14.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1098,7 +1084,7 @@ "model.layers.14.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1122,7 +1108,7 @@ "model.layers.14.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1146,7 +1132,7 @@ "model.layers.14.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1170,7 +1156,7 @@ "model.layers.14.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1194,7 +1180,7 @@ "model.layers.14.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1218,7 +1204,7 @@ "model.layers.15.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -1242,7 +1228,7 @@ "model.layers.15.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1266,7 +1252,7 @@ "model.layers.15.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1290,7 +1276,7 @@ "model.layers.15.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1314,7 +1300,7 @@ "model.layers.15.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1338,7 +1324,7 @@ "model.layers.15.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1362,7 +1348,7 @@ "model.layers.15.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1386,7 +1372,7 @@ "model.layers.16.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -1410,7 +1396,7 @@ "model.layers.16.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1434,7 +1420,7 @@ "model.layers.16.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1458,7 +1444,7 @@ "model.layers.16.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1482,7 +1468,7 @@ "model.layers.16.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1506,7 +1492,7 @@ "model.layers.16.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1530,7 +1516,7 @@ "model.layers.16.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1554,7 +1540,7 @@ "model.layers.17.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -1578,7 +1564,7 @@ "model.layers.17.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1602,7 +1588,7 @@ "model.layers.17.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1626,7 +1612,7 @@ "model.layers.17.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1650,7 +1636,7 @@ "model.layers.17.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1674,7 +1660,7 @@ "model.layers.17.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1698,7 +1684,7 @@ "model.layers.17.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1722,7 +1708,7 @@ "model.layers.18.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -1746,7 +1732,7 @@ "model.layers.18.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1770,7 +1756,7 @@ "model.layers.18.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1794,7 +1780,7 @@ "model.layers.18.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1818,7 +1804,7 @@ "model.layers.18.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1842,7 +1828,7 @@ "model.layers.18.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1866,7 +1852,7 @@ "model.layers.18.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1890,7 +1876,7 @@ "model.layers.19.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -1914,7 +1900,7 @@ "model.layers.19.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1938,7 +1924,7 @@ "model.layers.19.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1962,7 +1948,7 @@ "model.layers.19.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -1986,7 +1972,7 @@ "model.layers.19.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2010,7 +1996,7 @@ "model.layers.19.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2034,7 +2020,7 @@ "model.layers.19.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2058,7 +2044,7 @@ "model.layers.2.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -2082,7 +2068,7 @@ "model.layers.2.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2106,7 +2092,7 @@ "model.layers.2.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2130,7 +2116,7 @@ "model.layers.2.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2154,7 +2140,7 @@ "model.layers.2.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2178,7 +2164,7 @@ "model.layers.2.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2202,7 +2188,7 @@ "model.layers.2.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2226,7 +2212,7 @@ "model.layers.20.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -2250,7 +2236,7 @@ "model.layers.20.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2274,7 +2260,7 @@ "model.layers.20.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2298,7 +2284,7 @@ "model.layers.20.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2322,7 +2308,7 @@ "model.layers.20.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2346,7 +2332,7 @@ "model.layers.20.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2370,7 +2356,7 @@ "model.layers.20.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2394,7 +2380,7 @@ "model.layers.21.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -2418,7 +2404,7 @@ "model.layers.21.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2442,7 +2428,7 @@ "model.layers.21.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2466,7 +2452,7 @@ "model.layers.21.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2490,7 +2476,7 @@ "model.layers.21.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2514,7 +2500,7 @@ "model.layers.21.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2538,7 +2524,7 @@ "model.layers.21.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2562,7 +2548,7 @@ "model.layers.22.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -2586,7 +2572,7 @@ "model.layers.22.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2610,7 +2596,7 @@ "model.layers.22.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2634,7 +2620,7 @@ "model.layers.22.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2658,7 +2644,7 @@ "model.layers.22.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2682,7 +2668,7 @@ "model.layers.22.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2706,7 +2692,7 @@ "model.layers.22.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2730,7 +2716,7 @@ "model.layers.23.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -2754,7 +2740,7 @@ "model.layers.23.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2778,7 +2764,7 @@ "model.layers.23.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2802,7 +2788,7 @@ "model.layers.23.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2826,7 +2812,7 @@ "model.layers.23.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2850,7 +2836,7 @@ "model.layers.23.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2874,7 +2860,7 @@ "model.layers.23.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2898,7 +2884,7 @@ "model.layers.24.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -2922,7 +2908,7 @@ "model.layers.24.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2946,7 +2932,7 @@ "model.layers.24.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2970,7 +2956,7 @@ "model.layers.24.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -2994,7 +2980,7 @@ "model.layers.24.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3018,7 +3004,7 @@ "model.layers.24.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3042,7 +3028,7 @@ "model.layers.24.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3066,7 +3052,7 @@ "model.layers.25.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -3090,7 +3076,7 @@ "model.layers.25.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3114,7 +3100,7 @@ "model.layers.25.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3138,7 +3124,7 @@ "model.layers.25.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3162,7 +3148,7 @@ "model.layers.25.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3186,7 +3172,7 @@ "model.layers.25.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3210,7 +3196,7 @@ "model.layers.25.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3234,7 +3220,7 @@ "model.layers.26.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -3258,7 +3244,7 @@ "model.layers.26.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3282,7 +3268,7 @@ "model.layers.26.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3306,7 +3292,7 @@ "model.layers.26.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3330,7 +3316,7 @@ "model.layers.26.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3354,7 +3340,7 @@ "model.layers.26.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3378,7 +3364,7 @@ "model.layers.26.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3402,7 +3388,7 @@ "model.layers.27.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -3426,7 +3412,7 @@ "model.layers.27.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3450,7 +3436,7 @@ "model.layers.27.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3474,7 +3460,7 @@ "model.layers.27.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3498,7 +3484,7 @@ "model.layers.27.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3522,7 +3508,7 @@ "model.layers.27.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3546,7 +3532,7 @@ "model.layers.27.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3570,7 +3556,7 @@ "model.layers.28.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -3594,7 +3580,7 @@ "model.layers.28.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3618,7 +3604,7 @@ "model.layers.28.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3642,7 +3628,7 @@ "model.layers.28.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3666,7 +3652,7 @@ "model.layers.28.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3690,7 +3676,7 @@ "model.layers.28.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3714,7 +3700,7 @@ "model.layers.28.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3738,7 +3724,7 @@ "model.layers.29.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -3762,7 +3748,7 @@ "model.layers.29.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3786,7 +3772,7 @@ "model.layers.29.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3810,7 +3796,7 @@ "model.layers.29.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3834,7 +3820,7 @@ "model.layers.29.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3858,7 +3844,7 @@ "model.layers.29.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3882,7 +3868,7 @@ "model.layers.29.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3906,7 +3892,7 @@ "model.layers.3.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -3930,7 +3916,7 @@ "model.layers.3.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3954,7 +3940,7 @@ "model.layers.3.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -3978,7 +3964,7 @@ "model.layers.3.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4002,7 +3988,7 @@ "model.layers.3.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4026,7 +4012,7 @@ "model.layers.3.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4050,7 +4036,7 @@ "model.layers.3.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4074,7 +4060,7 @@ "model.layers.30.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -4098,7 +4084,7 @@ "model.layers.30.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4122,7 +4108,7 @@ "model.layers.30.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4146,7 +4132,7 @@ "model.layers.30.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4170,7 +4156,7 @@ "model.layers.30.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4194,7 +4180,7 @@ "model.layers.30.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4218,7 +4204,7 @@ "model.layers.30.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4242,7 +4228,7 @@ "model.layers.31.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -4266,7 +4252,7 @@ "model.layers.31.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4290,7 +4276,7 @@ "model.layers.31.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4314,7 +4300,7 @@ "model.layers.31.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4338,7 +4324,7 @@ "model.layers.31.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4362,7 +4348,7 @@ "model.layers.31.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4386,7 +4372,7 @@ "model.layers.31.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4410,7 +4396,7 @@ "model.layers.32.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -4434,7 +4420,7 @@ "model.layers.32.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4458,7 +4444,7 @@ "model.layers.32.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4482,7 +4468,7 @@ "model.layers.32.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4506,7 +4492,7 @@ "model.layers.32.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4530,7 +4516,7 @@ "model.layers.32.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4554,7 +4540,7 @@ "model.layers.32.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4578,7 +4564,7 @@ "model.layers.33.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -4602,7 +4588,7 @@ "model.layers.33.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4626,7 +4612,7 @@ "model.layers.33.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4650,7 +4636,7 @@ "model.layers.33.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4674,7 +4660,7 @@ "model.layers.33.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4698,7 +4684,7 @@ "model.layers.33.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4722,7 +4708,7 @@ "model.layers.33.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4746,7 +4732,7 @@ "model.layers.34.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -4770,7 +4756,7 @@ "model.layers.34.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4794,7 +4780,7 @@ "model.layers.34.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4818,7 +4804,7 @@ "model.layers.34.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4842,7 +4828,7 @@ "model.layers.34.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4866,7 +4852,7 @@ "model.layers.34.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4890,7 +4876,7 @@ "model.layers.34.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4914,7 +4900,7 @@ "model.layers.35.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -4938,7 +4924,7 @@ "model.layers.35.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4962,7 +4948,7 @@ "model.layers.35.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -4986,7 +4972,7 @@ "model.layers.35.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5010,7 +4996,7 @@ "model.layers.35.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5034,7 +5020,7 @@ "model.layers.35.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5058,7 +5044,7 @@ "model.layers.35.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5082,7 +5068,7 @@ "model.layers.36.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -5106,7 +5092,7 @@ "model.layers.36.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5130,7 +5116,7 @@ "model.layers.36.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5154,7 +5140,7 @@ "model.layers.36.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5178,7 +5164,7 @@ "model.layers.36.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5202,7 +5188,7 @@ "model.layers.36.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5226,7 +5212,7 @@ "model.layers.36.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5250,7 +5236,7 @@ "model.layers.37.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -5274,7 +5260,7 @@ "model.layers.37.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5298,7 +5284,7 @@ "model.layers.37.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5322,7 +5308,7 @@ "model.layers.37.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5346,7 +5332,7 @@ "model.layers.37.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5370,7 +5356,7 @@ "model.layers.37.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5394,7 +5380,7 @@ "model.layers.37.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5418,7 +5404,7 @@ "model.layers.38.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -5442,7 +5428,7 @@ "model.layers.38.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5466,7 +5452,7 @@ "model.layers.38.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5490,7 +5476,7 @@ "model.layers.38.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5514,7 +5500,7 @@ "model.layers.38.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5538,7 +5524,7 @@ "model.layers.38.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5562,7 +5548,7 @@ "model.layers.38.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5586,7 +5572,7 @@ "model.layers.39.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -5610,7 +5596,7 @@ "model.layers.39.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5634,7 +5620,7 @@ "model.layers.39.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5658,7 +5644,7 @@ "model.layers.39.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5682,7 +5668,7 @@ "model.layers.39.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5706,7 +5692,7 @@ "model.layers.39.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5730,7 +5716,7 @@ "model.layers.39.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5754,7 +5740,7 @@ "model.layers.4.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -5778,7 +5764,7 @@ "model.layers.4.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5802,7 +5788,7 @@ "model.layers.4.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5826,7 +5812,7 @@ "model.layers.4.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5850,7 +5836,7 @@ "model.layers.4.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5874,7 +5860,7 @@ "model.layers.4.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5898,7 +5884,7 @@ "model.layers.4.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5922,7 +5908,7 @@ "model.layers.40.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -5946,7 +5932,7 @@ "model.layers.40.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5970,7 +5956,7 @@ "model.layers.40.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -5994,7 +5980,7 @@ "model.layers.40.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6018,7 +6004,7 @@ "model.layers.40.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6042,7 +6028,7 @@ "model.layers.40.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6066,7 +6052,7 @@ "model.layers.40.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6090,7 +6076,7 @@ "model.layers.41.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -6114,7 +6100,7 @@ "model.layers.41.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6138,7 +6124,7 @@ "model.layers.41.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6162,7 +6148,7 @@ "model.layers.41.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6186,7 +6172,7 @@ "model.layers.41.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6210,7 +6196,7 @@ "model.layers.41.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6234,7 +6220,7 @@ "model.layers.41.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6258,7 +6244,7 @@ "model.layers.42.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -6282,7 +6268,7 @@ "model.layers.42.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6306,7 +6292,7 @@ "model.layers.42.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6330,7 +6316,7 @@ "model.layers.42.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6354,7 +6340,7 @@ "model.layers.42.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6378,7 +6364,7 @@ "model.layers.42.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6402,7 +6388,7 @@ "model.layers.42.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6426,7 +6412,7 @@ "model.layers.43.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -6450,7 +6436,7 @@ "model.layers.43.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6474,7 +6460,7 @@ "model.layers.43.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6498,7 +6484,7 @@ "model.layers.43.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6522,7 +6508,7 @@ "model.layers.43.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6546,7 +6532,7 @@ "model.layers.43.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6570,7 +6556,7 @@ "model.layers.43.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6594,7 +6580,7 @@ "model.layers.44.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -6618,7 +6604,7 @@ "model.layers.44.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6642,7 +6628,7 @@ "model.layers.44.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6666,7 +6652,7 @@ "model.layers.44.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6690,7 +6676,7 @@ "model.layers.44.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6714,7 +6700,7 @@ "model.layers.44.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6738,7 +6724,7 @@ "model.layers.44.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6762,7 +6748,7 @@ "model.layers.45.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -6786,7 +6772,7 @@ "model.layers.45.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6810,7 +6796,7 @@ "model.layers.45.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6834,7 +6820,7 @@ "model.layers.45.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6858,7 +6844,7 @@ "model.layers.45.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6882,7 +6868,7 @@ "model.layers.45.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6906,7 +6892,7 @@ "model.layers.45.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6930,7 +6916,7 @@ "model.layers.46.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -6954,7 +6940,7 @@ "model.layers.46.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -6978,7 +6964,7 @@ "model.layers.46.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7002,7 +6988,7 @@ "model.layers.46.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7026,7 +7012,7 @@ "model.layers.46.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7050,7 +7036,7 @@ "model.layers.46.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7074,7 +7060,7 @@ "model.layers.46.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7098,7 +7084,7 @@ "model.layers.47.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -7122,7 +7108,7 @@ "model.layers.47.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7146,7 +7132,7 @@ "model.layers.47.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7170,7 +7156,7 @@ "model.layers.47.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7194,7 +7180,7 @@ "model.layers.47.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7218,7 +7204,7 @@ "model.layers.47.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7242,7 +7228,7 @@ "model.layers.47.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7266,7 +7252,7 @@ "model.layers.48.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -7290,7 +7276,7 @@ "model.layers.48.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7314,7 +7300,7 @@ "model.layers.48.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7338,7 +7324,7 @@ "model.layers.48.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7362,7 +7348,7 @@ "model.layers.48.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7386,7 +7372,7 @@ "model.layers.48.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7410,7 +7396,7 @@ "model.layers.48.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7434,7 +7420,7 @@ "model.layers.49.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -7458,7 +7444,7 @@ "model.layers.49.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7482,7 +7468,7 @@ "model.layers.49.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7506,7 +7492,7 @@ "model.layers.49.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7530,7 +7516,7 @@ "model.layers.49.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7554,7 +7540,7 @@ "model.layers.49.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7578,7 +7564,7 @@ "model.layers.49.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7602,7 +7588,7 @@ "model.layers.5.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -7626,7 +7612,7 @@ "model.layers.5.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7650,7 +7636,7 @@ "model.layers.5.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7674,7 +7660,7 @@ "model.layers.5.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7698,7 +7684,7 @@ "model.layers.5.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7722,7 +7708,7 @@ "model.layers.5.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7746,7 +7732,7 @@ "model.layers.5.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7770,7 +7756,7 @@ "model.layers.50.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -7794,7 +7780,7 @@ "model.layers.50.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7818,7 +7804,7 @@ "model.layers.50.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7842,7 +7828,7 @@ "model.layers.50.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7866,7 +7852,7 @@ "model.layers.50.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7890,7 +7876,7 @@ "model.layers.50.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7914,7 +7900,7 @@ "model.layers.50.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7938,7 +7924,7 @@ "model.layers.51.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -7962,7 +7948,7 @@ "model.layers.51.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -7986,7 +7972,7 @@ "model.layers.51.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8010,7 +7996,7 @@ "model.layers.51.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8034,7 +8020,7 @@ "model.layers.51.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8058,7 +8044,7 @@ "model.layers.51.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8082,7 +8068,7 @@ "model.layers.51.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8106,7 +8092,7 @@ "model.layers.52.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -8130,7 +8116,7 @@ "model.layers.52.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8154,7 +8140,7 @@ "model.layers.52.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8178,7 +8164,7 @@ "model.layers.52.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8202,7 +8188,7 @@ "model.layers.52.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8226,7 +8212,7 @@ "model.layers.52.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8250,7 +8236,7 @@ "model.layers.52.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8274,7 +8260,7 @@ "model.layers.53.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -8298,7 +8284,7 @@ "model.layers.53.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8322,7 +8308,7 @@ "model.layers.53.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8346,7 +8332,7 @@ "model.layers.53.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8370,7 +8356,7 @@ "model.layers.53.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8394,7 +8380,7 @@ "model.layers.53.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8418,7 +8404,7 @@ "model.layers.53.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8442,7 +8428,7 @@ "model.layers.54.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -8466,7 +8452,7 @@ "model.layers.54.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8490,7 +8476,7 @@ "model.layers.54.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8514,7 +8500,7 @@ "model.layers.54.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8538,7 +8524,7 @@ "model.layers.54.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8562,7 +8548,7 @@ "model.layers.54.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8586,7 +8572,7 @@ "model.layers.54.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8610,7 +8596,7 @@ "model.layers.55.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -8634,7 +8620,7 @@ "model.layers.55.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8658,7 +8644,7 @@ "model.layers.55.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8682,7 +8668,7 @@ "model.layers.55.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8706,7 +8692,7 @@ "model.layers.55.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8730,7 +8716,7 @@ "model.layers.55.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8754,7 +8740,7 @@ "model.layers.55.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8778,7 +8764,7 @@ "model.layers.56.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -8802,7 +8788,7 @@ "model.layers.56.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8826,7 +8812,7 @@ "model.layers.56.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8850,7 +8836,7 @@ "model.layers.56.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8874,7 +8860,7 @@ "model.layers.56.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8898,7 +8884,7 @@ "model.layers.56.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8922,7 +8908,7 @@ "model.layers.56.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8946,7 +8932,7 @@ "model.layers.57.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -8970,7 +8956,7 @@ "model.layers.57.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -8994,7 +8980,7 @@ "model.layers.57.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9018,7 +9004,7 @@ "model.layers.57.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9042,7 +9028,7 @@ "model.layers.57.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9066,7 +9052,7 @@ "model.layers.57.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9090,7 +9076,7 @@ "model.layers.57.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9114,7 +9100,7 @@ "model.layers.58.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -9138,7 +9124,7 @@ "model.layers.58.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9162,7 +9148,7 @@ "model.layers.58.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9186,7 +9172,7 @@ "model.layers.58.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9210,7 +9196,7 @@ "model.layers.58.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9234,7 +9220,7 @@ "model.layers.58.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9258,7 +9244,7 @@ "model.layers.58.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9282,7 +9268,7 @@ "model.layers.59.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -9306,7 +9292,7 @@ "model.layers.59.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9330,7 +9316,7 @@ "model.layers.59.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9354,7 +9340,7 @@ "model.layers.59.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9378,7 +9364,7 @@ "model.layers.59.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9402,7 +9388,7 @@ "model.layers.59.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9426,7 +9412,7 @@ "model.layers.59.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9450,7 +9436,7 @@ "model.layers.6.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -9474,7 +9460,7 @@ "model.layers.6.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9498,7 +9484,7 @@ "model.layers.6.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9522,7 +9508,7 @@ "model.layers.6.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9546,7 +9532,7 @@ "model.layers.6.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9570,7 +9556,7 @@ "model.layers.6.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9594,7 +9580,7 @@ "model.layers.6.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9618,7 +9604,7 @@ "model.layers.60.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -9642,7 +9628,7 @@ "model.layers.60.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9666,7 +9652,7 @@ "model.layers.60.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9690,7 +9676,7 @@ "model.layers.60.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9714,7 +9700,7 @@ "model.layers.60.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9738,7 +9724,7 @@ "model.layers.60.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9762,7 +9748,7 @@ "model.layers.60.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9786,7 +9772,7 @@ "model.layers.61.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -9810,7 +9796,7 @@ "model.layers.61.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9834,7 +9820,7 @@ "model.layers.61.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9858,7 +9844,7 @@ "model.layers.61.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9882,7 +9868,7 @@ "model.layers.61.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9906,7 +9892,7 @@ "model.layers.61.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9930,7 +9916,7 @@ "model.layers.61.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -9954,7 +9940,7 @@ "model.layers.62.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -9978,7 +9964,7 @@ "model.layers.62.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10002,7 +9988,7 @@ "model.layers.62.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10026,7 +10012,7 @@ "model.layers.62.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10050,7 +10036,7 @@ "model.layers.62.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10074,7 +10060,7 @@ "model.layers.62.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10098,7 +10084,7 @@ "model.layers.62.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10122,7 +10108,7 @@ "model.layers.63.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -10146,7 +10132,7 @@ "model.layers.63.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10170,7 +10156,7 @@ "model.layers.63.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10194,7 +10180,7 @@ "model.layers.63.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10218,7 +10204,7 @@ "model.layers.63.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10242,7 +10228,7 @@ "model.layers.63.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10266,7 +10252,7 @@ "model.layers.63.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10290,7 +10276,7 @@ "model.layers.64.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -10314,7 +10300,7 @@ "model.layers.64.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10338,7 +10324,7 @@ "model.layers.64.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10362,7 +10348,7 @@ "model.layers.64.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10386,7 +10372,7 @@ "model.layers.64.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10410,7 +10396,7 @@ "model.layers.64.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10434,7 +10420,7 @@ "model.layers.64.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10458,7 +10444,7 @@ "model.layers.65.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -10482,7 +10468,7 @@ "model.layers.65.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10506,7 +10492,7 @@ "model.layers.65.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10530,7 +10516,7 @@ "model.layers.65.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10554,7 +10540,7 @@ "model.layers.65.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10578,7 +10564,7 @@ "model.layers.65.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10602,7 +10588,7 @@ "model.layers.65.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10626,7 +10612,7 @@ "model.layers.66.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -10650,7 +10636,7 @@ "model.layers.66.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10674,7 +10660,7 @@ "model.layers.66.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10698,7 +10684,7 @@ "model.layers.66.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10722,7 +10708,7 @@ "model.layers.66.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10746,7 +10732,7 @@ "model.layers.66.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10770,7 +10756,7 @@ "model.layers.66.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10794,7 +10780,7 @@ "model.layers.67.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -10818,7 +10804,7 @@ "model.layers.67.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10842,7 +10828,7 @@ "model.layers.67.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10866,7 +10852,7 @@ "model.layers.67.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10890,7 +10876,7 @@ "model.layers.67.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10914,7 +10900,7 @@ "model.layers.67.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10938,7 +10924,7 @@ "model.layers.67.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -10962,7 +10948,7 @@ "model.layers.68.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -10986,7 +10972,7 @@ "model.layers.68.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11010,7 +10996,7 @@ "model.layers.68.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11034,7 +11020,7 @@ "model.layers.68.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11058,7 +11044,7 @@ "model.layers.68.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11082,7 +11068,7 @@ "model.layers.68.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11106,7 +11092,7 @@ "model.layers.68.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11130,7 +11116,7 @@ "model.layers.69.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -11154,7 +11140,7 @@ "model.layers.69.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11178,7 +11164,7 @@ "model.layers.69.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11202,7 +11188,7 @@ "model.layers.69.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11226,7 +11212,7 @@ "model.layers.69.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11250,7 +11236,7 @@ "model.layers.69.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11274,7 +11260,7 @@ "model.layers.69.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11298,7 +11284,7 @@ "model.layers.7.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -11322,7 +11308,7 @@ "model.layers.7.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11346,7 +11332,7 @@ "model.layers.7.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11370,7 +11356,7 @@ "model.layers.7.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11394,7 +11380,7 @@ "model.layers.7.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11418,7 +11404,7 @@ "model.layers.7.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11442,7 +11428,7 @@ "model.layers.7.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11466,7 +11452,7 @@ "model.layers.70.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -11490,7 +11476,7 @@ "model.layers.70.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11514,7 +11500,7 @@ "model.layers.70.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11538,7 +11524,7 @@ "model.layers.70.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11562,7 +11548,7 @@ "model.layers.70.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11586,7 +11572,7 @@ "model.layers.70.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11610,7 +11596,7 @@ "model.layers.70.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11634,7 +11620,7 @@ "model.layers.71.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -11658,7 +11644,7 @@ "model.layers.71.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11682,7 +11668,7 @@ "model.layers.71.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11706,7 +11692,7 @@ "model.layers.71.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11730,7 +11716,7 @@ "model.layers.71.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11754,7 +11740,7 @@ "model.layers.71.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11778,7 +11764,7 @@ "model.layers.71.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11802,7 +11788,7 @@ "model.layers.72.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -11826,7 +11812,7 @@ "model.layers.72.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11850,7 +11836,7 @@ "model.layers.72.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11874,7 +11860,7 @@ "model.layers.72.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11898,7 +11884,7 @@ "model.layers.72.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11922,7 +11908,7 @@ "model.layers.72.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11946,7 +11932,7 @@ "model.layers.72.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -11970,7 +11956,7 @@ "model.layers.73.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -11994,7 +11980,7 @@ "model.layers.73.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12018,7 +12004,7 @@ "model.layers.73.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12042,7 +12028,7 @@ "model.layers.73.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12066,7 +12052,7 @@ "model.layers.73.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12090,7 +12076,7 @@ "model.layers.73.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12114,7 +12100,7 @@ "model.layers.73.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12138,7 +12124,7 @@ "model.layers.74.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -12162,7 +12148,7 @@ "model.layers.74.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12186,7 +12172,7 @@ "model.layers.74.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12210,7 +12196,7 @@ "model.layers.74.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12234,7 +12220,7 @@ "model.layers.74.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12258,7 +12244,7 @@ "model.layers.74.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12282,7 +12268,7 @@ "model.layers.74.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12306,7 +12292,7 @@ "model.layers.75.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -12330,7 +12316,7 @@ "model.layers.75.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12354,7 +12340,7 @@ "model.layers.75.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12378,7 +12364,7 @@ "model.layers.75.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12402,7 +12388,7 @@ "model.layers.75.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12426,7 +12412,7 @@ "model.layers.75.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12450,7 +12436,7 @@ "model.layers.75.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12474,7 +12460,7 @@ "model.layers.76.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -12498,7 +12484,7 @@ "model.layers.76.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12522,7 +12508,7 @@ "model.layers.76.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12546,7 +12532,7 @@ "model.layers.76.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12570,7 +12556,7 @@ "model.layers.76.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12594,7 +12580,7 @@ "model.layers.76.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12618,7 +12604,7 @@ "model.layers.76.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12642,7 +12628,7 @@ "model.layers.77.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -12666,7 +12652,7 @@ "model.layers.77.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12690,7 +12676,7 @@ "model.layers.77.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12714,7 +12700,7 @@ "model.layers.77.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12738,7 +12724,7 @@ "model.layers.77.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12762,7 +12748,7 @@ "model.layers.77.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12786,7 +12772,7 @@ "model.layers.77.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12810,7 +12796,7 @@ "model.layers.78.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -12834,7 +12820,7 @@ "model.layers.78.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12858,7 +12844,7 @@ "model.layers.78.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12882,7 +12868,7 @@ "model.layers.78.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12906,7 +12892,7 @@ "model.layers.78.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12930,7 +12916,7 @@ "model.layers.78.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12954,7 +12940,7 @@ "model.layers.78.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -12978,7 +12964,7 @@ "model.layers.79.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -13002,7 +12988,7 @@ "model.layers.79.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13026,7 +13012,7 @@ "model.layers.79.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13050,7 +13036,7 @@ "model.layers.79.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13074,7 +13060,7 @@ "model.layers.79.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13098,7 +13084,7 @@ "model.layers.79.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13122,7 +13108,7 @@ "model.layers.79.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13146,7 +13132,7 @@ "model.layers.8.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -13170,7 +13156,7 @@ "model.layers.8.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13194,7 +13180,7 @@ "model.layers.8.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13218,7 +13204,7 @@ "model.layers.8.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13242,7 +13228,7 @@ "model.layers.8.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13266,7 +13252,7 @@ "model.layers.8.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13290,7 +13276,7 @@ "model.layers.8.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13314,7 +13300,7 @@ "model.layers.9.mlp.down_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 28672, "in_features": 28672, @@ -13338,7 +13324,7 @@ "model.layers.9.mlp.gate_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13362,7 +13348,7 @@ "model.layers.9.mlp.up_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13386,7 +13372,7 @@ "model.layers.9.self_attn.k_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13410,7 +13396,7 @@ "model.layers.9.self_attn.o_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13434,7 +13420,7 @@ "model.layers.9.self_attn.q_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13458,7 +13444,7 @@ "model.layers.9.self_attn.v_proj": { "bias": null, "enable_norm": true, - "enable_perm": true, + "enable_perm": false, "group_num": 1, "group_size": 8192, "in_features": 8192, @@ -13479,6 +13465,21 @@ 16 ] } - } - } -} \ No newline at end of file + }, + "quant_method": "vptq" + }, + "rms_norm_eps": 1e-05, + "rope_scaling": { + "factor": 8.0, + "high_freq_factor": 4.0, + "low_freq_factor": 1.0, + "original_max_position_embeddings": 8192, + "rope_type": "llama3" + }, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "torch_dtype": "bfloat16", + "transformers_version": "4.49.0", + "use_cache": true, + "vocab_size": 128256 +}