diff --git "a/measurement.json" "b/measurement.json" --- "a/measurement.json" +++ "b/measurement.json" @@ -2,7 +2,7 @@ "measurement": { "model.layers.0.self_attn": [ { - "accuracy": 0.9515928328037262, + "accuracy": 0.9515531063079834, "total_bits": 30308928, "q_proj": { "group_size": { @@ -66,7 +66,7 @@ } }, { - "accuracy": 0.953981950879097, + "accuracy": 0.9539748653769493, "total_bits": 31455808, "q_proj": { "group_size": { @@ -130,7 +130,7 @@ } }, { - "accuracy": 0.9591670855879784, + "accuracy": 0.9591861926019192, "total_bits": 33412832, "q_proj": { "group_size": { @@ -194,7 +194,7 @@ } }, { - "accuracy": 0.9699935875833035, + "accuracy": 0.9699958208948374, "total_bits": 37983200, "q_proj": { "group_size": { @@ -258,7 +258,7 @@ } }, { - "accuracy": 0.976397393271327, + "accuracy": 0.9763969834893942, "total_bits": 44838176, "q_proj": { "group_size": { @@ -322,7 +322,7 @@ } }, { - "accuracy": 0.9767184294760227, + "accuracy": 0.9767143614590168, "total_bits": 44912768, "q_proj": { "group_size": { @@ -386,7 +386,7 @@ } }, { - "accuracy": 0.986974217928946, + "accuracy": 0.9869659701362252, "total_bits": 57355552, "q_proj": { "group_size": { @@ -438,7 +438,7 @@ } }, { - "accuracy": 0.9872219935059547, + "accuracy": 0.9872188298031688, "total_bits": 57430144, "q_proj": { "group_size": { @@ -490,7 +490,7 @@ } }, { - "accuracy": 0.9881364433094859, + "accuracy": 0.9881322896108031, "total_bits": 57950464, "q_proj": { "group_size": { @@ -542,7 +542,7 @@ } }, { - "accuracy": 0.9888399662449956, + "accuracy": 0.9888321068137884, "total_bits": 58692736, "q_proj": { "group_size": { @@ -594,7 +594,7 @@ } }, { - "accuracy": 0.9880855781957507, + "accuracy": 0.9880868950858712, "total_bits": 59068544, "q_proj": { "group_size": { @@ -658,7 +658,7 @@ } }, { - "accuracy": 0.9889282267540693, + "accuracy": 0.9889282938092947, "total_bits": 59588864, "q_proj": { "group_size": { @@ -722,7 +722,7 @@ } }, { - "accuracy": 0.9899680046364665, + "accuracy": 0.9899678928777575, "total_bits": 61536832, "q_proj": { "group_size": { @@ -783,7 +783,7 @@ } }, { - "accuracy": 0.9907521335408092, + "accuracy": 0.9907488031312823, "total_bits": 62354560, "q_proj": { "group_size": { @@ -844,7 +844,7 @@ } }, { - "accuracy": 0.9944849004969001, + "accuracy": 0.9944888786412776, "total_bits": 75246880, "q_proj": { "group_size": { @@ -905,7 +905,7 @@ } }, { - "accuracy": 0.9953417172655463, + "accuracy": 0.9953421992249787, "total_bits": 76510336, "q_proj": { "group_size": { @@ -966,7 +966,7 @@ } }, { - "accuracy": 0.9965903947595507, + "accuracy": 0.9965901931282133, "total_bits": 85667104, "q_proj": { "group_size": { @@ -1018,7 +1018,7 @@ } }, { - "accuracy": 0.9975632540881634, + "accuracy": 0.9975674538873136, "total_bits": 91722880, "q_proj": { "group_size": { @@ -1070,7 +1070,7 @@ } }, { - "accuracy": 0.9990884908474982, + "accuracy": 0.9990892710047774, "total_bits": 113978656, "q_proj": { "group_size": { @@ -1124,7 +1124,7 @@ ], "model.layers.0.mlp": [ { - "accuracy": 0.8881748169660568, + "accuracy": 0.8882661387324333, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -1176,7 +1176,7 @@ } }, { - "accuracy": 0.8919973969459534, + "accuracy": 0.8919670283794403, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -1228,7 +1228,7 @@ } }, { - "accuracy": 0.9069116935133934, + "accuracy": 0.9069375917315483, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -1277,7 +1277,7 @@ } }, { - "accuracy": 0.9124017059803009, + "accuracy": 0.9124317467212677, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -1326,7 +1326,7 @@ } }, { - "accuracy": 0.9430184848606586, + "accuracy": 0.9430231153964996, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -1378,7 +1378,7 @@ } }, { - "accuracy": 0.9480531290173531, + "accuracy": 0.9480909705162048, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -1430,7 +1430,7 @@ } }, { - "accuracy": 0.9544955678284168, + "accuracy": 0.9545128084719181, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -1479,7 +1479,7 @@ } }, { - "accuracy": 0.968281302601099, + "accuracy": 0.9682874381542206, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -1522,7 +1522,7 @@ } }, { - "accuracy": 0.9713601395487785, + "accuracy": 0.971364825963974, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -1565,7 +1565,7 @@ } }, { - "accuracy": 0.9707059450447559, + "accuracy": 0.9707299135625362, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -1617,7 +1617,7 @@ } }, { - "accuracy": 0.9745050817728043, + "accuracy": 0.974507249891758, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -1669,7 +1669,7 @@ } }, { - "accuracy": 0.9848953913897276, + "accuracy": 0.9848882537335157, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -1721,7 +1721,7 @@ } }, { - "accuracy": 0.9872103426605463, + "accuracy": 0.9872004305943847, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -1773,7 +1773,7 @@ } }, { - "accuracy": 0.9911489551886916, + "accuracy": 0.9911568406969309, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -1816,7 +1816,7 @@ } }, { - "accuracy": 0.9923222842626274, + "accuracy": 0.9923209701664746, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -1865,7 +1865,7 @@ } }, { - "accuracy": 0.9939925689250231, + "accuracy": 0.9939967971295118, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -1911,7 +1911,7 @@ } }, { - "accuracy": 0.9975718185305595, + "accuracy": 0.9975708881393075, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -1953,7 +1953,7 @@ ], "model.layers.1.self_attn": [ { - "accuracy": 0.9072708263993263, + "accuracy": 0.9073722139000893, "total_bits": 30308928, "q_proj": { "group_size": { @@ -2017,7 +2017,7 @@ } }, { - "accuracy": 0.9114431366324425, + "accuracy": 0.91156817227602, "total_bits": 31455808, "q_proj": { "group_size": { @@ -2081,7 +2081,7 @@ } }, { - "accuracy": 0.9211425334215164, + "accuracy": 0.92121671885252, "total_bits": 33412832, "q_proj": { "group_size": { @@ -2145,7 +2145,7 @@ } }, { - "accuracy": 0.940546628087759, + "accuracy": 0.9407354593276978, "total_bits": 37983200, "q_proj": { "group_size": { @@ -2209,7 +2209,7 @@ } }, { - "accuracy": 0.9535201378166676, + "accuracy": 0.9535512514412403, "total_bits": 44838176, "q_proj": { "group_size": { @@ -2273,7 +2273,7 @@ } }, { - "accuracy": 0.9539150819182396, + "accuracy": 0.953955851495266, "total_bits": 44912768, "q_proj": { "group_size": { @@ -2337,7 +2337,7 @@ } }, { - "accuracy": 0.9746329039335251, + "accuracy": 0.9746336918324232, "total_bits": 57355552, "q_proj": { "group_size": { @@ -2389,7 +2389,7 @@ } }, { - "accuracy": 0.9750404637306929, + "accuracy": 0.9750551991164684, "total_bits": 57430144, "q_proj": { "group_size": { @@ -2441,7 +2441,7 @@ } }, { - "accuracy": 0.976738478988409, + "accuracy": 0.976717684417963, "total_bits": 57950464, "q_proj": { "group_size": { @@ -2493,7 +2493,7 @@ } }, { - "accuracy": 0.9780394490808249, + "accuracy": 0.9780480619519949, "total_bits": 58692736, "q_proj": { "group_size": { @@ -2545,7 +2545,7 @@ } }, { - "accuracy": 0.9763826839625835, + "accuracy": 0.9763856939971447, "total_bits": 59068544, "q_proj": { "group_size": { @@ -2609,7 +2609,7 @@ } }, { - "accuracy": 0.9780621360987425, + "accuracy": 0.9780414216220379, "total_bits": 59588864, "q_proj": { "group_size": { @@ -2673,7 +2673,7 @@ } }, { - "accuracy": 0.9801010321825743, + "accuracy": 0.9800688195973635, "total_bits": 61536832, "q_proj": { "group_size": { @@ -2734,7 +2734,7 @@ } }, { - "accuracy": 0.981600085273385, + "accuracy": 0.9815671853721142, "total_bits": 62354560, "q_proj": { "group_size": { @@ -2795,7 +2795,7 @@ } }, { - "accuracy": 0.9890466667711735, + "accuracy": 0.9890200421214104, "total_bits": 75246880, "q_proj": { "group_size": { @@ -2856,7 +2856,7 @@ } }, { - "accuracy": 0.9907460613176227, + "accuracy": 0.9907318344339728, "total_bits": 76510336, "q_proj": { "group_size": { @@ -2917,7 +2917,7 @@ } }, { - "accuracy": 0.9933391944505274, + "accuracy": 0.9933400782756507, "total_bits": 85667104, "q_proj": { "group_size": { @@ -2969,7 +2969,7 @@ } }, { - "accuracy": 0.9952039420604706, + "accuracy": 0.9951940830796957, "total_bits": 91722880, "q_proj": { "group_size": { @@ -3021,7 +3021,7 @@ } }, { - "accuracy": 0.9982604767428711, + "accuracy": 0.9982599728973582, "total_bits": 113978656, "q_proj": { "group_size": { @@ -3075,7 +3075,7 @@ ], "model.layers.1.mlp": [ { - "accuracy": 0.8869373872876167, + "accuracy": 0.887041375041008, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -3127,7 +3127,7 @@ } }, { - "accuracy": 0.891030453145504, + "accuracy": 0.8909792527556419, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -3179,7 +3179,7 @@ } }, { - "accuracy": 0.9027609676122665, + "accuracy": 0.9027382656931877, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -3228,7 +3228,7 @@ } }, { - "accuracy": 0.9062561988830566, + "accuracy": 0.9062387868762016, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -3277,7 +3277,7 @@ } }, { - "accuracy": 0.9437772929668427, + "accuracy": 0.943806029856205, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -3329,7 +3329,7 @@ } }, { - "accuracy": 0.9482904970645905, + "accuracy": 0.9483064226806164, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -3381,7 +3381,7 @@ } }, { - "accuracy": 0.952780719846487, + "accuracy": 0.9527781158685684, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -3430,7 +3430,7 @@ } }, { - "accuracy": 0.9698743838816881, + "accuracy": 0.9698769953101873, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -3473,7 +3473,7 @@ } }, { - "accuracy": 0.9721903912723064, + "accuracy": 0.9722175262868404, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -3516,7 +3516,7 @@ } }, { - "accuracy": 0.9712930209934711, + "accuracy": 0.9713117778301239, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -3568,7 +3568,7 @@ } }, { - "accuracy": 0.9747709520161152, + "accuracy": 0.9747742302715778, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -3620,7 +3620,7 @@ } }, { - "accuracy": 0.9853192111477256, + "accuracy": 0.9853277914226055, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -3672,7 +3672,7 @@ } }, { - "accuracy": 0.987357254140079, + "accuracy": 0.9873669799417257, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -3724,7 +3724,7 @@ } }, { - "accuracy": 0.9915956920012832, + "accuracy": 0.9915947569534183, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -3767,7 +3767,7 @@ } }, { - "accuracy": 0.9925124426372349, + "accuracy": 0.9925175970420241, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -3816,7 +3816,7 @@ } }, { - "accuracy": 0.9935486940667033, + "accuracy": 0.9935514670796692, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -3862,7 +3862,7 @@ } }, { - "accuracy": 0.9976398337166756, + "accuracy": 0.9976405743509531, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -3904,7 +3904,7 @@ ], "model.layers.2.self_attn": [ { - "accuracy": 0.8655510395765305, + "accuracy": 0.8655463457107544, "total_bits": 30308928, "q_proj": { "group_size": { @@ -3968,7 +3968,7 @@ } }, { - "accuracy": 0.8742070347070694, + "accuracy": 0.874164268374443, "total_bits": 31455808, "q_proj": { "group_size": { @@ -4032,7 +4032,7 @@ } }, { - "accuracy": 0.8933860436081886, + "accuracy": 0.8934662640094757, "total_bits": 33412832, "q_proj": { "group_size": { @@ -4096,7 +4096,7 @@ } }, { - "accuracy": 0.9261169582605362, + "accuracy": 0.926240935921669, "total_bits": 37983200, "q_proj": { "group_size": { @@ -4160,7 +4160,7 @@ } }, { - "accuracy": 0.933709405362606, + "accuracy": 0.9337229505181313, "total_bits": 44838176, "q_proj": { "group_size": { @@ -4224,7 +4224,7 @@ } }, { - "accuracy": 0.9347171932458878, + "accuracy": 0.9346923530101776, "total_bits": 44912768, "q_proj": { "group_size": { @@ -4288,7 +4288,7 @@ } }, { - "accuracy": 0.9634591825306416, + "accuracy": 0.9634601436555386, "total_bits": 57355552, "q_proj": { "group_size": { @@ -4340,7 +4340,7 @@ } }, { - "accuracy": 0.9642514251172543, + "accuracy": 0.9642136543989182, "total_bits": 57430144, "q_proj": { "group_size": { @@ -4392,7 +4392,7 @@ } }, { - "accuracy": 0.9666738845407963, + "accuracy": 0.9666857272386551, "total_bits": 57950464, "q_proj": { "group_size": { @@ -4444,7 +4444,7 @@ } }, { - "accuracy": 0.9683135040104389, + "accuracy": 0.9683275371789932, "total_bits": 58692736, "q_proj": { "group_size": { @@ -4496,7 +4496,7 @@ } }, { - "accuracy": 0.966770775616169, + "accuracy": 0.9667858779430389, "total_bits": 59068544, "q_proj": { "group_size": { @@ -4560,7 +4560,7 @@ } }, { - "accuracy": 0.9689657036215067, + "accuracy": 0.9689403381198645, "total_bits": 59588864, "q_proj": { "group_size": { @@ -4624,7 +4624,7 @@ } }, { - "accuracy": 0.9732588063925505, + "accuracy": 0.9732514582574368, "total_bits": 61536832, "q_proj": { "group_size": { @@ -4685,7 +4685,7 @@ } }, { - "accuracy": 0.9749700985848904, + "accuracy": 0.9749796185642481, "total_bits": 62354560, "q_proj": { "group_size": { @@ -4746,7 +4746,7 @@ } }, { - "accuracy": 0.985321925021708, + "accuracy": 0.9853210505098104, "total_bits": 75246880, "q_proj": { "group_size": { @@ -4807,7 +4807,7 @@ } }, { - "accuracy": 0.9874144792556763, + "accuracy": 0.9874111460521817, "total_bits": 76510336, "q_proj": { "group_size": { @@ -4868,7 +4868,7 @@ } }, { - "accuracy": 0.9904179144650698, + "accuracy": 0.9904154865071177, "total_bits": 85667104, "q_proj": { "group_size": { @@ -4920,7 +4920,7 @@ } }, { - "accuracy": 0.9935114970430732, + "accuracy": 0.9935085913166404, "total_bits": 91722880, "q_proj": { "group_size": { @@ -4972,7 +4972,7 @@ } }, { - "accuracy": 0.9975107992067933, + "accuracy": 0.9975118087604642, "total_bits": 113978656, "q_proj": { "group_size": { @@ -5026,7 +5026,7 @@ ], "model.layers.2.mlp": [ { - "accuracy": 0.8512221872806549, + "accuracy": 0.851137638092041, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -5078,7 +5078,7 @@ } }, { - "accuracy": 0.8556944578886032, + "accuracy": 0.8557578176259995, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -5130,7 +5130,7 @@ } }, { - "accuracy": 0.8742920905351639, + "accuracy": 0.8742973953485489, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -5179,7 +5179,7 @@ } }, { - "accuracy": 0.8798726350069046, + "accuracy": 0.8798764571547508, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -5228,7 +5228,7 @@ } }, { - "accuracy": 0.9260013550519943, + "accuracy": 0.9259674102067947, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -5280,7 +5280,7 @@ } }, { - "accuracy": 0.9317035898566246, + "accuracy": 0.9316787645220757, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -5332,7 +5332,7 @@ } }, { - "accuracy": 0.9391488991677761, + "accuracy": 0.9391309916973114, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -5381,7 +5381,7 @@ } }, { - "accuracy": 0.9611527696251869, + "accuracy": 0.9611707739531994, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -5424,7 +5424,7 @@ } }, { - "accuracy": 0.9643270559608936, + "accuracy": 0.964320108294487, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -5467,7 +5467,7 @@ } }, { - "accuracy": 0.9622061587870121, + "accuracy": 0.962238498032093, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -5519,7 +5519,7 @@ } }, { - "accuracy": 0.966707780957222, + "accuracy": 0.9667122215032578, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -5571,7 +5571,7 @@ } }, { - "accuracy": 0.9806768018752337, + "accuracy": 0.9806710071861744, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -5623,7 +5623,7 @@ } }, { - "accuracy": 0.9833411537110806, + "accuracy": 0.9833368640393019, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -5675,7 +5675,7 @@ } }, { - "accuracy": 0.9893169151619077, + "accuracy": 0.98932437133044, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -5718,7 +5718,7 @@ } }, { - "accuracy": 0.9900901559740305, + "accuracy": 0.990092589519918, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -5767,7 +5767,7 @@ } }, { - "accuracy": 0.9917803723365068, + "accuracy": 0.9917868180200458, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -5813,7 +5813,7 @@ } }, { - "accuracy": 0.997135940939188, + "accuracy": 0.9971363425720483, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -5855,7 +5855,7 @@ ], "model.layers.3.self_attn": [ { - "accuracy": 0.8845625817775726, + "accuracy": 0.8846139460802078, "total_bits": 30308928, "q_proj": { "group_size": { @@ -5919,7 +5919,7 @@ } }, { - "accuracy": 0.8901228457689285, + "accuracy": 0.8900518491864204, "total_bits": 31455808, "q_proj": { "group_size": { @@ -5983,7 +5983,7 @@ } }, { - "accuracy": 0.9061683937907219, + "accuracy": 0.9061124995350838, "total_bits": 33412832, "q_proj": { "group_size": { @@ -6047,7 +6047,7 @@ } }, { - "accuracy": 0.9347674697637558, + "accuracy": 0.9347528889775276, "total_bits": 37983200, "q_proj": { "group_size": { @@ -6111,7 +6111,7 @@ } }, { - "accuracy": 0.9422827735543251, + "accuracy": 0.9422792084515095, "total_bits": 44838176, "q_proj": { "group_size": { @@ -6175,7 +6175,7 @@ } }, { - "accuracy": 0.943145889788866, + "accuracy": 0.9431353025138378, "total_bits": 44912768, "q_proj": { "group_size": { @@ -6239,7 +6239,7 @@ } }, { - "accuracy": 0.9687017947435379, + "accuracy": 0.9687346704304218, "total_bits": 57355552, "q_proj": { "group_size": { @@ -6291,7 +6291,7 @@ } }, { - "accuracy": 0.969449121505022, + "accuracy": 0.9694707691669464, "total_bits": 57430144, "q_proj": { "group_size": { @@ -6343,7 +6343,7 @@ } }, { - "accuracy": 0.9714747574180365, + "accuracy": 0.9715053513646126, "total_bits": 57950464, "q_proj": { "group_size": { @@ -6395,7 +6395,7 @@ } }, { - "accuracy": 0.9727979246526957, + "accuracy": 0.9728143084794283, "total_bits": 58692736, "q_proj": { "group_size": { @@ -6447,7 +6447,7 @@ } }, { - "accuracy": 0.9711320530623198, + "accuracy": 0.9711146093904972, "total_bits": 59068544, "q_proj": { "group_size": { @@ -6511,7 +6511,7 @@ } }, { - "accuracy": 0.9730110038071871, + "accuracy": 0.9730188455432653, "total_bits": 59588864, "q_proj": { "group_size": { @@ -6575,7 +6575,7 @@ } }, { - "accuracy": 0.9766805954277515, + "accuracy": 0.9766947887837887, "total_bits": 61536832, "q_proj": { "group_size": { @@ -6636,7 +6636,7 @@ } }, { - "accuracy": 0.9783372972160578, + "accuracy": 0.9783317521214485, "total_bits": 62354560, "q_proj": { "group_size": { @@ -6697,7 +6697,7 @@ } }, { - "accuracy": 0.9873075932264328, + "accuracy": 0.9873018255457282, "total_bits": 75246880, "q_proj": { "group_size": { @@ -6758,7 +6758,7 @@ } }, { - "accuracy": 0.9891520766541362, + "accuracy": 0.9891604781150818, "total_bits": 76510336, "q_proj": { "group_size": { @@ -6819,7 +6819,7 @@ } }, { - "accuracy": 0.9918732857331634, + "accuracy": 0.9918712023645639, "total_bits": 85667104, "q_proj": { "group_size": { @@ -6871,7 +6871,7 @@ } }, { - "accuracy": 0.994609275367111, + "accuracy": 0.9946046634577215, "total_bits": 91722880, "q_proj": { "group_size": { @@ -6923,7 +6923,7 @@ } }, { - "accuracy": 0.9978871110361069, + "accuracy": 0.9978904649615288, "total_bits": 113978656, "q_proj": { "group_size": { @@ -6977,7 +6977,7 @@ ], "model.layers.3.mlp": [ { - "accuracy": 0.8215165734291077, + "accuracy": 0.8215235769748688, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -7029,7 +7029,7 @@ } }, { - "accuracy": 0.8267818093299866, + "accuracy": 0.8267826288938522, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -7081,7 +7081,7 @@ } }, { - "accuracy": 0.8501903116703033, + "accuracy": 0.8501260429620743, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -7130,7 +7130,7 @@ } }, { - "accuracy": 0.8572592884302139, + "accuracy": 0.8572545945644379, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -7179,7 +7179,7 @@ } }, { - "accuracy": 0.9100245088338852, + "accuracy": 0.9100974574685097, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -7231,7 +7231,7 @@ } }, { - "accuracy": 0.9172510206699371, + "accuracy": 0.9171888679265976, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -7283,7 +7283,7 @@ } }, { - "accuracy": 0.9271175712347031, + "accuracy": 0.92706498503685, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -7332,7 +7332,7 @@ } }, { - "accuracy": 0.953081201761961, + "accuracy": 0.9530698768794537, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -7375,7 +7375,7 @@ } }, { - "accuracy": 0.9570418335497379, + "accuracy": 0.957017607986927, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -7418,7 +7418,7 @@ } }, { - "accuracy": 0.9540456458926201, + "accuracy": 0.9540662579238415, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -7470,7 +7470,7 @@ } }, { - "accuracy": 0.9596328996121883, + "accuracy": 0.9596161395311356, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -7522,7 +7522,7 @@ } }, { - "accuracy": 0.9765274990350008, + "accuracy": 0.9765002690255642, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -7574,7 +7574,7 @@ } }, { - "accuracy": 0.9798263423144817, + "accuracy": 0.979815537109971, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -7626,7 +7626,7 @@ } }, { - "accuracy": 0.9871442606672645, + "accuracy": 0.987149802967906, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -7669,7 +7669,7 @@ } }, { - "accuracy": 0.9879334066063166, + "accuracy": 0.9879286577925086, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -7718,7 +7718,7 @@ } }, { - "accuracy": 0.9901348492130637, + "accuracy": 0.9901374354958534, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -7764,7 +7764,7 @@ } }, { - "accuracy": 0.9965592622756958, + "accuracy": 0.9965564699377865, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -7806,7 +7806,7 @@ ], "model.layers.4.self_attn": [ { - "accuracy": 0.8741211891174316, + "accuracy": 0.8741328567266464, "total_bits": 30308928, "q_proj": { "group_size": { @@ -7870,7 +7870,7 @@ } }, { - "accuracy": 0.8816789761185646, + "accuracy": 0.8816472738981247, "total_bits": 31455808, "q_proj": { "group_size": { @@ -7934,7 +7934,7 @@ } }, { - "accuracy": 0.9003885015845299, + "accuracy": 0.900344654917717, "total_bits": 33412832, "q_proj": { "group_size": { @@ -7998,7 +7998,7 @@ } }, { - "accuracy": 0.9307805150747299, + "accuracy": 0.9307383000850677, "total_bits": 37983200, "q_proj": { "group_size": { @@ -8062,7 +8062,7 @@ } }, { - "accuracy": 0.9374072849750519, + "accuracy": 0.9374280199408531, "total_bits": 44838176, "q_proj": { "group_size": { @@ -8126,7 +8126,7 @@ } }, { - "accuracy": 0.9384637139737606, + "accuracy": 0.9384343661367893, "total_bits": 44912768, "q_proj": { "group_size": { @@ -8190,7 +8190,7 @@ } }, { - "accuracy": 0.9653116390109062, + "accuracy": 0.9653166085481644, "total_bits": 57355552, "q_proj": { "group_size": { @@ -8242,7 +8242,7 @@ } }, { - "accuracy": 0.9661814905703068, + "accuracy": 0.9661872051656246, "total_bits": 57430144, "q_proj": { "group_size": { @@ -8294,7 +8294,7 @@ } }, { - "accuracy": 0.9684111662209034, + "accuracy": 0.968420397490263, "total_bits": 57950464, "q_proj": { "group_size": { @@ -8346,7 +8346,7 @@ } }, { - "accuracy": 0.969778697937727, + "accuracy": 0.9697968028485775, "total_bits": 58692736, "q_proj": { "group_size": { @@ -8398,7 +8398,7 @@ } }, { - "accuracy": 0.9687559828162193, + "accuracy": 0.9687640070915222, "total_bits": 59068544, "q_proj": { "group_size": { @@ -8462,7 +8462,7 @@ } }, { - "accuracy": 0.9707713481038809, + "accuracy": 0.9707700200378895, "total_bits": 59588864, "q_proj": { "group_size": { @@ -8526,7 +8526,7 @@ } }, { - "accuracy": 0.975062221288681, + "accuracy": 0.9750581458210945, "total_bits": 61536832, "q_proj": { "group_size": { @@ -8587,7 +8587,7 @@ } }, { - "accuracy": 0.9766068141907454, + "accuracy": 0.9766066540032625, "total_bits": 62354560, "q_proj": { "group_size": { @@ -8648,7 +8648,7 @@ } }, { - "accuracy": 0.986367778852582, + "accuracy": 0.9863643515855074, "total_bits": 75246880, "q_proj": { "group_size": { @@ -8709,7 +8709,7 @@ } }, { - "accuracy": 0.9882961716502905, + "accuracy": 0.9882954657077789, "total_bits": 76510336, "q_proj": { "group_size": { @@ -8770,7 +8770,7 @@ } }, { - "accuracy": 0.9909742707386613, + "accuracy": 0.9909781841561198, "total_bits": 85667104, "q_proj": { "group_size": { @@ -8822,7 +8822,7 @@ } }, { - "accuracy": 0.9939752677455544, + "accuracy": 0.9939774051308632, "total_bits": 91722880, "q_proj": { "group_size": { @@ -8874,7 +8874,7 @@ } }, { - "accuracy": 0.9976646257564425, + "accuracy": 0.9976642981637269, "total_bits": 113978656, "q_proj": { "group_size": { @@ -8928,7 +8928,7 @@ ], "model.layers.4.mlp": [ { - "accuracy": 0.8349805325269699, + "accuracy": 0.8348695486783981, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -8980,7 +8980,7 @@ } }, { - "accuracy": 0.8401748985052109, + "accuracy": 0.8400902897119522, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -9032,7 +9032,7 @@ } }, { - "accuracy": 0.8632630258798599, + "accuracy": 0.863140657544136, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -9081,7 +9081,7 @@ } }, { - "accuracy": 0.8702157586812973, + "accuracy": 0.870071679353714, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -9130,7 +9130,7 @@ } }, { - "accuracy": 0.9168255552649498, + "accuracy": 0.9167942702770233, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -9182,7 +9182,7 @@ } }, { - "accuracy": 0.9239948987960815, + "accuracy": 0.9239982962608337, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -9234,7 +9234,7 @@ } }, { - "accuracy": 0.933478482067585, + "accuracy": 0.9335077553987503, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -9283,7 +9283,7 @@ } }, { - "accuracy": 0.9563411399722099, + "accuracy": 0.9563678838312626, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -9326,7 +9326,7 @@ } }, { - "accuracy": 0.960248950868845, + "accuracy": 0.960248876363039, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -9369,7 +9369,7 @@ } }, { - "accuracy": 0.9574717655777931, + "accuracy": 0.9574565887451172, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -9421,7 +9421,7 @@ } }, { - "accuracy": 0.9629541300237179, + "accuracy": 0.9629608169198036, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -9473,7 +9473,7 @@ } }, { - "accuracy": 0.9782424960285425, + "accuracy": 0.9782421588897705, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -9525,7 +9525,7 @@ } }, { - "accuracy": 0.9814701918512583, + "accuracy": 0.9814739804714918, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -9577,7 +9577,7 @@ } }, { - "accuracy": 0.9879318736493587, + "accuracy": 0.9879294466227293, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -9620,7 +9620,7 @@ } }, { - "accuracy": 0.9888098947703838, + "accuracy": 0.988809896633029, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -9669,7 +9669,7 @@ } }, { - "accuracy": 0.9909165976569057, + "accuracy": 0.9909201338887215, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -9715,7 +9715,7 @@ } }, { - "accuracy": 0.9967805305495858, + "accuracy": 0.9967838707379997, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -9757,7 +9757,7 @@ ], "model.layers.5.self_attn": [ { - "accuracy": 0.8810675218701363, + "accuracy": 0.8811230733990669, "total_bits": 30308928, "q_proj": { "group_size": { @@ -9821,7 +9821,7 @@ } }, { - "accuracy": 0.8886952474713326, + "accuracy": 0.8887623399496078, "total_bits": 31455808, "q_proj": { "group_size": { @@ -9885,7 +9885,7 @@ } }, { - "accuracy": 0.9045190438628197, + "accuracy": 0.904540665447712, "total_bits": 33412832, "q_proj": { "group_size": { @@ -9949,7 +9949,7 @@ } }, { - "accuracy": 0.9352795407176018, + "accuracy": 0.9353184551000595, "total_bits": 37983200, "q_proj": { "group_size": { @@ -10013,7 +10013,7 @@ } }, { - "accuracy": 0.9399208948016167, + "accuracy": 0.9399426616728306, "total_bits": 44838176, "q_proj": { "group_size": { @@ -10077,7 +10077,7 @@ } }, { - "accuracy": 0.9410183131694794, + "accuracy": 0.9409984610974789, "total_bits": 44912768, "q_proj": { "group_size": { @@ -10141,7 +10141,7 @@ } }, { - "accuracy": 0.9663527235388756, + "accuracy": 0.9663707427680492, "total_bits": 57355552, "q_proj": { "group_size": { @@ -10193,7 +10193,7 @@ } }, { - "accuracy": 0.967367872595787, + "accuracy": 0.9673691280186176, "total_bits": 57430144, "q_proj": { "group_size": { @@ -10245,7 +10245,7 @@ } }, { - "accuracy": 0.9696921166032553, + "accuracy": 0.9697138108313084, "total_bits": 57950464, "q_proj": { "group_size": { @@ -10297,7 +10297,7 @@ } }, { - "accuracy": 0.9711299203336239, + "accuracy": 0.9711332526057959, "total_bits": 58692736, "q_proj": { "group_size": { @@ -10349,7 +10349,7 @@ } }, { - "accuracy": 0.9700027704238892, + "accuracy": 0.9700067639350891, "total_bits": 59068544, "q_proj": { "group_size": { @@ -10413,7 +10413,7 @@ } }, { - "accuracy": 0.9720256011933088, + "accuracy": 0.9720334056764841, "total_bits": 59588864, "q_proj": { "group_size": { @@ -10477,7 +10477,7 @@ } }, { - "accuracy": 0.9756313841789961, + "accuracy": 0.9756301864981651, "total_bits": 61536832, "q_proj": { "group_size": { @@ -10538,7 +10538,7 @@ } }, { - "accuracy": 0.9773869439959526, + "accuracy": 0.9774045348167419, "total_bits": 62354560, "q_proj": { "group_size": { @@ -10599,7 +10599,7 @@ } }, { - "accuracy": 0.9866560539230704, + "accuracy": 0.9866563268005848, "total_bits": 75246880, "q_proj": { "group_size": { @@ -10660,7 +10660,7 @@ } }, { - "accuracy": 0.9886289816349745, + "accuracy": 0.9886361388489604, "total_bits": 76510336, "q_proj": { "group_size": { @@ -10721,7 +10721,7 @@ } }, { - "accuracy": 0.9912481410428882, + "accuracy": 0.9912527557462454, "total_bits": 85667104, "q_proj": { "group_size": { @@ -10773,7 +10773,7 @@ } }, { - "accuracy": 0.9942180886864662, + "accuracy": 0.9942179205827415, "total_bits": 91722880, "q_proj": { "group_size": { @@ -10825,7 +10825,7 @@ } }, { - "accuracy": 0.9977244043257087, + "accuracy": 0.9977258909493685, "total_bits": 113978656, "q_proj": { "group_size": { @@ -10879,7 +10879,7 @@ ], "model.layers.5.mlp": [ { - "accuracy": 0.8648017942905426, + "accuracy": 0.8648174107074738, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -10931,7 +10931,7 @@ } }, { - "accuracy": 0.8694759905338287, + "accuracy": 0.8695154935121536, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -10983,7 +10983,7 @@ } }, { - "accuracy": 0.8880036026239395, + "accuracy": 0.888036236166954, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -11032,7 +11032,7 @@ } }, { - "accuracy": 0.8937847763299942, + "accuracy": 0.8938298374414444, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -11081,7 +11081,7 @@ } }, { - "accuracy": 0.9318181350827217, + "accuracy": 0.931794673204422, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -11133,7 +11133,7 @@ } }, { - "accuracy": 0.9377684108912945, + "accuracy": 0.9377873539924622, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -11185,7 +11185,7 @@ } }, { - "accuracy": 0.9455864503979683, + "accuracy": 0.9456103965640068, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -11234,7 +11234,7 @@ } }, { - "accuracy": 0.9638955146074295, + "accuracy": 0.963904220610857, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -11277,7 +11277,7 @@ } }, { - "accuracy": 0.9671880304813385, + "accuracy": 0.9671907536685467, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -11320,7 +11320,7 @@ } }, { - "accuracy": 0.9650383368134499, + "accuracy": 0.9650482423603535, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -11372,7 +11372,7 @@ } }, { - "accuracy": 0.9695848729461432, + "accuracy": 0.9695756994187832, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -11424,7 +11424,7 @@ } }, { - "accuracy": 0.9821004029363394, + "accuracy": 0.982111718505621, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -11476,7 +11476,7 @@ } }, { - "accuracy": 0.9847700102254748, + "accuracy": 0.984773620031774, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -11528,7 +11528,7 @@ } }, { - "accuracy": 0.990053579211235, + "accuracy": 0.9900560518726707, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -11571,7 +11571,7 @@ } }, { - "accuracy": 0.9907908504828811, + "accuracy": 0.990793714299798, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -11620,7 +11620,7 @@ } }, { - "accuracy": 0.992512381169945, + "accuracy": 0.992513523902744, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -11666,7 +11666,7 @@ } }, { - "accuracy": 0.9973284220322967, + "accuracy": 0.997328422497958, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -11708,7 +11708,7 @@ ], "model.layers.6.self_attn": [ { - "accuracy": 0.8890528008341789, + "accuracy": 0.8890272378921509, "total_bits": 30308928, "q_proj": { "group_size": { @@ -11772,7 +11772,7 @@ } }, { - "accuracy": 0.8953105807304382, + "accuracy": 0.8953426331281662, "total_bits": 31455808, "q_proj": { "group_size": { @@ -11836,7 +11836,7 @@ } }, { - "accuracy": 0.9070602431893349, + "accuracy": 0.9071049243211746, "total_bits": 33412832, "q_proj": { "group_size": { @@ -11900,7 +11900,7 @@ } }, { - "accuracy": 0.9330306127667427, + "accuracy": 0.9330921769142151, "total_bits": 37983200, "q_proj": { "group_size": { @@ -11964,7 +11964,7 @@ } }, { - "accuracy": 0.9448112137615681, + "accuracy": 0.9447792358696461, "total_bits": 44838176, "q_proj": { "group_size": { @@ -12028,7 +12028,7 @@ } }, { - "accuracy": 0.9454820677638054, + "accuracy": 0.9455131739377975, "total_bits": 44912768, "q_proj": { "group_size": { @@ -12092,7 +12092,7 @@ } }, { - "accuracy": 0.9695140719413757, + "accuracy": 0.969525508582592, "total_bits": 57355552, "q_proj": { "group_size": { @@ -12144,7 +12144,7 @@ } }, { - "accuracy": 0.9701519533991814, + "accuracy": 0.9701721202582121, "total_bits": 57430144, "q_proj": { "group_size": { @@ -12196,7 +12196,7 @@ } }, { - "accuracy": 0.972233023494482, + "accuracy": 0.9722142405807972, "total_bits": 57950464, "q_proj": { "group_size": { @@ -12248,7 +12248,7 @@ } }, { - "accuracy": 0.9737806580960751, + "accuracy": 0.9737892020493746, "total_bits": 58692736, "q_proj": { "group_size": { @@ -12300,7 +12300,7 @@ } }, { - "accuracy": 0.9722792375832796, + "accuracy": 0.9722646549344063, "total_bits": 59068544, "q_proj": { "group_size": { @@ -12364,7 +12364,7 @@ } }, { - "accuracy": 0.9740959145128727, + "accuracy": 0.9741003829985857, "total_bits": 59588864, "q_proj": { "group_size": { @@ -12428,7 +12428,7 @@ } }, { - "accuracy": 0.9769062623381615, + "accuracy": 0.9769276678562164, "total_bits": 61536832, "q_proj": { "group_size": { @@ -12489,7 +12489,7 @@ } }, { - "accuracy": 0.9786777105182409, + "accuracy": 0.9786724224686623, "total_bits": 62354560, "q_proj": { "group_size": { @@ -12550,7 +12550,7 @@ } }, { - "accuracy": 0.987405676394701, + "accuracy": 0.9874210571870208, "total_bits": 75246880, "q_proj": { "group_size": { @@ -12611,7 +12611,7 @@ } }, { - "accuracy": 0.9893234008923173, + "accuracy": 0.9893340524286032, "total_bits": 76510336, "q_proj": { "group_size": { @@ -12672,7 +12672,7 @@ } }, { - "accuracy": 0.9920955216512084, + "accuracy": 0.9920956883579493, "total_bits": 85667104, "q_proj": { "group_size": { @@ -12724,7 +12724,7 @@ } }, { - "accuracy": 0.9945340054109693, + "accuracy": 0.9945395006798208, "total_bits": 91722880, "q_proj": { "group_size": { @@ -12776,7 +12776,7 @@ } }, { - "accuracy": 0.9979429002851248, + "accuracy": 0.9979436090216041, "total_bits": 113978656, "q_proj": { "group_size": { @@ -12830,7 +12830,7 @@ ], "model.layers.6.mlp": [ { - "accuracy": 0.8601508587598801, + "accuracy": 0.860052615404129, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -12882,7 +12882,7 @@ } }, { - "accuracy": 0.8646412193775177, + "accuracy": 0.864541083574295, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -12934,7 +12934,7 @@ } }, { - "accuracy": 0.883434846997261, + "accuracy": 0.8833191320300102, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -12983,7 +12983,7 @@ } }, { - "accuracy": 0.8892851322889328, + "accuracy": 0.8891885280609131, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -13032,7 +13032,7 @@ } }, { - "accuracy": 0.9288300052285194, + "accuracy": 0.928782157599926, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -13084,7 +13084,7 @@ } }, { - "accuracy": 0.9350205287337303, + "accuracy": 0.9350093528628349, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -13136,7 +13136,7 @@ } }, { - "accuracy": 0.942976824939251, + "accuracy": 0.9429488480091095, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -13185,7 +13185,7 @@ } }, { - "accuracy": 0.9626522436738014, + "accuracy": 0.9626510068774223, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -13228,7 +13228,7 @@ } }, { - "accuracy": 0.9660748802125454, + "accuracy": 0.9660806246101856, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -13271,7 +13271,7 @@ } }, { - "accuracy": 0.9634818024933338, + "accuracy": 0.9634533040225506, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -13323,7 +13323,7 @@ } }, { - "accuracy": 0.9682779163122177, + "accuracy": 0.9682538993656635, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -13375,7 +13375,7 @@ } }, { - "accuracy": 0.9812953136861324, + "accuracy": 0.9812956769019365, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -13427,7 +13427,7 @@ } }, { - "accuracy": 0.9841256625950336, + "accuracy": 0.9841305427253246, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -13479,7 +13479,7 @@ } }, { - "accuracy": 0.9896932039409876, + "accuracy": 0.9896902348846197, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -13522,7 +13522,7 @@ } }, { - "accuracy": 0.9903836958110332, + "accuracy": 0.9903781078755856, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -13571,7 +13571,7 @@ } }, { - "accuracy": 0.9921105708926916, + "accuracy": 0.9921116251498461, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -13617,7 +13617,7 @@ } }, { - "accuracy": 0.9972038897685707, + "accuracy": 0.9972023773007095, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -13659,7 +13659,7 @@ ], "model.layers.7.self_attn": [ { - "accuracy": 0.8790968656539917, + "accuracy": 0.879193864762783, "total_bits": 30308928, "q_proj": { "group_size": { @@ -13723,7 +13723,7 @@ } }, { - "accuracy": 0.8855356946587563, + "accuracy": 0.885476142168045, "total_bits": 31455808, "q_proj": { "group_size": { @@ -13787,7 +13787,7 @@ } }, { - "accuracy": 0.9016124606132507, + "accuracy": 0.9015669599175453, "total_bits": 33412832, "q_proj": { "group_size": { @@ -13851,7 +13851,7 @@ } }, { - "accuracy": 0.9258091002702713, + "accuracy": 0.9257946684956551, "total_bits": 37983200, "q_proj": { "group_size": { @@ -13915,7 +13915,7 @@ } }, { - "accuracy": 0.9374926388263702, + "accuracy": 0.9375413469970226, "total_bits": 44838176, "q_proj": { "group_size": { @@ -13979,7 +13979,7 @@ } }, { - "accuracy": 0.9384367614984512, + "accuracy": 0.9384141005575657, "total_bits": 44912768, "q_proj": { "group_size": { @@ -14043,7 +14043,7 @@ } }, { - "accuracy": 0.9647591635584831, + "accuracy": 0.9647888205945492, "total_bits": 57355552, "q_proj": { "group_size": { @@ -14095,7 +14095,7 @@ } }, { - "accuracy": 0.965646505355835, + "accuracy": 0.9656654335558414, "total_bits": 57430144, "q_proj": { "group_size": { @@ -14147,7 +14147,7 @@ } }, { - "accuracy": 0.9682505577802658, + "accuracy": 0.968209270387888, "total_bits": 57950464, "q_proj": { "group_size": { @@ -14199,7 +14199,7 @@ } }, { - "accuracy": 0.9700952749699354, + "accuracy": 0.9700861666351557, "total_bits": 58692736, "q_proj": { "group_size": { @@ -14251,7 +14251,7 @@ } }, { - "accuracy": 0.9685632511973381, + "accuracy": 0.9685384854674339, "total_bits": 59068544, "q_proj": { "group_size": { @@ -14315,7 +14315,7 @@ } }, { - "accuracy": 0.9708435665816069, + "accuracy": 0.9708608984947205, "total_bits": 59588864, "q_proj": { "group_size": { @@ -14379,7 +14379,7 @@ } }, { - "accuracy": 0.9744916334748268, + "accuracy": 0.9745250958949327, "total_bits": 61536832, "q_proj": { "group_size": { @@ -14440,7 +14440,7 @@ } }, { - "accuracy": 0.976450975984335, + "accuracy": 0.9764064699411392, "total_bits": 62354560, "q_proj": { "group_size": { @@ -14501,7 +14501,7 @@ } }, { - "accuracy": 0.9858461897820234, + "accuracy": 0.9858506005257368, "total_bits": 75246880, "q_proj": { "group_size": { @@ -14562,7 +14562,7 @@ } }, { - "accuracy": 0.9881619503721595, + "accuracy": 0.9881491707637906, "total_bits": 76510336, "q_proj": { "group_size": { @@ -14623,7 +14623,7 @@ } }, { - "accuracy": 0.9907449893653393, + "accuracy": 0.9907346172258258, "total_bits": 85667104, "q_proj": { "group_size": { @@ -14675,7 +14675,7 @@ } }, { - "accuracy": 0.9937627115286887, + "accuracy": 0.9937750529497862, "total_bits": 91722880, "q_proj": { "group_size": { @@ -14727,7 +14727,7 @@ } }, { - "accuracy": 0.9975894596427679, + "accuracy": 0.997590501094237, "total_bits": 113978656, "q_proj": { "group_size": { @@ -14781,7 +14781,7 @@ ], "model.layers.7.mlp": [ { - "accuracy": 0.8853595852851868, + "accuracy": 0.8853648155927658, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -14833,7 +14833,7 @@ } }, { - "accuracy": 0.8890897259116173, + "accuracy": 0.8890001177787781, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -14885,7 +14885,7 @@ } }, { - "accuracy": 0.9030437618494034, + "accuracy": 0.9031427130103111, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -14934,7 +14934,7 @@ } }, { - "accuracy": 0.9074160978198051, + "accuracy": 0.9074975475668907, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -14983,7 +14983,7 @@ } }, { - "accuracy": 0.941648468375206, + "accuracy": 0.9416834153234959, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -15035,7 +15035,7 @@ } }, { - "accuracy": 0.9470459222793579, + "accuracy": 0.9470086395740509, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -15087,7 +15087,7 @@ } }, { - "accuracy": 0.9530564919114113, + "accuracy": 0.9530163891613483, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -15136,7 +15136,7 @@ } }, { - "accuracy": 0.9691261779516935, + "accuracy": 0.9691323079168797, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -15179,7 +15179,7 @@ } }, { - "accuracy": 0.9720455892384052, + "accuracy": 0.9720457717776299, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -15222,7 +15222,7 @@ } }, { - "accuracy": 0.9700704663991928, + "accuracy": 0.9700757917016745, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -15274,7 +15274,7 @@ } }, { - "accuracy": 0.9741590898483992, + "accuracy": 0.9741606414318085, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -15326,7 +15326,7 @@ } }, { - "accuracy": 0.9846790870651603, + "accuracy": 0.9846808835864067, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -15378,7 +15378,7 @@ } }, { - "accuracy": 0.9870709776878357, + "accuracy": 0.9870640141889453, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -15430,7 +15430,7 @@ } }, { - "accuracy": 0.9914329303428531, + "accuracy": 0.9914321266114712, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -15473,7 +15473,7 @@ } }, { - "accuracy": 0.9921443285420537, + "accuracy": 0.9921473953872919, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -15522,7 +15522,7 @@ } }, { - "accuracy": 0.9934511734172702, + "accuracy": 0.9934548917226493, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -15568,7 +15568,7 @@ } }, { - "accuracy": 0.997653994243592, + "accuracy": 0.9976542603690177, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -15610,7 +15610,7 @@ ], "model.layers.8.self_attn": [ { - "accuracy": 0.9262347742915154, + "accuracy": 0.9262180775403976, "total_bits": 30308928, "q_proj": { "group_size": { @@ -15674,7 +15674,7 @@ } }, { - "accuracy": 0.9292053729295731, + "accuracy": 0.9292021617293358, "total_bits": 31455808, "q_proj": { "group_size": { @@ -15738,7 +15738,7 @@ } }, { - "accuracy": 0.9359699636697769, + "accuracy": 0.9360192567110062, "total_bits": 33412832, "q_proj": { "group_size": { @@ -15802,7 +15802,7 @@ } }, { - "accuracy": 0.9522256478667259, + "accuracy": 0.9522725865244865, "total_bits": 37983200, "q_proj": { "group_size": { @@ -15866,7 +15866,7 @@ } }, { - "accuracy": 0.9621881134808064, + "accuracy": 0.9622119329869747, "total_bits": 44838176, "q_proj": { "group_size": { @@ -15930,7 +15930,7 @@ } }, { - "accuracy": 0.9625761918723583, + "accuracy": 0.9625555910170078, "total_bits": 44912768, "q_proj": { "group_size": { @@ -15994,7 +15994,7 @@ } }, { - "accuracy": 0.9790825769305229, + "accuracy": 0.9790912084281445, "total_bits": 57355552, "q_proj": { "group_size": { @@ -16046,7 +16046,7 @@ } }, { - "accuracy": 0.9794511869549751, + "accuracy": 0.9794544521719217, "total_bits": 57430144, "q_proj": { "group_size": { @@ -16098,7 +16098,7 @@ } }, { - "accuracy": 0.9807918332517147, + "accuracy": 0.9808075986802578, "total_bits": 57950464, "q_proj": { "group_size": { @@ -16150,7 +16150,7 @@ } }, { - "accuracy": 0.9819746408611536, + "accuracy": 0.9819814618676901, "total_bits": 58692736, "q_proj": { "group_size": { @@ -16202,7 +16202,7 @@ } }, { - "accuracy": 0.9808401670306921, + "accuracy": 0.980836171656847, "total_bits": 59068544, "q_proj": { "group_size": { @@ -16266,7 +16266,7 @@ } }, { - "accuracy": 0.9820886384695768, + "accuracy": 0.9820813406258821, "total_bits": 59588864, "q_proj": { "group_size": { @@ -16330,7 +16330,7 @@ } }, { - "accuracy": 0.9836654253304005, + "accuracy": 0.9836451895534992, "total_bits": 61536832, "q_proj": { "group_size": { @@ -16391,7 +16391,7 @@ } }, { - "accuracy": 0.984879620373249, + "accuracy": 0.9848749991506338, "total_bits": 62354560, "q_proj": { "group_size": { @@ -16452,7 +16452,7 @@ } }, { - "accuracy": 0.9910424621775746, + "accuracy": 0.9910451974719763, "total_bits": 75246880, "q_proj": { "group_size": { @@ -16513,7 +16513,7 @@ } }, { - "accuracy": 0.9924080655910075, + "accuracy": 0.9923991961404681, "total_bits": 76510336, "q_proj": { "group_size": { @@ -16574,7 +16574,7 @@ } }, { - "accuracy": 0.9945205664262176, + "accuracy": 0.9945177044719458, "total_bits": 85667104, "q_proj": { "group_size": { @@ -16626,7 +16626,7 @@ } }, { - "accuracy": 0.996047873981297, + "accuracy": 0.9960471182130277, "total_bits": 91722880, "q_proj": { "group_size": { @@ -16678,7 +16678,7 @@ } }, { - "accuracy": 0.998559134779498, + "accuracy": 0.9985587185947224, "total_bits": 113978656, "q_proj": { "group_size": { @@ -16732,7 +16732,7 @@ ], "model.layers.8.mlp": [ { - "accuracy": 0.8776565492153168, + "accuracy": 0.8774635121226311, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -16784,7 +16784,7 @@ } }, { - "accuracy": 0.8816645741462708, + "accuracy": 0.8816986083984375, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -16836,7 +16836,7 @@ } }, { - "accuracy": 0.8966159075498581, + "accuracy": 0.8964935094118118, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -16885,7 +16885,7 @@ } }, { - "accuracy": 0.9011181369423866, + "accuracy": 0.9010185077786446, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -16934,7 +16934,7 @@ } }, { - "accuracy": 0.9383117109537125, + "accuracy": 0.9382704459130764, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -16986,7 +16986,7 @@ } }, { - "accuracy": 0.9435076154768467, + "accuracy": 0.943505771458149, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -17038,7 +17038,7 @@ } }, { - "accuracy": 0.94978042319417, + "accuracy": 0.9497714042663574, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -17087,7 +17087,7 @@ } }, { - "accuracy": 0.9677746780216694, + "accuracy": 0.9677646122872829, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -17130,7 +17130,7 @@ } }, { - "accuracy": 0.9705556537955999, + "accuracy": 0.9705599583685398, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -17173,7 +17173,7 @@ } }, { - "accuracy": 0.9684275537729263, + "accuracy": 0.9684217162430286, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -17225,7 +17225,7 @@ } }, { - "accuracy": 0.972480921074748, + "accuracy": 0.9724891372025013, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -17277,7 +17277,7 @@ } }, { - "accuracy": 0.9838621038943529, + "accuracy": 0.9838705994188786, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -17329,7 +17329,7 @@ } }, { - "accuracy": 0.9862669911235571, + "accuracy": 0.9862625077366829, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -17381,7 +17381,7 @@ } }, { - "accuracy": 0.9911140948534012, + "accuracy": 0.9911155067384243, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -17424,7 +17424,7 @@ } }, { - "accuracy": 0.9916985612362623, + "accuracy": 0.9917009193450212, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -17473,7 +17473,7 @@ } }, { - "accuracy": 0.9930045073851943, + "accuracy": 0.9930097297765315, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -17519,7 +17519,7 @@ } }, { - "accuracy": 0.9975975535344332, + "accuracy": 0.9975970382802188, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -17561,7 +17561,7 @@ ], "model.layers.9.self_attn": [ { - "accuracy": 0.9156324192881584, + "accuracy": 0.9154471009969711, "total_bits": 30308928, "q_proj": { "group_size": { @@ -17625,7 +17625,7 @@ } }, { - "accuracy": 0.918098546564579, + "accuracy": 0.9180809780955315, "total_bits": 31455808, "q_proj": { "group_size": { @@ -17689,7 +17689,7 @@ } }, { - "accuracy": 0.9291017279028893, + "accuracy": 0.9292140081524849, "total_bits": 33412832, "q_proj": { "group_size": { @@ -17753,7 +17753,7 @@ } }, { - "accuracy": 0.9474808238446712, + "accuracy": 0.9475394748151302, "total_bits": 37983200, "q_proj": { "group_size": { @@ -17817,7 +17817,7 @@ } }, { - "accuracy": 0.9566572569310665, + "accuracy": 0.9566517025232315, "total_bits": 44838176, "q_proj": { "group_size": { @@ -17881,7 +17881,7 @@ } }, { - "accuracy": 0.9572707749903202, + "accuracy": 0.9572483897209167, "total_bits": 44912768, "q_proj": { "group_size": { @@ -17945,7 +17945,7 @@ } }, { - "accuracy": 0.9765746779739857, + "accuracy": 0.9765565041452646, "total_bits": 57355552, "q_proj": { "group_size": { @@ -17997,7 +17997,7 @@ } }, { - "accuracy": 0.9771516304463148, + "accuracy": 0.9771292954683304, "total_bits": 57430144, "q_proj": { "group_size": { @@ -18049,7 +18049,7 @@ } }, { - "accuracy": 0.9786375071853399, + "accuracy": 0.9786593876779079, "total_bits": 57950464, "q_proj": { "group_size": { @@ -18101,7 +18101,7 @@ } }, { - "accuracy": 0.9796764496713877, + "accuracy": 0.9796735905110836, "total_bits": 58692736, "q_proj": { "group_size": { @@ -18153,7 +18153,7 @@ } }, { - "accuracy": 0.9782940931618214, + "accuracy": 0.9782825838774443, "total_bits": 59068544, "q_proj": { "group_size": { @@ -18217,7 +18217,7 @@ } }, { - "accuracy": 0.9796239528805017, + "accuracy": 0.9796628952026367, "total_bits": 59588864, "q_proj": { "group_size": { @@ -18281,7 +18281,7 @@ } }, { - "accuracy": 0.9821039438247681, + "accuracy": 0.9821524657309055, "total_bits": 61536832, "q_proj": { "group_size": { @@ -18342,7 +18342,7 @@ } }, { - "accuracy": 0.9833755418658257, + "accuracy": 0.9833454601466656, "total_bits": 62354560, "q_proj": { "group_size": { @@ -18403,7 +18403,7 @@ } }, { - "accuracy": 0.9902575109153986, + "accuracy": 0.9902483588084579, "total_bits": 75246880, "q_proj": { "group_size": { @@ -18464,7 +18464,7 @@ } }, { - "accuracy": 0.9916903469711542, + "accuracy": 0.9916817611083388, "total_bits": 76510336, "q_proj": { "group_size": { @@ -18525,7 +18525,7 @@ } }, { - "accuracy": 0.993913528509438, + "accuracy": 0.9939101827330887, "total_bits": 85667104, "q_proj": { "group_size": { @@ -18577,7 +18577,7 @@ } }, { - "accuracy": 0.995829266961664, + "accuracy": 0.99583475664258, "total_bits": 91722880, "q_proj": { "group_size": { @@ -18629,7 +18629,7 @@ } }, { - "accuracy": 0.9984044209122658, + "accuracy": 0.9984046985628083, "total_bits": 113978656, "q_proj": { "group_size": { @@ -18683,7 +18683,7 @@ ], "model.layers.9.mlp": [ { - "accuracy": 0.8979872688651085, + "accuracy": 0.8980022817850113, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -18735,7 +18735,7 @@ } }, { - "accuracy": 0.9010738134384155, + "accuracy": 0.9009037613868713, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -18787,7 +18787,7 @@ } }, { - "accuracy": 0.9138390645384789, + "accuracy": 0.9135458469390869, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -18836,7 +18836,7 @@ } }, { - "accuracy": 0.9180445671081543, + "accuracy": 0.9177292063832283, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -18885,7 +18885,7 @@ } }, { - "accuracy": 0.9479075893759727, + "accuracy": 0.9478593431413174, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -18937,7 +18937,7 @@ } }, { - "accuracy": 0.9523597359657288, + "accuracy": 0.9523407816886902, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -18989,7 +18989,7 @@ } }, { - "accuracy": 0.9581680968403816, + "accuracy": 0.958098616451025, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -19038,7 +19038,7 @@ } }, { - "accuracy": 0.9725048933178186, + "accuracy": 0.9725117534399033, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -19081,7 +19081,7 @@ } }, { - "accuracy": 0.9750282820314169, + "accuracy": 0.975043885409832, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -19124,7 +19124,7 @@ } }, { - "accuracy": 0.9732320122420788, + "accuracy": 0.9732519965618849, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -19176,7 +19176,7 @@ } }, { - "accuracy": 0.9767951015383005, + "accuracy": 0.9767921902239323, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -19228,7 +19228,7 @@ } }, { - "accuracy": 0.9863404175266623, + "accuracy": 0.9863471165299416, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -19280,7 +19280,7 @@ } }, { - "accuracy": 0.9883861737325788, + "accuracy": 0.9883871376514435, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -19332,7 +19332,7 @@ } }, { - "accuracy": 0.992430523969233, + "accuracy": 0.9924324788153172, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -19375,7 +19375,7 @@ } }, { - "accuracy": 0.9929885254241526, + "accuracy": 0.9929874055087566, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -19424,7 +19424,7 @@ } }, { - "accuracy": 0.9942358685657382, + "accuracy": 0.9942356436513364, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -19470,7 +19470,7 @@ } }, { - "accuracy": 0.9979169676080346, + "accuracy": 0.9979170782025903, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -19512,7 +19512,7 @@ ], "model.layers.10.self_attn": [ { - "accuracy": 0.9255667924880981, + "accuracy": 0.9254285618662834, "total_bits": 30308928, "q_proj": { "group_size": { @@ -19576,7 +19576,7 @@ } }, { - "accuracy": 0.9285323470830917, + "accuracy": 0.9285455048084259, "total_bits": 31455808, "q_proj": { "group_size": { @@ -19640,7 +19640,7 @@ } }, { - "accuracy": 0.9377534314990044, + "accuracy": 0.9378277622163296, "total_bits": 33412832, "q_proj": { "group_size": { @@ -19704,7 +19704,7 @@ } }, { - "accuracy": 0.9557530134916306, + "accuracy": 0.9558689743280411, "total_bits": 37983200, "q_proj": { "group_size": { @@ -19768,7 +19768,7 @@ } }, { - "accuracy": 0.9622449390590191, + "accuracy": 0.962271124124527, "total_bits": 44838176, "q_proj": { "group_size": { @@ -19832,7 +19832,7 @@ } }, { - "accuracy": 0.9627878665924072, + "accuracy": 0.9627652131021023, "total_bits": 44912768, "q_proj": { "group_size": { @@ -19896,7 +19896,7 @@ } }, { - "accuracy": 0.9794471673667431, + "accuracy": 0.9794409442692995, "total_bits": 57355552, "q_proj": { "group_size": { @@ -19948,7 +19948,7 @@ } }, { - "accuracy": 0.9799556694924831, + "accuracy": 0.9799547977745533, "total_bits": 57430144, "q_proj": { "group_size": { @@ -20000,7 +20000,7 @@ } }, { - "accuracy": 0.9812588579952717, + "accuracy": 0.9812564067542553, "total_bits": 57950464, "q_proj": { "group_size": { @@ -20052,7 +20052,7 @@ } }, { - "accuracy": 0.982187744230032, + "accuracy": 0.98219870403409, "total_bits": 58692736, "q_proj": { "group_size": { @@ -20104,7 +20104,7 @@ } }, { - "accuracy": 0.9810379017144442, + "accuracy": 0.9810190796852112, "total_bits": 59068544, "q_proj": { "group_size": { @@ -20168,7 +20168,7 @@ } }, { - "accuracy": 0.9822507984936237, + "accuracy": 0.9822470918297768, "total_bits": 59588864, "q_proj": { "group_size": { @@ -20232,7 +20232,7 @@ } }, { - "accuracy": 0.9842813797295094, + "accuracy": 0.9842821806669235, "total_bits": 61536832, "q_proj": { "group_size": { @@ -20293,7 +20293,7 @@ } }, { - "accuracy": 0.9854367896914482, + "accuracy": 0.9854378383606672, "total_bits": 62354560, "q_proj": { "group_size": { @@ -20354,7 +20354,7 @@ } }, { - "accuracy": 0.991425178013742, + "accuracy": 0.9914244255051017, "total_bits": 75246880, "q_proj": { "group_size": { @@ -20415,7 +20415,7 @@ } }, { - "accuracy": 0.9926807903684676, + "accuracy": 0.9926830539479852, "total_bits": 76510336, "q_proj": { "group_size": { @@ -20476,7 +20476,7 @@ } }, { - "accuracy": 0.9946406041271985, + "accuracy": 0.994636666495353, "total_bits": 85667104, "q_proj": { "group_size": { @@ -20528,7 +20528,7 @@ } }, { - "accuracy": 0.9963198550976813, + "accuracy": 0.9963192888535559, "total_bits": 91722880, "q_proj": { "group_size": { @@ -20580,7 +20580,7 @@ } }, { - "accuracy": 0.9985976866446435, + "accuracy": 0.9985979022458196, "total_bits": 113978656, "q_proj": { "group_size": { @@ -20634,7 +20634,7 @@ ], "model.layers.10.mlp": [ { - "accuracy": 0.9072035849094391, + "accuracy": 0.9071538224816322, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -20686,7 +20686,7 @@ } }, { - "accuracy": 0.9100625887513161, + "accuracy": 0.9100388288497925, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -20738,7 +20738,7 @@ } }, { - "accuracy": 0.9221524447202682, + "accuracy": 0.922150731086731, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -20787,7 +20787,7 @@ } }, { - "accuracy": 0.9259821102023125, + "accuracy": 0.9259923249483109, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -20836,7 +20836,7 @@ } }, { - "accuracy": 0.9525629505515099, + "accuracy": 0.9525576233863831, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -20888,7 +20888,7 @@ } }, { - "accuracy": 0.9565679579973221, + "accuracy": 0.9565683789551258, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -20940,7 +20940,7 @@ } }, { - "accuracy": 0.9619633853435516, + "accuracy": 0.9619757160544395, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -20989,7 +20989,7 @@ } }, { - "accuracy": 0.975079670548439, + "accuracy": 0.9750785324722528, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -21032,7 +21032,7 @@ } }, { - "accuracy": 0.9773116856813431, + "accuracy": 0.9773098323494196, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -21075,7 +21075,7 @@ } }, { - "accuracy": 0.9756849519908428, + "accuracy": 0.9756814874708652, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -21127,7 +21127,7 @@ } }, { - "accuracy": 0.9788219351321459, + "accuracy": 0.9788009151816368, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -21179,7 +21179,7 @@ } }, { - "accuracy": 0.9875948084518313, + "accuracy": 0.9875935269519687, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -21231,7 +21231,7 @@ } }, { - "accuracy": 0.9894048757851124, + "accuracy": 0.9894073354080319, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -21283,7 +21283,7 @@ } }, { - "accuracy": 0.993154349271208, + "accuracy": 0.9931564317084849, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -21326,7 +21326,7 @@ } }, { - "accuracy": 0.9936201777309179, + "accuracy": 0.9936129190027714, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -21375,7 +21375,7 @@ } }, { - "accuracy": 0.9947737217880785, + "accuracy": 0.9947650441899896, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -21421,7 +21421,7 @@ } }, { - "accuracy": 0.9981311410665512, + "accuracy": 0.9981314450269565, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -21463,7 +21463,7 @@ ], "model.layers.11.self_attn": [ { - "accuracy": 0.9352168366312981, + "accuracy": 0.9351540505886078, "total_bits": 30308928, "q_proj": { "group_size": { @@ -21527,7 +21527,7 @@ } }, { - "accuracy": 0.9374474063515663, + "accuracy": 0.9374874904751778, "total_bits": 31455808, "q_proj": { "group_size": { @@ -21591,7 +21591,7 @@ } }, { - "accuracy": 0.9444124512374401, + "accuracy": 0.9444890134036541, "total_bits": 33412832, "q_proj": { "group_size": { @@ -21655,7 +21655,7 @@ } }, { - "accuracy": 0.9625572040677071, + "accuracy": 0.9625845514237881, "total_bits": 37983200, "q_proj": { "group_size": { @@ -21719,7 +21719,7 @@ } }, { - "accuracy": 0.9669128507375717, + "accuracy": 0.9669028967618942, "total_bits": 44838176, "q_proj": { "group_size": { @@ -21783,7 +21783,7 @@ } }, { - "accuracy": 0.967328879982233, + "accuracy": 0.9672983437776566, "total_bits": 44912768, "q_proj": { "group_size": { @@ -21847,7 +21847,7 @@ } }, { - "accuracy": 0.9819058496505022, + "accuracy": 0.9818990211933851, "total_bits": 57355552, "q_proj": { "group_size": { @@ -21899,7 +21899,7 @@ } }, { - "accuracy": 0.9823221303522587, + "accuracy": 0.9823174811899662, "total_bits": 57430144, "q_proj": { "group_size": { @@ -21951,7 +21951,7 @@ } }, { - "accuracy": 0.9834885075688362, + "accuracy": 0.9834803491830826, "total_bits": 57950464, "q_proj": { "group_size": { @@ -22003,7 +22003,7 @@ } }, { - "accuracy": 0.9843579828739166, + "accuracy": 0.9843547828495502, "total_bits": 58692736, "q_proj": { "group_size": { @@ -22055,7 +22055,7 @@ } }, { - "accuracy": 0.9833086878061295, + "accuracy": 0.9833086282014847, "total_bits": 59068544, "q_proj": { "group_size": { @@ -22119,7 +22119,7 @@ } }, { - "accuracy": 0.9843683261424303, + "accuracy": 0.9843555800616741, "total_bits": 59588864, "q_proj": { "group_size": { @@ -22183,7 +22183,7 @@ } }, { - "accuracy": 0.9858474927023053, + "accuracy": 0.9858486671000719, "total_bits": 61536832, "q_proj": { "group_size": { @@ -22244,7 +22244,7 @@ } }, { - "accuracy": 0.9868558822199702, + "accuracy": 0.9868420660495758, "total_bits": 62354560, "q_proj": { "group_size": { @@ -22305,7 +22305,7 @@ } }, { - "accuracy": 0.9922798662446439, + "accuracy": 0.9922812515869737, "total_bits": 75246880, "q_proj": { "group_size": { @@ -22366,7 +22366,7 @@ } }, { - "accuracy": 0.9933844502083957, + "accuracy": 0.9933867929503322, "total_bits": 76510336, "q_proj": { "group_size": { @@ -22427,7 +22427,7 @@ } }, { - "accuracy": 0.9952675346285105, + "accuracy": 0.9952673111110926, "total_bits": 85667104, "q_proj": { "group_size": { @@ -22479,7 +22479,7 @@ } }, { - "accuracy": 0.9966305803973228, + "accuracy": 0.9966264350805432, "total_bits": 91722880, "q_proj": { "group_size": { @@ -22531,7 +22531,7 @@ } }, { - "accuracy": 0.9987549100769684, + "accuracy": 0.9987560133449733, "total_bits": 113978656, "q_proj": { "group_size": { @@ -22585,7 +22585,7 @@ ], "model.layers.11.mlp": [ { - "accuracy": 0.922992967069149, + "accuracy": 0.9229258298873901, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -22637,7 +22637,7 @@ } }, { - "accuracy": 0.9253613352775574, + "accuracy": 0.9253562912344933, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -22689,7 +22689,7 @@ } }, { - "accuracy": 0.9349236041307449, + "accuracy": 0.9348956197500229, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -22738,7 +22738,7 @@ } }, { - "accuracy": 0.9380608797073364, + "accuracy": 0.9380255676805973, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -22787,7 +22787,7 @@ } }, { - "accuracy": 0.9607282392680645, + "accuracy": 0.9607758708298206, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -22839,7 +22839,7 @@ } }, { - "accuracy": 0.9641470424830914, + "accuracy": 0.964177817106247, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -22891,7 +22891,7 @@ } }, { - "accuracy": 0.9683838337659836, + "accuracy": 0.9684282056987286, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -22940,7 +22940,7 @@ } }, { - "accuracy": 0.9791794028133154, + "accuracy": 0.9791763704270124, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -22983,7 +22983,7 @@ } }, { - "accuracy": 0.9810750614851713, + "accuracy": 0.9810761008411646, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -23026,7 +23026,7 @@ } }, { - "accuracy": 0.9798438455909491, + "accuracy": 0.9798630569130182, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -23078,7 +23078,7 @@ } }, { - "accuracy": 0.9825253784656525, + "accuracy": 0.9825179129838943, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -23130,7 +23130,7 @@ } }, { - "accuracy": 0.9897021958604455, + "accuracy": 0.9896943140774965, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -23182,7 +23182,7 @@ } }, { - "accuracy": 0.9912520227953792, + "accuracy": 0.9912572083994746, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -23234,7 +23234,7 @@ } }, { - "accuracy": 0.994236150290817, + "accuracy": 0.9942377745173872, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -23277,7 +23277,7 @@ } }, { - "accuracy": 0.9947156864218414, + "accuracy": 0.9947184869088233, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -23326,7 +23326,7 @@ } }, { - "accuracy": 0.9956142762675881, + "accuracy": 0.9956165258772671, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -23372,7 +23372,7 @@ } }, { - "accuracy": 0.9984074216336012, + "accuracy": 0.9984078536508605, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -23414,7 +23414,7 @@ ], "model.layers.12.self_attn": [ { - "accuracy": 0.918254628777504, + "accuracy": 0.9183487147092819, "total_bits": 30308928, "q_proj": { "group_size": { @@ -23478,7 +23478,7 @@ } }, { - "accuracy": 0.9215041920542717, + "accuracy": 0.9214219599962234, "total_bits": 31455808, "q_proj": { "group_size": { @@ -23542,7 +23542,7 @@ } }, { - "accuracy": 0.9291860163211823, + "accuracy": 0.9291634485125542, "total_bits": 33412832, "q_proj": { "group_size": { @@ -23606,7 +23606,7 @@ } }, { - "accuracy": 0.9523625448346138, + "accuracy": 0.9523275718092918, "total_bits": 37983200, "q_proj": { "group_size": { @@ -23670,7 +23670,7 @@ } }, { - "accuracy": 0.9582577794790268, + "accuracy": 0.958238810300827, "total_bits": 44838176, "q_proj": { "group_size": { @@ -23734,7 +23734,7 @@ } }, { - "accuracy": 0.9587131217122078, + "accuracy": 0.9586759731173515, "total_bits": 44912768, "q_proj": { "group_size": { @@ -23798,7 +23798,7 @@ } }, { - "accuracy": 0.9767006933689117, + "accuracy": 0.9766934681683779, "total_bits": 57355552, "q_proj": { "group_size": { @@ -23850,7 +23850,7 @@ } }, { - "accuracy": 0.9771417211741209, + "accuracy": 0.9771546181291342, "total_bits": 57430144, "q_proj": { "group_size": { @@ -23902,7 +23902,7 @@ } }, { - "accuracy": 0.9786731544882059, + "accuracy": 0.978665629401803, "total_bits": 57950464, "q_proj": { "group_size": { @@ -23954,7 +23954,7 @@ } }, { - "accuracy": 0.9797742627561092, + "accuracy": 0.9797797929495573, "total_bits": 58692736, "q_proj": { "group_size": { @@ -24006,7 +24006,7 @@ } }, { - "accuracy": 0.9788827616721392, + "accuracy": 0.9788805264979601, "total_bits": 59068544, "q_proj": { "group_size": { @@ -24070,7 +24070,7 @@ } }, { - "accuracy": 0.980213237926364, + "accuracy": 0.9802060816437006, "total_bits": 59588864, "q_proj": { "group_size": { @@ -24134,7 +24134,7 @@ } }, { - "accuracy": 0.9817759990692139, + "accuracy": 0.9817687887698412, "total_bits": 61536832, "q_proj": { "group_size": { @@ -24195,7 +24195,7 @@ } }, { - "accuracy": 0.9829946663230658, + "accuracy": 0.9829999972134829, "total_bits": 62354560, "q_proj": { "group_size": { @@ -24256,7 +24256,7 @@ } }, { - "accuracy": 0.9900454664602876, + "accuracy": 0.9900399595499039, "total_bits": 75246880, "q_proj": { "group_size": { @@ -24317,7 +24317,7 @@ } }, { - "accuracy": 0.9914399096742272, + "accuracy": 0.9914370570331812, "total_bits": 76510336, "q_proj": { "group_size": { @@ -24378,7 +24378,7 @@ } }, { - "accuracy": 0.9938779231160879, + "accuracy": 0.9938817266374826, "total_bits": 85667104, "q_proj": { "group_size": { @@ -24430,7 +24430,7 @@ } }, { - "accuracy": 0.9955275356769562, + "accuracy": 0.9955261144787073, "total_bits": 91722880, "q_proj": { "group_size": { @@ -24482,7 +24482,7 @@ } }, { - "accuracy": 0.998387377592735, + "accuracy": 0.998388102161698, "total_bits": 113978656, "q_proj": { "group_size": { @@ -24536,7 +24536,7 @@ ], "model.layers.12.mlp": [ { - "accuracy": 0.9067049399018288, + "accuracy": 0.9067919254302979, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -24588,7 +24588,7 @@ } }, { - "accuracy": 0.9094245880842209, + "accuracy": 0.9094521254301071, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -24640,7 +24640,7 @@ } }, { - "accuracy": 0.9205821231007576, + "accuracy": 0.9205865487456322, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -24689,7 +24689,7 @@ } }, { - "accuracy": 0.924173966050148, + "accuracy": 0.9241846203804016, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -24738,7 +24738,7 @@ } }, { - "accuracy": 0.9520841389894485, + "accuracy": 0.9520521014928818, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -24790,7 +24790,7 @@ } }, { - "accuracy": 0.9562458842992783, + "accuracy": 0.9562351442873478, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -24842,7 +24842,7 @@ } }, { - "accuracy": 0.9611620157957077, + "accuracy": 0.961151484400034, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -24891,7 +24891,7 @@ } }, { - "accuracy": 0.9748448915779591, + "accuracy": 0.9748354908078909, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -24934,7 +24934,7 @@ } }, { - "accuracy": 0.9771162606775761, + "accuracy": 0.9771051350980997, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -24977,7 +24977,7 @@ } }, { - "accuracy": 0.975365836173296, + "accuracy": 0.9753743782639503, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -25029,7 +25029,7 @@ } }, { - "accuracy": 0.9786117561161518, + "accuracy": 0.9786114767193794, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -25081,7 +25081,7 @@ } }, { - "accuracy": 0.9873783187940717, + "accuracy": 0.9873899882659316, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -25133,7 +25133,7 @@ } }, { - "accuracy": 0.9893058259040117, + "accuracy": 0.9893016312271357, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -25185,7 +25185,7 @@ } }, { - "accuracy": 0.9930427521467209, + "accuracy": 0.993039789609611, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -25228,7 +25228,7 @@ } }, { - "accuracy": 0.9935374888591468, + "accuracy": 0.9935355954803526, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -25277,7 +25277,7 @@ } }, { - "accuracy": 0.9945738040842116, + "accuracy": 0.9945709388703108, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -25323,7 +25323,7 @@ } }, { - "accuracy": 0.9981157196452841, + "accuracy": 0.9981151465326548, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -25365,7 +25365,7 @@ ], "model.layers.13.self_attn": [ { - "accuracy": 0.914382241666317, + "accuracy": 0.9144919887185097, "total_bits": 30308928, "q_proj": { "group_size": { @@ -25429,7 +25429,7 @@ } }, { - "accuracy": 0.9174628779292107, + "accuracy": 0.9174542501568794, "total_bits": 31455808, "q_proj": { "group_size": { @@ -25493,7 +25493,7 @@ } }, { - "accuracy": 0.9295148551464081, + "accuracy": 0.9295745342969894, "total_bits": 33412832, "q_proj": { "group_size": { @@ -25557,7 +25557,7 @@ } }, { - "accuracy": 0.9491968564689159, + "accuracy": 0.9492183402180672, "total_bits": 37983200, "q_proj": { "group_size": { @@ -25621,7 +25621,7 @@ } }, { - "accuracy": 0.955919798463583, + "accuracy": 0.9559485502541065, "total_bits": 44838176, "q_proj": { "group_size": { @@ -25685,7 +25685,7 @@ } }, { - "accuracy": 0.9567287154495716, + "accuracy": 0.9566921889781952, "total_bits": 44912768, "q_proj": { "group_size": { @@ -25749,7 +25749,7 @@ } }, { - "accuracy": 0.9756081849336624, + "accuracy": 0.9756113328039646, "total_bits": 57355552, "q_proj": { "group_size": { @@ -25801,7 +25801,7 @@ } }, { - "accuracy": 0.9762581083923578, + "accuracy": 0.9762618523091078, "total_bits": 57430144, "q_proj": { "group_size": { @@ -25853,7 +25853,7 @@ } }, { - "accuracy": 0.9783238749951124, + "accuracy": 0.9782921988517046, "total_bits": 57950464, "q_proj": { "group_size": { @@ -25905,7 +25905,7 @@ } }, { - "accuracy": 0.9795089289546013, + "accuracy": 0.9794944487512112, "total_bits": 58692736, "q_proj": { "group_size": { @@ -25957,7 +25957,7 @@ } }, { - "accuracy": 0.9779392145574093, + "accuracy": 0.9778795074671507, "total_bits": 59068544, "q_proj": { "group_size": { @@ -26021,7 +26021,7 @@ } }, { - "accuracy": 0.9795319139957428, + "accuracy": 0.979520695284009, "total_bits": 59588864, "q_proj": { "group_size": { @@ -26085,7 +26085,7 @@ } }, { - "accuracy": 0.9819448851048946, + "accuracy": 0.9819323495030403, "total_bits": 61536832, "q_proj": { "group_size": { @@ -26146,7 +26146,7 @@ } }, { - "accuracy": 0.9835209306329489, + "accuracy": 0.9835347458720207, "total_bits": 62354560, "q_proj": { "group_size": { @@ -26207,7 +26207,7 @@ } }, { - "accuracy": 0.9901209101080894, + "accuracy": 0.9901253506541252, "total_bits": 75246880, "q_proj": { "group_size": { @@ -26268,7 +26268,7 @@ } }, { - "accuracy": 0.9917429555207491, + "accuracy": 0.9917331263422966, "total_bits": 76510336, "q_proj": { "group_size": { @@ -26329,7 +26329,7 @@ } }, { - "accuracy": 0.9937325660139322, + "accuracy": 0.9937320556491613, "total_bits": 85667104, "q_proj": { "group_size": { @@ -26381,7 +26381,7 @@ } }, { - "accuracy": 0.9958382518962026, + "accuracy": 0.9958483558148146, "total_bits": 91722880, "q_proj": { "group_size": { @@ -26433,7 +26433,7 @@ } }, { - "accuracy": 0.9983558729290962, + "accuracy": 0.9983553681522608, "total_bits": 113978656, "q_proj": { "group_size": { @@ -26487,7 +26487,7 @@ ], "model.layers.13.mlp": [ { - "accuracy": 0.9058817103505135, + "accuracy": 0.9057564288377762, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -26539,7 +26539,7 @@ } }, { - "accuracy": 0.9087112993001938, + "accuracy": 0.9086236134171486, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -26591,7 +26591,7 @@ } }, { - "accuracy": 0.9195607155561447, + "accuracy": 0.9196574911475182, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -26640,7 +26640,7 @@ } }, { - "accuracy": 0.923167884349823, + "accuracy": 0.9232490658760071, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -26689,7 +26689,7 @@ } }, { - "accuracy": 0.9515799544751644, + "accuracy": 0.9516337104141712, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -26741,7 +26741,7 @@ } }, { - "accuracy": 0.9560265839099884, + "accuracy": 0.9560323432087898, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -26793,7 +26793,7 @@ } }, { - "accuracy": 0.9607695490121841, + "accuracy": 0.9607681259512901, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -26842,7 +26842,7 @@ } }, { - "accuracy": 0.9745559766888618, + "accuracy": 0.9745499193668365, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -26885,7 +26885,7 @@ } }, { - "accuracy": 0.976823752745986, + "accuracy": 0.9768188558518887, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -26928,7 +26928,7 @@ } }, { - "accuracy": 0.9750555753707886, + "accuracy": 0.9750737082213163, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -26980,7 +26980,7 @@ } }, { - "accuracy": 0.978454452008009, + "accuracy": 0.9784559179097414, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -27032,7 +27032,7 @@ } }, { - "accuracy": 0.9872105978429317, + "accuracy": 0.9872140353545547, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -27084,7 +27084,7 @@ } }, { - "accuracy": 0.9891844298690557, + "accuracy": 0.9891853602603078, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -27136,7 +27136,7 @@ } }, { - "accuracy": 0.992884736508131, + "accuracy": 0.9928796184249222, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -27179,7 +27179,7 @@ } }, { - "accuracy": 0.9934014892205596, + "accuracy": 0.9934069863520563, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -27228,7 +27228,7 @@ } }, { - "accuracy": 0.9944165083579719, + "accuracy": 0.9944231859408319, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -27274,7 +27274,7 @@ } }, { - "accuracy": 0.9980151185300201, + "accuracy": 0.9980159213300794, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -27316,7 +27316,7 @@ ], "model.layers.14.self_attn": [ { - "accuracy": 0.9055267497897148, + "accuracy": 0.9052515029907227, "total_bits": 30308928, "q_proj": { "group_size": { @@ -27380,7 +27380,7 @@ } }, { - "accuracy": 0.9082472920417786, + "accuracy": 0.9081130772829056, "total_bits": 31455808, "q_proj": { "group_size": { @@ -27444,7 +27444,7 @@ } }, { - "accuracy": 0.9182290732860565, + "accuracy": 0.9183298647403717, "total_bits": 33412832, "q_proj": { "group_size": { @@ -27508,7 +27508,7 @@ } }, { - "accuracy": 0.9408689215779305, + "accuracy": 0.9409149326384068, "total_bits": 37983200, "q_proj": { "group_size": { @@ -27572,7 +27572,7 @@ } }, { - "accuracy": 0.9510448761284351, + "accuracy": 0.9511469714343548, "total_bits": 44838176, "q_proj": { "group_size": { @@ -27636,7 +27636,7 @@ } }, { - "accuracy": 0.9517546966671944, + "accuracy": 0.9518323987722397, "total_bits": 44912768, "q_proj": { "group_size": { @@ -27700,7 +27700,7 @@ } }, { - "accuracy": 0.9723473638296127, + "accuracy": 0.9723943509161472, "total_bits": 57355552, "q_proj": { "group_size": { @@ -27752,7 +27752,7 @@ } }, { - "accuracy": 0.9730114750564098, + "accuracy": 0.9731061886996031, "total_bits": 57430144, "q_proj": { "group_size": { @@ -27804,7 +27804,7 @@ } }, { - "accuracy": 0.9746960289776325, + "accuracy": 0.9747657887637615, "total_bits": 57950464, "q_proj": { "group_size": { @@ -27856,7 +27856,7 @@ } }, { - "accuracy": 0.9767959043383598, + "accuracy": 0.9768108148127794, "total_bits": 58692736, "q_proj": { "group_size": { @@ -27908,7 +27908,7 @@ } }, { - "accuracy": 0.9753426536917686, + "accuracy": 0.975377295166254, "total_bits": 59068544, "q_proj": { "group_size": { @@ -27972,7 +27972,7 @@ } }, { - "accuracy": 0.9770860001444817, + "accuracy": 0.9770306386053562, "total_bits": 59588864, "q_proj": { "group_size": { @@ -28036,7 +28036,7 @@ } }, { - "accuracy": 0.979099478572607, + "accuracy": 0.9790472611784935, "total_bits": 61536832, "q_proj": { "group_size": { @@ -28097,7 +28097,7 @@ } }, { - "accuracy": 0.9806705601513386, + "accuracy": 0.9806842133402824, "total_bits": 62354560, "q_proj": { "group_size": { @@ -28158,7 +28158,7 @@ } }, { - "accuracy": 0.9885000661015511, + "accuracy": 0.9885049602016807, "total_bits": 75246880, "q_proj": { "group_size": { @@ -28219,7 +28219,7 @@ } }, { - "accuracy": 0.9902753746137023, + "accuracy": 0.9902975112199783, "total_bits": 76510336, "q_proj": { "group_size": { @@ -28280,7 +28280,7 @@ } }, { - "accuracy": 0.992810903582722, + "accuracy": 0.9927993132732809, "total_bits": 85667104, "q_proj": { "group_size": { @@ -28332,7 +28332,7 @@ } }, { - "accuracy": 0.9949225764721632, + "accuracy": 0.994893008377403, "total_bits": 91722880, "q_proj": { "group_size": { @@ -28384,7 +28384,7 @@ } }, { - "accuracy": 0.9981167989317328, + "accuracy": 0.998116486473009, "total_bits": 113978656, "q_proj": { "group_size": { @@ -28438,7 +28438,7 @@ ], "model.layers.14.mlp": [ { - "accuracy": 0.9059914350509644, + "accuracy": 0.90602907538414, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -28490,7 +28490,7 @@ } }, { - "accuracy": 0.9088080897927284, + "accuracy": 0.9087480306625366, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -28542,7 +28542,7 @@ } }, { - "accuracy": 0.9203511402010918, + "accuracy": 0.9203285947442055, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -28591,7 +28591,7 @@ } }, { - "accuracy": 0.9241925030946732, + "accuracy": 0.9241577237844467, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -28640,7 +28640,7 @@ } }, { - "accuracy": 0.9516731016337872, + "accuracy": 0.951668631285429, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -28692,7 +28692,7 @@ } }, { - "accuracy": 0.9560071490705013, + "accuracy": 0.9559860564768314, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -28744,7 +28744,7 @@ } }, { - "accuracy": 0.9610604681074619, + "accuracy": 0.9610610008239746, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -28793,7 +28793,7 @@ } }, { - "accuracy": 0.9745946303009987, + "accuracy": 0.9746211394667625, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -28836,7 +28836,7 @@ } }, { - "accuracy": 0.9768316633999348, + "accuracy": 0.9768539238721132, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -28879,7 +28879,7 @@ } }, { - "accuracy": 0.9751278180629015, + "accuracy": 0.9751336295157671, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -28931,7 +28931,7 @@ } }, { - "accuracy": 0.9784498494118452, + "accuracy": 0.978433957323432, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -28983,7 +28983,7 @@ } }, { - "accuracy": 0.9872479913756251, + "accuracy": 0.9872386232018471, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -29035,7 +29035,7 @@ } }, { - "accuracy": 0.9891970083117485, + "accuracy": 0.98919727653265, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -29087,7 +29087,7 @@ } }, { - "accuracy": 0.992910641245544, + "accuracy": 0.9929077257402241, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -29130,7 +29130,7 @@ } }, { - "accuracy": 0.9934103316627443, + "accuracy": 0.99340810906142, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -29179,7 +29179,7 @@ } }, { - "accuracy": 0.9944956391118467, + "accuracy": 0.9944933266378939, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -29225,7 +29225,7 @@ } }, { - "accuracy": 0.9980454861652106, + "accuracy": 0.9980455068871379, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -29267,7 +29267,7 @@ ], "model.layers.15.self_attn": [ { - "accuracy": 0.8662237524986267, + "accuracy": 0.8660960495471954, "total_bits": 30308928, "q_proj": { "group_size": { @@ -29331,7 +29331,7 @@ } }, { - "accuracy": 0.8720844835042953, + "accuracy": 0.8721434473991394, "total_bits": 31455808, "q_proj": { "group_size": { @@ -29395,7 +29395,7 @@ } }, { - "accuracy": 0.8906018137931824, + "accuracy": 0.8906832113862038, "total_bits": 33412832, "q_proj": { "group_size": { @@ -29459,7 +29459,7 @@ } }, { - "accuracy": 0.922219954431057, + "accuracy": 0.9223601892590523, "total_bits": 37983200, "q_proj": { "group_size": { @@ -29523,7 +29523,7 @@ } }, { - "accuracy": 0.9315391108393669, + "accuracy": 0.9315524771809578, "total_bits": 44838176, "q_proj": { "group_size": { @@ -29587,7 +29587,7 @@ } }, { - "accuracy": 0.9328188821673393, + "accuracy": 0.9328577220439911, "total_bits": 44912768, "q_proj": { "group_size": { @@ -29651,7 +29651,7 @@ } }, { - "accuracy": 0.9618901945650578, + "accuracy": 0.9618603363633156, "total_bits": 57355552, "q_proj": { "group_size": { @@ -29703,7 +29703,7 @@ } }, { - "accuracy": 0.9632286131381989, + "accuracy": 0.9631414413452148, "total_bits": 57430144, "q_proj": { "group_size": { @@ -29755,7 +29755,7 @@ } }, { - "accuracy": 0.9660533033311367, + "accuracy": 0.9660372957587242, "total_bits": 57950464, "q_proj": { "group_size": { @@ -29807,7 +29807,7 @@ } }, { - "accuracy": 0.9675209484994411, + "accuracy": 0.9675589837133884, "total_bits": 58692736, "q_proj": { "group_size": { @@ -29859,7 +29859,7 @@ } }, { - "accuracy": 0.9656884074211121, + "accuracy": 0.9657478630542755, "total_bits": 59068544, "q_proj": { "group_size": { @@ -29923,7 +29923,7 @@ } }, { - "accuracy": 0.9681769870221615, + "accuracy": 0.9681409150362015, "total_bits": 59588864, "q_proj": { "group_size": { @@ -29987,7 +29987,7 @@ } }, { - "accuracy": 0.9722221530973911, + "accuracy": 0.9722285084426403, "total_bits": 61536832, "q_proj": { "group_size": { @@ -30048,7 +30048,7 @@ } }, { - "accuracy": 0.9743126630783081, + "accuracy": 0.9743023552000523, "total_bits": 62354560, "q_proj": { "group_size": { @@ -30109,7 +30109,7 @@ } }, { - "accuracy": 0.9847090318799019, + "accuracy": 0.984696488827467, "total_bits": 75246880, "q_proj": { "group_size": { @@ -30170,7 +30170,7 @@ } }, { - "accuracy": 0.987136579118669, + "accuracy": 0.9871381670236588, "total_bits": 76510336, "q_proj": { "group_size": { @@ -30231,7 +30231,7 @@ } }, { - "accuracy": 0.9900257075205445, + "accuracy": 0.9900241773575544, "total_bits": 85667104, "q_proj": { "group_size": { @@ -30283,7 +30283,7 @@ } }, { - "accuracy": 0.993544745258987, + "accuracy": 0.9935367675498128, "total_bits": 91722880, "q_proj": { "group_size": { @@ -30335,7 +30335,7 @@ } }, { - "accuracy": 0.9974129700567573, + "accuracy": 0.9974108194001019, "total_bits": 113978656, "q_proj": { "group_size": { @@ -30389,7 +30389,7 @@ ], "model.layers.15.mlp": [ { - "accuracy": 0.888176292181015, + "accuracy": 0.8881220296025276, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -30441,7 +30441,7 @@ } }, { - "accuracy": 0.8917654976248741, + "accuracy": 0.8917921856045723, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -30493,7 +30493,7 @@ } }, { - "accuracy": 0.9060942456126213, + "accuracy": 0.9061857014894485, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -30542,7 +30542,7 @@ } }, { - "accuracy": 0.9107229635119438, + "accuracy": 0.9108146727085114, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -30591,7 +30591,7 @@ } }, { - "accuracy": 0.9432618841528893, + "accuracy": 0.9432695247232914, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -30643,7 +30643,7 @@ } }, { - "accuracy": 0.9481836818158627, + "accuracy": 0.9481980800628662, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -30695,7 +30695,7 @@ } }, { - "accuracy": 0.9543357789516449, + "accuracy": 0.9543447978794575, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -30744,7 +30744,7 @@ } }, { - "accuracy": 0.9701154325157404, + "accuracy": 0.9701192807406187, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -30787,7 +30787,7 @@ } }, { - "accuracy": 0.9727210849523544, + "accuracy": 0.9727198947221041, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -30830,7 +30830,7 @@ } }, { - "accuracy": 0.9709262512624264, + "accuracy": 0.9709332976490259, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -30882,7 +30882,7 @@ } }, { - "accuracy": 0.9747244548052549, + "accuracy": 0.9747237414121628, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -30934,7 +30934,7 @@ } }, { - "accuracy": 0.9851207751780748, + "accuracy": 0.9851209698244929, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -30986,7 +30986,7 @@ } }, { - "accuracy": 0.9873405825346708, + "accuracy": 0.9873364437371492, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -31038,7 +31038,7 @@ } }, { - "accuracy": 0.991690007969737, + "accuracy": 0.991686038672924, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -31081,7 +31081,7 @@ } }, { - "accuracy": 0.9923195065930486, + "accuracy": 0.9923256579786539, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -31130,7 +31130,7 @@ } }, { - "accuracy": 0.9936661920510232, + "accuracy": 0.993671263102442, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -31176,7 +31176,7 @@ } }, { - "accuracy": 0.9976954362355173, + "accuracy": 0.9976960332132876, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -31218,7 +31218,7 @@ ], "model.layers.16.self_attn": [ { - "accuracy": 0.8969288393855095, + "accuracy": 0.8970862925052643, "total_bits": 30308928, "q_proj": { "group_size": { @@ -31282,7 +31282,7 @@ } }, { - "accuracy": 0.9022532030940056, + "accuracy": 0.9023451805114746, "total_bits": 31455808, "q_proj": { "group_size": { @@ -31346,7 +31346,7 @@ } }, { - "accuracy": 0.9167034402489662, + "accuracy": 0.9166429415345192, "total_bits": 33412832, "q_proj": { "group_size": { @@ -31410,7 +31410,7 @@ } }, { - "accuracy": 0.9358327612280846, + "accuracy": 0.9357787296175957, "total_bits": 37983200, "q_proj": { "group_size": { @@ -31474,7 +31474,7 @@ } }, { - "accuracy": 0.9472634494304657, + "accuracy": 0.9472717791795731, "total_bits": 44838176, "q_proj": { "group_size": { @@ -31538,7 +31538,7 @@ } }, { - "accuracy": 0.9484786465764046, + "accuracy": 0.9484795853495598, "total_bits": 44912768, "q_proj": { "group_size": { @@ -31602,7 +31602,7 @@ } }, { - "accuracy": 0.9694637320935726, + "accuracy": 0.9694760199636221, "total_bits": 57355552, "q_proj": { "group_size": { @@ -31654,7 +31654,7 @@ } }, { - "accuracy": 0.9708479661494493, + "accuracy": 0.9708113986998796, "total_bits": 57430144, "q_proj": { "group_size": { @@ -31706,7 +31706,7 @@ } }, { - "accuracy": 0.9735263660550117, + "accuracy": 0.9735017456114292, "total_bits": 57950464, "q_proj": { "group_size": { @@ -31758,7 +31758,7 @@ } }, { - "accuracy": 0.9748429581522942, + "accuracy": 0.9747295752167702, "total_bits": 58692736, "q_proj": { "group_size": { @@ -31810,7 +31810,7 @@ } }, { - "accuracy": 0.9736697655171156, + "accuracy": 0.9736849442124367, "total_bits": 59068544, "q_proj": { "group_size": { @@ -31874,7 +31874,7 @@ } }, { - "accuracy": 0.9757199659943581, + "accuracy": 0.9757067002356052, "total_bits": 59588864, "q_proj": { "group_size": { @@ -31938,7 +31938,7 @@ } }, { - "accuracy": 0.9787998888641596, + "accuracy": 0.9787530265748501, "total_bits": 61536832, "q_proj": { "group_size": { @@ -31999,7 +31999,7 @@ } }, { - "accuracy": 0.9805225525051355, + "accuracy": 0.9805027451366186, "total_bits": 62354560, "q_proj": { "group_size": { @@ -32060,7 +32060,7 @@ } }, { - "accuracy": 0.9882316552102566, + "accuracy": 0.9882538206875324, "total_bits": 75246880, "q_proj": { "group_size": { @@ -32121,7 +32121,7 @@ } }, { - "accuracy": 0.9901310745626688, + "accuracy": 0.9901269851252437, "total_bits": 76510336, "q_proj": { "group_size": { @@ -32182,7 +32182,7 @@ } }, { - "accuracy": 0.9920943574979901, + "accuracy": 0.9920847797766328, "total_bits": 85667104, "q_proj": { "group_size": { @@ -32234,7 +32234,7 @@ } }, { - "accuracy": 0.9948356342501938, + "accuracy": 0.9948330130428076, "total_bits": 91722880, "q_proj": { "group_size": { @@ -32286,7 +32286,7 @@ } }, { - "accuracy": 0.9979338457342237, + "accuracy": 0.9979362795129418, "total_bits": 113978656, "q_proj": { "group_size": { @@ -32340,7 +32340,7 @@ ], "model.layers.16.mlp": [ { - "accuracy": 0.8954387977719307, + "accuracy": 0.8952863588929176, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -32392,7 +32392,7 @@ } }, { - "accuracy": 0.8993488028645515, + "accuracy": 0.8992033004760742, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -32444,7 +32444,7 @@ } }, { - "accuracy": 0.9125201851129532, + "accuracy": 0.9123476222157478, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -32493,7 +32493,7 @@ } }, { - "accuracy": 0.916957214474678, + "accuracy": 0.916797399520874, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -32542,7 +32542,7 @@ } }, { - "accuracy": 0.9469495937228203, + "accuracy": 0.9469642452895641, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -32594,7 +32594,7 @@ } }, { - "accuracy": 0.9515363164246082, + "accuracy": 0.951481893658638, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -32646,7 +32646,7 @@ } }, { - "accuracy": 0.9573016315698624, + "accuracy": 0.9572397917509079, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -32695,7 +32695,7 @@ } }, { - "accuracy": 0.97197007201612, + "accuracy": 0.9719776529818773, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -32738,7 +32738,7 @@ } }, { - "accuracy": 0.9743286669254303, + "accuracy": 0.974342368543148, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -32781,7 +32781,7 @@ } }, { - "accuracy": 0.9728555325418711, + "accuracy": 0.9728449210524559, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -32833,7 +32833,7 @@ } }, { - "accuracy": 0.9763589985668659, + "accuracy": 0.9763544015586376, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -32885,7 +32885,7 @@ } }, { - "accuracy": 0.9861350525170565, + "accuracy": 0.9861237006261945, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -32937,7 +32937,7 @@ } }, { - "accuracy": 0.9881947506219149, + "accuracy": 0.9881899319589138, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -32989,7 +32989,7 @@ } }, { - "accuracy": 0.9922279161401093, + "accuracy": 0.9922269973903894, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -33032,7 +33032,7 @@ } }, { - "accuracy": 0.9928275826387107, + "accuracy": 0.9928280608728528, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -33081,7 +33081,7 @@ } }, { - "accuracy": 0.9940253831446171, + "accuracy": 0.9940254967659712, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -33127,7 +33127,7 @@ } }, { - "accuracy": 0.9978487037587911, + "accuracy": 0.9978484844323248, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -33169,7 +33169,7 @@ ], "model.layers.17.self_attn": [ { - "accuracy": 0.8973334357142448, + "accuracy": 0.897542305290699, "total_bits": 30308928, "q_proj": { "group_size": { @@ -33233,7 +33233,7 @@ } }, { - "accuracy": 0.9017208069562912, + "accuracy": 0.9018189832568169, "total_bits": 31455808, "q_proj": { "group_size": { @@ -33297,7 +33297,7 @@ } }, { - "accuracy": 0.9132213443517685, + "accuracy": 0.9131938815116882, "total_bits": 33412832, "q_proj": { "group_size": { @@ -33361,7 +33361,7 @@ } }, { - "accuracy": 0.938893273472786, + "accuracy": 0.9388857409358025, "total_bits": 37983200, "q_proj": { "group_size": { @@ -33425,7 +33425,7 @@ } }, { - "accuracy": 0.9475571848452091, + "accuracy": 0.9475753307342529, "total_bits": 44838176, "q_proj": { "group_size": { @@ -33489,7 +33489,7 @@ } }, { - "accuracy": 0.9484684765338898, + "accuracy": 0.9485311545431614, "total_bits": 44912768, "q_proj": { "group_size": { @@ -33553,7 +33553,7 @@ } }, { - "accuracy": 0.9707033317536116, + "accuracy": 0.970684751868248, "total_bits": 57355552, "q_proj": { "group_size": { @@ -33605,7 +33605,7 @@ } }, { - "accuracy": 0.9716454949229956, + "accuracy": 0.9716228414326906, "total_bits": 57430144, "q_proj": { "group_size": { @@ -33657,7 +33657,7 @@ } }, { - "accuracy": 0.9738726690411568, + "accuracy": 0.973836112767458, "total_bits": 57950464, "q_proj": { "group_size": { @@ -33709,7 +33709,7 @@ } }, { - "accuracy": 0.9751554299145937, + "accuracy": 0.9751142673194408, "total_bits": 58692736, "q_proj": { "group_size": { @@ -33761,7 +33761,7 @@ } }, { - "accuracy": 0.973699688911438, + "accuracy": 0.9736771062016487, "total_bits": 59068544, "q_proj": { "group_size": { @@ -33825,7 +33825,7 @@ } }, { - "accuracy": 0.9755098223686218, + "accuracy": 0.9755203202366829, "total_bits": 59588864, "q_proj": { "group_size": { @@ -33889,7 +33889,7 @@ } }, { - "accuracy": 0.9779850598424673, + "accuracy": 0.9779762793332338, "total_bits": 61536832, "q_proj": { "group_size": { @@ -33950,7 +33950,7 @@ } }, { - "accuracy": 0.9795938245952129, + "accuracy": 0.9795962031930685, "total_bits": 62354560, "q_proj": { "group_size": { @@ -34011,7 +34011,7 @@ } }, { - "accuracy": 0.9879280971363187, + "accuracy": 0.987911774776876, "total_bits": 75246880, "q_proj": { "group_size": { @@ -34072,7 +34072,7 @@ } }, { - "accuracy": 0.989773684181273, + "accuracy": 0.9897674126550555, "total_bits": 76510336, "q_proj": { "group_size": { @@ -34133,7 +34133,7 @@ } }, { - "accuracy": 0.9923741007223725, + "accuracy": 0.9923535925336182, "total_bits": 85667104, "q_proj": { "group_size": { @@ -34185,7 +34185,7 @@ } }, { - "accuracy": 0.9947892669588327, + "accuracy": 0.9947894560173154, "total_bits": 91722880, "q_proj": { "group_size": { @@ -34237,7 +34237,7 @@ } }, { - "accuracy": 0.99802085920237, + "accuracy": 0.998017291072756, "total_bits": 113978656, "q_proj": { "group_size": { @@ -34291,7 +34291,7 @@ ], "model.layers.17.mlp": [ { - "accuracy": 0.8820443674921989, + "accuracy": 0.8820276632905006, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -34343,7 +34343,7 @@ } }, { - "accuracy": 0.8866309821605682, + "accuracy": 0.8865934386849403, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -34395,7 +34395,7 @@ } }, { - "accuracy": 0.9031416177749634, + "accuracy": 0.9032439365983009, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -34444,7 +34444,7 @@ } }, { - "accuracy": 0.9086097851395607, + "accuracy": 0.9086964055895805, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -34493,7 +34493,7 @@ } }, { - "accuracy": 0.9407571367919445, + "accuracy": 0.9407499842345715, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -34545,7 +34545,7 @@ } }, { - "accuracy": 0.9456419833004475, + "accuracy": 0.9456696957349777, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -34597,7 +34597,7 @@ } }, { - "accuracy": 0.9527646824717522, + "accuracy": 0.952761884778738, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -34646,7 +34646,7 @@ } }, { - "accuracy": 0.9684986434876919, + "accuracy": 0.9684955701231956, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -34689,7 +34689,7 @@ } }, { - "accuracy": 0.9712209962308407, + "accuracy": 0.9712157864123583, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -34732,7 +34732,7 @@ } }, { - "accuracy": 0.969695445150137, + "accuracy": 0.969698378816247, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -34784,7 +34784,7 @@ } }, { - "accuracy": 0.973537739366293, + "accuracy": 0.9735384881496429, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -34836,7 +34836,7 @@ } }, { - "accuracy": 0.984518950805068, + "accuracy": 0.9845216348767281, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -34888,7 +34888,7 @@ } }, { - "accuracy": 0.9867853112518787, + "accuracy": 0.9867835436016321, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -34940,7 +34940,7 @@ } }, { - "accuracy": 0.991300848312676, + "accuracy": 0.9913051715120673, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -34983,7 +34983,7 @@ } }, { - "accuracy": 0.9920124607160687, + "accuracy": 0.9920066902413964, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -35032,7 +35032,7 @@ } }, { - "accuracy": 0.9935338972136378, + "accuracy": 0.9935281220823526, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -35078,7 +35078,7 @@ } }, { - "accuracy": 0.9976069342810661, + "accuracy": 0.9976056986488402, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -35120,7 +35120,7 @@ ], "model.layers.18.self_attn": [ { - "accuracy": 0.8961049765348434, + "accuracy": 0.895967960357666, "total_bits": 30308928, "q_proj": { "group_size": { @@ -35184,7 +35184,7 @@ } }, { - "accuracy": 0.9031495451927185, + "accuracy": 0.9031614512205124, "total_bits": 31455808, "q_proj": { "group_size": { @@ -35248,7 +35248,7 @@ } }, { - "accuracy": 0.915522888302803, + "accuracy": 0.9155553206801414, "total_bits": 33412832, "q_proj": { "group_size": { @@ -35312,7 +35312,7 @@ } }, { - "accuracy": 0.9396003894507885, + "accuracy": 0.9396803267300129, "total_bits": 37983200, "q_proj": { "group_size": { @@ -35376,7 +35376,7 @@ } }, { - "accuracy": 0.9481151774525642, + "accuracy": 0.9481409452855587, "total_bits": 44838176, "q_proj": { "group_size": { @@ -35440,7 +35440,7 @@ } }, { - "accuracy": 0.9490873701870441, + "accuracy": 0.9491141587495804, "total_bits": 44912768, "q_proj": { "group_size": { @@ -35504,7 +35504,7 @@ } }, { - "accuracy": 0.9702784214168787, + "accuracy": 0.9702505953609943, "total_bits": 57355552, "q_proj": { "group_size": { @@ -35556,7 +35556,7 @@ } }, { - "accuracy": 0.9712849836796522, + "accuracy": 0.9712676033377647, "total_bits": 57430144, "q_proj": { "group_size": { @@ -35608,7 +35608,7 @@ } }, { - "accuracy": 0.9733225014060736, + "accuracy": 0.9733318723738194, "total_bits": 57950464, "q_proj": { "group_size": { @@ -35660,7 +35660,7 @@ } }, { - "accuracy": 0.9746621809899807, + "accuracy": 0.9746661577373743, "total_bits": 58692736, "q_proj": { "group_size": { @@ -35712,7 +35712,7 @@ } }, { - "accuracy": 0.9740584716200829, + "accuracy": 0.9740777555853128, "total_bits": 59068544, "q_proj": { "group_size": { @@ -35776,7 +35776,7 @@ } }, { - "accuracy": 0.9757704772055149, + "accuracy": 0.975718442350626, "total_bits": 59588864, "q_proj": { "group_size": { @@ -35840,7 +35840,7 @@ } }, { - "accuracy": 0.9784729983657598, + "accuracy": 0.9784317370504141, "total_bits": 61536832, "q_proj": { "group_size": { @@ -35901,7 +35901,7 @@ } }, { - "accuracy": 0.9800199028104544, + "accuracy": 0.9800386726856232, "total_bits": 62354560, "q_proj": { "group_size": { @@ -35962,7 +35962,7 @@ } }, { - "accuracy": 0.9881230108439922, + "accuracy": 0.988131619989872, "total_bits": 75246880, "q_proj": { "group_size": { @@ -36023,7 +36023,7 @@ } }, { - "accuracy": 0.9899277659133077, + "accuracy": 0.9899393441155553, "total_bits": 76510336, "q_proj": { "group_size": { @@ -36084,7 +36084,7 @@ } }, { - "accuracy": 0.9922054400667548, + "accuracy": 0.9921957161277533, "total_bits": 85667104, "q_proj": { "group_size": { @@ -36136,7 +36136,7 @@ } }, { - "accuracy": 0.9948229189030826, + "accuracy": 0.994826287496835, "total_bits": 91722880, "q_proj": { "group_size": { @@ -36188,7 +36188,7 @@ } }, { - "accuracy": 0.9979508460965008, + "accuracy": 0.9979522456414998, "total_bits": 113978656, "q_proj": { "group_size": { @@ -36242,7 +36242,7 @@ ], "model.layers.18.mlp": [ { - "accuracy": 0.8908465802669525, + "accuracy": 0.890760600566864, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -36294,7 +36294,7 @@ } }, { - "accuracy": 0.8948191478848457, + "accuracy": 0.8948594033718109, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -36346,7 +36346,7 @@ } }, { - "accuracy": 0.9099691584706306, + "accuracy": 0.9100265651941299, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -36395,7 +36395,7 @@ } }, { - "accuracy": 0.9150631278753281, + "accuracy": 0.915120542049408, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -36444,7 +36444,7 @@ } }, { - "accuracy": 0.9450795240700245, + "accuracy": 0.9450446665287018, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -36496,7 +36496,7 @@ } }, { - "accuracy": 0.949484571814537, + "accuracy": 0.9494681656360626, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -36548,7 +36548,7 @@ } }, { - "accuracy": 0.9560906924307346, + "accuracy": 0.9560775049030781, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -36597,7 +36597,7 @@ } }, { - "accuracy": 0.9707168936729431, + "accuracy": 0.9707209877669811, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -36640,7 +36640,7 @@ } }, { - "accuracy": 0.9732743687927723, + "accuracy": 0.9732760544866323, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -36683,7 +36683,7 @@ } }, { - "accuracy": 0.9719167854636908, + "accuracy": 0.9719307515770197, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -36735,7 +36735,7 @@ } }, { - "accuracy": 0.9754060637205839, + "accuracy": 0.9753952287137508, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -36787,7 +36787,7 @@ } }, { - "accuracy": 0.9856863981112838, + "accuracy": 0.9856886547058821, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -36839,7 +36839,7 @@ } }, { - "accuracy": 0.9877114491537213, + "accuracy": 0.9877165118232369, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -36891,7 +36891,7 @@ } }, { - "accuracy": 0.9919731765985489, + "accuracy": 0.9919724566861987, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -36934,7 +36934,7 @@ } }, { - "accuracy": 0.9926252705045044, + "accuracy": 0.9926214762963355, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -36983,7 +36983,7 @@ } }, { - "accuracy": 0.9940348407253623, + "accuracy": 0.9940323028713465, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -37029,7 +37029,7 @@ } }, { - "accuracy": 0.9977936870418489, + "accuracy": 0.997793102869764, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -37071,7 +37071,7 @@ ], "model.layers.19.self_attn": [ { - "accuracy": 0.9066938832402229, + "accuracy": 0.9067771062254906, "total_bits": 30308928, "q_proj": { "group_size": { @@ -37135,7 +37135,7 @@ } }, { - "accuracy": 0.9125282913446426, + "accuracy": 0.9125330448150635, "total_bits": 31455808, "q_proj": { "group_size": { @@ -37199,7 +37199,7 @@ } }, { - "accuracy": 0.9224199429154396, + "accuracy": 0.9224216490983963, "total_bits": 33412832, "q_proj": { "group_size": { @@ -37263,7 +37263,7 @@ } }, { - "accuracy": 0.942340325564146, + "accuracy": 0.9422799944877625, "total_bits": 37983200, "q_proj": { "group_size": { @@ -37327,7 +37327,7 @@ } }, { - "accuracy": 0.9528491497039795, + "accuracy": 0.9527867995202541, "total_bits": 44838176, "q_proj": { "group_size": { @@ -37391,7 +37391,7 @@ } }, { - "accuracy": 0.9537361785769463, + "accuracy": 0.9536703340709209, "total_bits": 44912768, "q_proj": { "group_size": { @@ -37455,7 +37455,7 @@ } }, { - "accuracy": 0.9727440439164639, + "accuracy": 0.9727084040641785, "total_bits": 57355552, "q_proj": { "group_size": { @@ -37507,7 +37507,7 @@ } }, { - "accuracy": 0.9736681282520294, + "accuracy": 0.9736226126551628, "total_bits": 57430144, "q_proj": { "group_size": { @@ -37559,7 +37559,7 @@ } }, { - "accuracy": 0.9758165907114744, + "accuracy": 0.9758408833295107, "total_bits": 57950464, "q_proj": { "group_size": { @@ -37611,7 +37611,7 @@ } }, { - "accuracy": 0.9769553057849407, + "accuracy": 0.976946609094739, "total_bits": 58692736, "q_proj": { "group_size": { @@ -37663,7 +37663,7 @@ } }, { - "accuracy": 0.9764603525400162, + "accuracy": 0.9764624573290348, "total_bits": 59068544, "q_proj": { "group_size": { @@ -37727,7 +37727,7 @@ } }, { - "accuracy": 0.9781377725303173, + "accuracy": 0.9780647847801447, "total_bits": 59588864, "q_proj": { "group_size": { @@ -37791,7 +37791,7 @@ } }, { - "accuracy": 0.9803321305662394, + "accuracy": 0.9802794177085161, "total_bits": 61536832, "q_proj": { "group_size": { @@ -37852,7 +37852,7 @@ } }, { - "accuracy": 0.9818277545273304, + "accuracy": 0.9817991387099028, "total_bits": 62354560, "q_proj": { "group_size": { @@ -37913,7 +37913,7 @@ } }, { - "accuracy": 0.9891065321862698, + "accuracy": 0.9891098402440548, "total_bits": 75246880, "q_proj": { "group_size": { @@ -37974,7 +37974,7 @@ } }, { - "accuracy": 0.9908470399677753, + "accuracy": 0.9908483978360891, "total_bits": 76510336, "q_proj": { "group_size": { @@ -38035,7 +38035,7 @@ } }, { - "accuracy": 0.9929368873126805, + "accuracy": 0.9929364663548768, "total_bits": 85667104, "q_proj": { "group_size": { @@ -38087,7 +38087,7 @@ } }, { - "accuracy": 0.9951926521025598, + "accuracy": 0.9951782925054431, "total_bits": 91722880, "q_proj": { "group_size": { @@ -38139,7 +38139,7 @@ } }, { - "accuracy": 0.9981394049245864, + "accuracy": 0.9981401044642553, "total_bits": 113978656, "q_proj": { "group_size": { @@ -38193,7 +38193,7 @@ ], "model.layers.19.mlp": [ { - "accuracy": 0.898843489587307, + "accuracy": 0.8988735228776932, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -38245,7 +38245,7 @@ } }, { - "accuracy": 0.9021168202161789, + "accuracy": 0.9020884037017822, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -38297,7 +38297,7 @@ } }, { - "accuracy": 0.9158534109592438, + "accuracy": 0.9158180356025696, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -38346,7 +38346,7 @@ } }, { - "accuracy": 0.9202790409326553, + "accuracy": 0.9202406033873558, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -38395,7 +38395,7 @@ } }, { - "accuracy": 0.9486076608300209, + "accuracy": 0.9486297108232975, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -38447,7 +38447,7 @@ } }, { - "accuracy": 0.9527660310268402, + "accuracy": 0.9527538195252419, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -38499,7 +38499,7 @@ } }, { - "accuracy": 0.9588682539761066, + "accuracy": 0.9588394649326801, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -38548,7 +38548,7 @@ } }, { - "accuracy": 0.9728159811347723, + "accuracy": 0.9728188179433346, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -38591,7 +38591,7 @@ } }, { - "accuracy": 0.9751972481608391, + "accuracy": 0.9751956835389137, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -38634,7 +38634,7 @@ } }, { - "accuracy": 0.9737109690904617, + "accuracy": 0.9737076684832573, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -38686,7 +38686,7 @@ } }, { - "accuracy": 0.9769691210240126, + "accuracy": 0.976981945335865, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -38738,7 +38738,7 @@ } }, { - "accuracy": 0.986573307774961, + "accuracy": 0.9865698497742414, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -38790,7 +38790,7 @@ } }, { - "accuracy": 0.9884986458346248, + "accuracy": 0.9884996181353927, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -38842,7 +38842,7 @@ } }, { - "accuracy": 0.9925676062703133, + "accuracy": 0.9925639107823372, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -38885,7 +38885,7 @@ } }, { - "accuracy": 0.993094963952899, + "accuracy": 0.993094386998564, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -38934,7 +38934,7 @@ } }, { - "accuracy": 0.9943557516671717, + "accuracy": 0.9943572375923395, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -38980,7 +38980,7 @@ } }, { - "accuracy": 0.9979684855788946, + "accuracy": 0.9979692660272121, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -39022,7 +39022,7 @@ ], "model.layers.20.self_attn": [ { - "accuracy": 0.9254191517829895, + "accuracy": 0.9252974018454552, "total_bits": 30308928, "q_proj": { "group_size": { @@ -39086,7 +39086,7 @@ } }, { - "accuracy": 0.9304513037204742, + "accuracy": 0.9304210692644119, "total_bits": 31455808, "q_proj": { "group_size": { @@ -39150,7 +39150,7 @@ } }, { - "accuracy": 0.937650989741087, + "accuracy": 0.9376390874385834, "total_bits": 33412832, "q_proj": { "group_size": { @@ -39214,7 +39214,7 @@ } }, { - "accuracy": 0.9561277441680431, + "accuracy": 0.956094067543745, "total_bits": 37983200, "q_proj": { "group_size": { @@ -39278,7 +39278,7 @@ } }, { - "accuracy": 0.9629123508930206, + "accuracy": 0.9629477187991142, "total_bits": 44838176, "q_proj": { "group_size": { @@ -39342,7 +39342,7 @@ } }, { - "accuracy": 0.9635394588112831, + "accuracy": 0.9635471068322659, "total_bits": 44912768, "q_proj": { "group_size": { @@ -39406,7 +39406,7 @@ } }, { - "accuracy": 0.9784403182566166, + "accuracy": 0.9784409739077091, "total_bits": 57355552, "q_proj": { "group_size": { @@ -39458,7 +39458,7 @@ } }, { - "accuracy": 0.9791186898946762, + "accuracy": 0.9791207388043404, "total_bits": 57430144, "q_proj": { "group_size": { @@ -39510,7 +39510,7 @@ } }, { - "accuracy": 0.9805207420140505, + "accuracy": 0.9805529490113258, "total_bits": 57950464, "q_proj": { "group_size": { @@ -39562,7 +39562,7 @@ } }, { - "accuracy": 0.981576981022954, + "accuracy": 0.9815756008028984, "total_bits": 58692736, "q_proj": { "group_size": { @@ -39614,7 +39614,7 @@ } }, { - "accuracy": 0.9814564771950245, + "accuracy": 0.981438597664237, "total_bits": 59068544, "q_proj": { "group_size": { @@ -39678,7 +39678,7 @@ } }, { - "accuracy": 0.9826366528868675, + "accuracy": 0.9826178383082151, "total_bits": 59588864, "q_proj": { "group_size": { @@ -39742,7 +39742,7 @@ } }, { - "accuracy": 0.9840204436331987, + "accuracy": 0.9840060472488403, "total_bits": 61536832, "q_proj": { "group_size": { @@ -39803,7 +39803,7 @@ } }, { - "accuracy": 0.9851696165278554, + "accuracy": 0.9851967319846153, "total_bits": 62354560, "q_proj": { "group_size": { @@ -39864,7 +39864,7 @@ } }, { - "accuracy": 0.9912118604406714, + "accuracy": 0.99119614623487, "total_bits": 75246880, "q_proj": { "group_size": { @@ -39925,7 +39925,7 @@ } }, { - "accuracy": 0.9925604872405529, + "accuracy": 0.992552753072232, "total_bits": 76510336, "q_proj": { "group_size": { @@ -39986,7 +39986,7 @@ } }, { - "accuracy": 0.9943439392372966, + "accuracy": 0.9943421361967921, "total_bits": 85667104, "q_proj": { "group_size": { @@ -40038,7 +40038,7 @@ } }, { - "accuracy": 0.9961527525447309, + "accuracy": 0.996142350602895, "total_bits": 91722880, "q_proj": { "group_size": { @@ -40090,7 +40090,7 @@ } }, { - "accuracy": 0.9985169863793999, + "accuracy": 0.9985177288763225, "total_bits": 113978656, "q_proj": { "group_size": { @@ -40144,7 +40144,7 @@ ], "model.layers.20.mlp": [ { - "accuracy": 0.9078842997550964, + "accuracy": 0.9078511148691177, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -40196,7 +40196,7 @@ } }, { - "accuracy": 0.9108857437968254, + "accuracy": 0.9108638241887093, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -40248,7 +40248,7 @@ } }, { - "accuracy": 0.9233747720718384, + "accuracy": 0.9233528077602386, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -40297,7 +40297,7 @@ } }, { - "accuracy": 0.927286222577095, + "accuracy": 0.9272778257727623, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -40346,7 +40346,7 @@ } }, { - "accuracy": 0.9533279724419117, + "accuracy": 0.9533239230513573, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -40398,7 +40398,7 @@ } }, { - "accuracy": 0.9570191614329815, + "accuracy": 0.9570236355066299, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -40450,7 +40450,7 @@ } }, { - "accuracy": 0.9625181145966053, + "accuracy": 0.962521106004715, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -40499,7 +40499,7 @@ } }, { - "accuracy": 0.9753356482833624, + "accuracy": 0.9753350578248501, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -40542,7 +40542,7 @@ } }, { - "accuracy": 0.977478351444006, + "accuracy": 0.9774747285991907, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -40585,7 +40585,7 @@ } }, { - "accuracy": 0.9761522505432367, + "accuracy": 0.9761437401175499, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -40637,7 +40637,7 @@ } }, { - "accuracy": 0.9790751449763775, + "accuracy": 0.9790640287101269, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -40689,7 +40689,7 @@ } }, { - "accuracy": 0.9878394166007638, + "accuracy": 0.9878420624881983, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -40741,7 +40741,7 @@ } }, { - "accuracy": 0.9895561756566167, + "accuracy": 0.9895521271973848, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -40793,7 +40793,7 @@ } }, { - "accuracy": 0.9932784507982433, + "accuracy": 0.993278375826776, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -40836,7 +40836,7 @@ } }, { - "accuracy": 0.9937723437324166, + "accuracy": 0.9937705183401704, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -40885,7 +40885,7 @@ } }, { - "accuracy": 0.9949068506248295, + "accuracy": 0.9949048236012459, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -40931,7 +40931,7 @@ } }, { - "accuracy": 0.9981734347529709, + "accuracy": 0.9981726757250726, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -40973,7 +40973,7 @@ ], "model.layers.21.self_attn": [ { - "accuracy": 0.9116751402616501, + "accuracy": 0.9116267189383507, "total_bits": 30308928, "q_proj": { "group_size": { @@ -41037,7 +41037,7 @@ } }, { - "accuracy": 0.9161897599697113, + "accuracy": 0.9161302745342255, "total_bits": 31455808, "q_proj": { "group_size": { @@ -41101,7 +41101,7 @@ } }, { - "accuracy": 0.9299630001187325, + "accuracy": 0.9298892468214035, "total_bits": 33412832, "q_proj": { "group_size": { @@ -41165,7 +41165,7 @@ } }, { - "accuracy": 0.951121561229229, + "accuracy": 0.951112475246191, "total_bits": 37983200, "q_proj": { "group_size": { @@ -41229,7 +41229,7 @@ } }, { - "accuracy": 0.9554766491055489, + "accuracy": 0.9555105529725552, "total_bits": 44838176, "q_proj": { "group_size": { @@ -41293,7 +41293,7 @@ } }, { - "accuracy": 0.9563397578895092, + "accuracy": 0.9563395045697689, "total_bits": 44912768, "q_proj": { "group_size": { @@ -41357,7 +41357,7 @@ } }, { - "accuracy": 0.9752995986491442, + "accuracy": 0.9753066599369049, "total_bits": 57355552, "q_proj": { "group_size": { @@ -41409,7 +41409,7 @@ } }, { - "accuracy": 0.976159306243062, + "accuracy": 0.9761861730366945, "total_bits": 57430144, "q_proj": { "group_size": { @@ -41461,7 +41461,7 @@ } }, { - "accuracy": 0.9777697827666998, + "accuracy": 0.9777861218899488, "total_bits": 57950464, "q_proj": { "group_size": { @@ -41513,7 +41513,7 @@ } }, { - "accuracy": 0.9786687269806862, + "accuracy": 0.9786933194845915, "total_bits": 58692736, "q_proj": { "group_size": { @@ -41565,7 +41565,7 @@ } }, { - "accuracy": 0.9778354410082102, + "accuracy": 0.9778481628745794, "total_bits": 59068544, "q_proj": { "group_size": { @@ -41629,7 +41629,7 @@ } }, { - "accuracy": 0.9793091975152493, + "accuracy": 0.9793014619499445, "total_bits": 59588864, "q_proj": { "group_size": { @@ -41693,7 +41693,7 @@ } }, { - "accuracy": 0.9823502618819475, + "accuracy": 0.9823220800608397, "total_bits": 61536832, "q_proj": { "group_size": { @@ -41754,7 +41754,7 @@ } }, { - "accuracy": 0.9835798889398575, + "accuracy": 0.9835791904479265, "total_bits": 62354560, "q_proj": { "group_size": { @@ -41815,7 +41815,7 @@ } }, { - "accuracy": 0.9903135802596807, + "accuracy": 0.9903201386332512, "total_bits": 75246880, "q_proj": { "group_size": { @@ -41876,7 +41876,7 @@ } }, { - "accuracy": 0.9917551334947348, + "accuracy": 0.9917648062109947, "total_bits": 76510336, "q_proj": { "group_size": { @@ -41937,7 +41937,7 @@ } }, { - "accuracy": 0.993569896556437, + "accuracy": 0.9935718071646988, "total_bits": 85667104, "q_proj": { "group_size": { @@ -41989,7 +41989,7 @@ } }, { - "accuracy": 0.9958970271982253, + "accuracy": 0.995899414177984, "total_bits": 91722880, "q_proj": { "group_size": { @@ -42041,7 +42041,7 @@ } }, { - "accuracy": 0.9983291744720191, + "accuracy": 0.9983296216232702, "total_bits": 113978656, "q_proj": { "group_size": { @@ -42095,7 +42095,7 @@ ], "model.layers.21.mlp": [ { - "accuracy": 0.9132195189595222, + "accuracy": 0.9132231697440147, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -42147,7 +42147,7 @@ } }, { - "accuracy": 0.9158970862627029, + "accuracy": 0.9158701747655869, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -42199,7 +42199,7 @@ } }, { - "accuracy": 0.9271287769079208, + "accuracy": 0.9270192459225655, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -42248,7 +42248,7 @@ } }, { - "accuracy": 0.9307196065783501, + "accuracy": 0.9306086674332619, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -42297,7 +42297,7 @@ } }, { - "accuracy": 0.955941203981638, + "accuracy": 0.9559643566608429, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -42349,7 +42349,7 @@ } }, { - "accuracy": 0.9593969620764256, + "accuracy": 0.9593847468495369, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -42401,7 +42401,7 @@ } }, { - "accuracy": 0.9644332267343998, + "accuracy": 0.9644359201192856, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -42450,7 +42450,7 @@ } }, { - "accuracy": 0.9767589289695024, + "accuracy": 0.9767424874007702, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -42493,7 +42493,7 @@ } }, { - "accuracy": 0.9787649121135473, + "accuracy": 0.9787469636648893, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -42536,7 +42536,7 @@ } }, { - "accuracy": 0.9774891547858715, + "accuracy": 0.9774995297193527, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -42588,7 +42588,7 @@ } }, { - "accuracy": 0.9802252352237701, + "accuracy": 0.9802324343472719, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -42640,7 +42640,7 @@ } }, { - "accuracy": 0.9885327704250813, + "accuracy": 0.9885260602459311, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -42692,7 +42692,7 @@ } }, { - "accuracy": 0.9901311350986362, + "accuracy": 0.9901291783899069, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -42744,7 +42744,7 @@ } }, { - "accuracy": 0.9936433634720743, + "accuracy": 0.9936425597406924, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -42787,7 +42787,7 @@ } }, { - "accuracy": 0.9941183044575155, + "accuracy": 0.9941207375377417, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -42836,7 +42836,7 @@ } }, { - "accuracy": 0.995133682154119, + "accuracy": 0.9951349799521267, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -42882,7 +42882,7 @@ } }, { - "accuracy": 0.9982258901000023, + "accuracy": 0.9982257036026567, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -42924,7 +42924,7 @@ ], "model.layers.22.self_attn": [ { - "accuracy": 0.8600220680236816, + "accuracy": 0.8604224324226379, "total_bits": 30308928, "q_proj": { "group_size": { @@ -42988,7 +42988,7 @@ } }, { - "accuracy": 0.8723062872886658, + "accuracy": 0.8720817565917969, "total_bits": 31455808, "q_proj": { "group_size": { @@ -43052,7 +43052,7 @@ } }, { - "accuracy": 0.8845950290560722, + "accuracy": 0.8842579200863838, "total_bits": 33412832, "q_proj": { "group_size": { @@ -43116,7 +43116,7 @@ } }, { - "accuracy": 0.9110095426440239, + "accuracy": 0.9107557758688927, "total_bits": 37983200, "q_proj": { "group_size": { @@ -43180,7 +43180,7 @@ } }, { - "accuracy": 0.9318739250302315, + "accuracy": 0.9317922592163086, "total_bits": 44838176, "q_proj": { "group_size": { @@ -43244,7 +43244,7 @@ } }, { - "accuracy": 0.9331164434552193, + "accuracy": 0.933014988899231, "total_bits": 44912768, "q_proj": { "group_size": { @@ -43308,7 +43308,7 @@ } }, { - "accuracy": 0.9576672576367855, + "accuracy": 0.9576846696436405, "total_bits": 57355552, "q_proj": { "group_size": { @@ -43360,7 +43360,7 @@ } }, { - "accuracy": 0.9591643884778023, + "accuracy": 0.9591707922518253, "total_bits": 57430144, "q_proj": { "group_size": { @@ -43412,7 +43412,7 @@ } }, { - "accuracy": 0.9620198979973793, + "accuracy": 0.9620674923062325, "total_bits": 57950464, "q_proj": { "group_size": { @@ -43464,7 +43464,7 @@ } }, { - "accuracy": 0.9642005227506161, + "accuracy": 0.9641453549265862, "total_bits": 58692736, "q_proj": { "group_size": { @@ -43516,7 +43516,7 @@ } }, { - "accuracy": 0.9660037606954575, + "accuracy": 0.9659963771700859, "total_bits": 59068544, "q_proj": { "group_size": { @@ -43580,7 +43580,7 @@ } }, { - "accuracy": 0.968350138515234, + "accuracy": 0.9683596417307854, "total_bits": 59588864, "q_proj": { "group_size": { @@ -43644,7 +43644,7 @@ } }, { - "accuracy": 0.9704683814197779, + "accuracy": 0.970446715131402, "total_bits": 61536832, "q_proj": { "group_size": { @@ -43705,7 +43705,7 @@ } }, { - "accuracy": 0.9727780558168888, + "accuracy": 0.9728066977113485, "total_bits": 62354560, "q_proj": { "group_size": { @@ -43766,7 +43766,7 @@ } }, { - "accuracy": 0.9837654158473015, + "accuracy": 0.9837965164333582, "total_bits": 75246880, "q_proj": { "group_size": { @@ -43827,7 +43827,7 @@ } }, { - "accuracy": 0.9864024138078094, + "accuracy": 0.9864012431353331, "total_bits": 76510336, "q_proj": { "group_size": { @@ -43888,7 +43888,7 @@ } }, { - "accuracy": 0.988879844546318, + "accuracy": 0.9888947391882539, "total_bits": 85667104, "q_proj": { "group_size": { @@ -43940,7 +43940,7 @@ } }, { - "accuracy": 0.9924624958075583, + "accuracy": 0.9924732316285372, "total_bits": 91722880, "q_proj": { "group_size": { @@ -43992,7 +43992,7 @@ } }, { - "accuracy": 0.9970627035945654, + "accuracy": 0.997059682616964, "total_bits": 113978656, "q_proj": { "group_size": { @@ -44046,7 +44046,7 @@ ], "model.layers.22.mlp": [ { - "accuracy": 0.9158392548561096, + "accuracy": 0.9158530607819557, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -44098,7 +44098,7 @@ } }, { - "accuracy": 0.9184657260775566, + "accuracy": 0.9185132682323456, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -44150,7 +44150,7 @@ } }, { - "accuracy": 0.9284176975488663, + "accuracy": 0.9284360781311989, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -44199,7 +44199,7 @@ } }, { - "accuracy": 0.9315355196595192, + "accuracy": 0.9315476194024086, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -44248,7 +44248,7 @@ } }, { - "accuracy": 0.9572760388255119, + "accuracy": 0.9572666324675083, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -44300,7 +44300,7 @@ } }, { - "accuracy": 0.9605343677103519, + "accuracy": 0.9605594612658024, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -44352,7 +44352,7 @@ } }, { - "accuracy": 0.9649710729718208, + "accuracy": 0.9650028869509697, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -44401,7 +44401,7 @@ } }, { - "accuracy": 0.9774835146963596, + "accuracy": 0.9774914421141148, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -44444,7 +44444,7 @@ } }, { - "accuracy": 0.9793780688196421, + "accuracy": 0.9793844223022461, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -44487,7 +44487,7 @@ } }, { - "accuracy": 0.9781624637544155, + "accuracy": 0.9781443998217583, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -44539,7 +44539,7 @@ } }, { - "accuracy": 0.9807386361062527, + "accuracy": 0.9807199090719223, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -44591,7 +44591,7 @@ } }, { - "accuracy": 0.988841949030757, + "accuracy": 0.9888424472883344, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -44643,7 +44643,7 @@ } }, { - "accuracy": 0.9903620686382055, + "accuracy": 0.9903717981651425, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -44695,7 +44695,7 @@ } }, { - "accuracy": 0.9938594889827073, + "accuracy": 0.9938576300628483, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -44738,7 +44738,7 @@ } }, { - "accuracy": 0.9942582775838673, + "accuracy": 0.994258991908282, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -44787,7 +44787,7 @@ } }, { - "accuracy": 0.9951435467228293, + "accuracy": 0.9951435327529907, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -44833,7 +44833,7 @@ } }, { - "accuracy": 0.9983168488834053, + "accuracy": 0.9983171256026253, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -44875,7 +44875,7 @@ ], "model.layers.23.self_attn": [ { - "accuracy": 0.9002235606312752, + "accuracy": 0.9000980034470558, "total_bits": 30308928, "q_proj": { "group_size": { @@ -44939,7 +44939,7 @@ } }, { - "accuracy": 0.9065486118197441, + "accuracy": 0.9066225737333298, "total_bits": 31455808, "q_proj": { "group_size": { @@ -45003,7 +45003,7 @@ } }, { - "accuracy": 0.918041318655014, + "accuracy": 0.9180461913347244, "total_bits": 33412832, "q_proj": { "group_size": { @@ -45067,7 +45067,7 @@ } }, { - "accuracy": 0.9384324066340923, + "accuracy": 0.9384226053953171, "total_bits": 37983200, "q_proj": { "group_size": { @@ -45131,7 +45131,7 @@ } }, { - "accuracy": 0.9503814466297626, + "accuracy": 0.950372826308012, "total_bits": 44838176, "q_proj": { "group_size": { @@ -45195,7 +45195,7 @@ } }, { - "accuracy": 0.9512348845601082, + "accuracy": 0.9512467607855797, "total_bits": 44912768, "q_proj": { "group_size": { @@ -45259,7 +45259,7 @@ } }, { - "accuracy": 0.970819503068924, + "accuracy": 0.9708252772688866, "total_bits": 57355552, "q_proj": { "group_size": { @@ -45311,7 +45311,7 @@ } }, { - "accuracy": 0.9717874713242054, + "accuracy": 0.9717806540429592, "total_bits": 57430144, "q_proj": { "group_size": { @@ -45363,7 +45363,7 @@ } }, { - "accuracy": 0.9738185089081526, + "accuracy": 0.9737685434520245, "total_bits": 57950464, "q_proj": { "group_size": { @@ -45415,7 +45415,7 @@ } }, { - "accuracy": 0.9751602187752724, + "accuracy": 0.9751146398484707, "total_bits": 58692736, "q_proj": { "group_size": { @@ -45467,7 +45467,7 @@ } }, { - "accuracy": 0.9751874227076769, + "accuracy": 0.9751594942063093, "total_bits": 59068544, "q_proj": { "group_size": { @@ -45531,7 +45531,7 @@ } }, { - "accuracy": 0.9768790081143379, + "accuracy": 0.9768443964421749, "total_bits": 59588864, "q_proj": { "group_size": { @@ -45595,7 +45595,7 @@ } }, { - "accuracy": 0.9792286064475775, + "accuracy": 0.9791899565607309, "total_bits": 61536832, "q_proj": { "group_size": { @@ -45656,7 +45656,7 @@ } }, { - "accuracy": 0.9807712472975254, + "accuracy": 0.9807248823344707, "total_bits": 62354560, "q_proj": { "group_size": { @@ -45717,7 +45717,7 @@ } }, { - "accuracy": 0.9885837156325579, + "accuracy": 0.98859893810004, "total_bits": 75246880, "q_proj": { "group_size": { @@ -45778,7 +45778,7 @@ } }, { - "accuracy": 0.9903419725596905, + "accuracy": 0.9903517542406917, "total_bits": 76510336, "q_proj": { "group_size": { @@ -45839,7 +45839,7 @@ } }, { - "accuracy": 0.9923813547939062, + "accuracy": 0.9923766339197755, "total_bits": 85667104, "q_proj": { "group_size": { @@ -45891,7 +45891,7 @@ } }, { - "accuracy": 0.9948961278423667, + "accuracy": 0.9948966847732663, "total_bits": 91722880, "q_proj": { "group_size": { @@ -45943,7 +45943,7 @@ } }, { - "accuracy": 0.9980002944357693, + "accuracy": 0.9980048832949251, "total_bits": 113978656, "q_proj": { "group_size": { @@ -45997,7 +45997,7 @@ ], "model.layers.23.mlp": [ { - "accuracy": 0.9183400496840477, + "accuracy": 0.9182481989264488, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -46049,7 +46049,7 @@ } }, { - "accuracy": 0.9207602441310883, + "accuracy": 0.9207983389496803, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -46101,7 +46101,7 @@ } }, { - "accuracy": 0.9304101318120956, + "accuracy": 0.9304468557238579, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -46150,7 +46150,7 @@ } }, { - "accuracy": 0.9335396587848663, + "accuracy": 0.9335753992199898, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -46199,7 +46199,7 @@ } }, { - "accuracy": 0.95809031650424, + "accuracy": 0.9580657295882702, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -46251,7 +46251,7 @@ } }, { - "accuracy": 0.9615879841148853, + "accuracy": 0.9615712836384773, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -46303,7 +46303,7 @@ } }, { - "accuracy": 0.9659944400191307, + "accuracy": 0.9659555852413177, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -46352,7 +46352,7 @@ } }, { - "accuracy": 0.9778957311064005, + "accuracy": 0.9778776671737432, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -46395,7 +46395,7 @@ } }, { - "accuracy": 0.9797942880541086, + "accuracy": 0.9797797352075577, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -46438,7 +46438,7 @@ } }, { - "accuracy": 0.9784904830157757, + "accuracy": 0.9784805551171303, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -46490,7 +46490,7 @@ } }, { - "accuracy": 0.9812441393733025, + "accuracy": 0.9812456294894218, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -46542,7 +46542,7 @@ } }, { - "accuracy": 0.9889877140522003, + "accuracy": 0.9889850988984108, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -46594,7 +46594,7 @@ } }, { - "accuracy": 0.9906198102980852, + "accuracy": 0.9906222112476826, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -46646,7 +46646,7 @@ } }, { - "accuracy": 0.9938806621357799, + "accuracy": 0.9938766132108867, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -46689,7 +46689,7 @@ } }, { - "accuracy": 0.9943293896503747, + "accuracy": 0.9943245043978095, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -46738,7 +46738,7 @@ } }, { - "accuracy": 0.9952116911299527, + "accuracy": 0.9952051844447851, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -46784,7 +46784,7 @@ } }, { - "accuracy": 0.9983016916085035, + "accuracy": 0.9983023661188781, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -46826,7 +46826,7 @@ ], "model.layers.24.self_attn": [ { - "accuracy": 0.9000411629676819, + "accuracy": 0.9000758603215218, "total_bits": 30308928, "q_proj": { "group_size": { @@ -46890,7 +46890,7 @@ } }, { - "accuracy": 0.9092481806874275, + "accuracy": 0.9089899435639381, "total_bits": 31455808, "q_proj": { "group_size": { @@ -46954,7 +46954,7 @@ } }, { - "accuracy": 0.9228631407022476, + "accuracy": 0.9227519929409027, "total_bits": 33412832, "q_proj": { "group_size": { @@ -47018,7 +47018,7 @@ } }, { - "accuracy": 0.9451075606048107, + "accuracy": 0.9450107850134373, "total_bits": 37983200, "q_proj": { "group_size": { @@ -47082,7 +47082,7 @@ } }, { - "accuracy": 0.9511439241468906, + "accuracy": 0.9511034078896046, "total_bits": 44838176, "q_proj": { "group_size": { @@ -47146,7 +47146,7 @@ } }, { - "accuracy": 0.9521462395787239, + "accuracy": 0.9521391801536083, "total_bits": 44912768, "q_proj": { "group_size": { @@ -47210,7 +47210,7 @@ } }, { - "accuracy": 0.9704149011522532, + "accuracy": 0.9703994449228048, "total_bits": 57355552, "q_proj": { "group_size": { @@ -47262,7 +47262,7 @@ } }, { - "accuracy": 0.9715412594377995, + "accuracy": 0.9715345222502947, "total_bits": 57430144, "q_proj": { "group_size": { @@ -47314,7 +47314,7 @@ } }, { - "accuracy": 0.9736700374633074, + "accuracy": 0.9736871141940355, "total_bits": 57950464, "q_proj": { "group_size": { @@ -47366,7 +47366,7 @@ } }, { - "accuracy": 0.9749877713620663, + "accuracy": 0.9749988541007042, "total_bits": 58692736, "q_proj": { "group_size": { @@ -47418,7 +47418,7 @@ } }, { - "accuracy": 0.9757188335061073, + "accuracy": 0.9757179487496614, "total_bits": 59068544, "q_proj": { "group_size": { @@ -47482,7 +47482,7 @@ } }, { - "accuracy": 0.9774507116526365, + "accuracy": 0.9774703308939934, "total_bits": 59588864, "q_proj": { "group_size": { @@ -47546,7 +47546,7 @@ } }, { - "accuracy": 0.9802383426576853, + "accuracy": 0.9802435729652643, "total_bits": 61536832, "q_proj": { "group_size": { @@ -47607,7 +47607,7 @@ } }, { - "accuracy": 0.9814821984618902, + "accuracy": 0.9814784899353981, "total_bits": 62354560, "q_proj": { "group_size": { @@ -47668,7 +47668,7 @@ } }, { - "accuracy": 0.9890236798673868, + "accuracy": 0.9890194535255432, "total_bits": 75246880, "q_proj": { "group_size": { @@ -47729,7 +47729,7 @@ } }, { - "accuracy": 0.9906842615455389, + "accuracy": 0.9906802931800485, "total_bits": 76510336, "q_proj": { "group_size": { @@ -47790,7 +47790,7 @@ } }, { - "accuracy": 0.9923012899234891, + "accuracy": 0.992301972117275, "total_bits": 85667104, "q_proj": { "group_size": { @@ -47842,7 +47842,7 @@ } }, { - "accuracy": 0.9948786222375929, + "accuracy": 0.9948805985040963, "total_bits": 91722880, "q_proj": { "group_size": { @@ -47894,7 +47894,7 @@ } }, { - "accuracy": 0.997995373327285, + "accuracy": 0.9979949889238924, "total_bits": 113978656, "q_proj": { "group_size": { @@ -47948,7 +47948,7 @@ ], "model.layers.24.mlp": [ { - "accuracy": 0.92559964209795, + "accuracy": 0.9256472215056419, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -48000,7 +48000,7 @@ } }, { - "accuracy": 0.9278130382299423, + "accuracy": 0.9277902320027351, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -48052,7 +48052,7 @@ } }, { - "accuracy": 0.9358445852994919, + "accuracy": 0.9358237609267235, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -48101,7 +48101,7 @@ } }, { - "accuracy": 0.9386767745018005, + "accuracy": 0.9386411532759666, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -48150,7 +48150,7 @@ } }, { - "accuracy": 0.9618233405053616, + "accuracy": 0.9618184603750706, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -48202,7 +48202,7 @@ } }, { - "accuracy": 0.9650960303843021, + "accuracy": 0.9650743305683136, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -48254,7 +48254,7 @@ } }, { - "accuracy": 0.9686915799975395, + "accuracy": 0.9686741307377815, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -48303,7 +48303,7 @@ } }, { - "accuracy": 0.9795693270862103, + "accuracy": 0.9795593917369843, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -48346,7 +48346,7 @@ } }, { - "accuracy": 0.9815245009958744, + "accuracy": 0.9815181270241737, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -48389,7 +48389,7 @@ } }, { - "accuracy": 0.9804772697389126, + "accuracy": 0.9804782513529062, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -48441,7 +48441,7 @@ } }, { - "accuracy": 0.982961056753993, + "accuracy": 0.9829648770391941, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -48493,7 +48493,7 @@ } }, { - "accuracy": 0.9900317844003439, + "accuracy": 0.9900405630469322, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -48545,7 +48545,7 @@ } }, { - "accuracy": 0.9914947487413883, + "accuracy": 0.9914911538362503, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -48597,7 +48597,7 @@ } }, { - "accuracy": 0.994380182120949, + "accuracy": 0.9943781793117523, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -48640,7 +48640,7 @@ } }, { - "accuracy": 0.9948879033327103, + "accuracy": 0.9948839037679136, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -48689,7 +48689,7 @@ } }, { - "accuracy": 0.9956484977155924, + "accuracy": 0.9956428701989353, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -48735,7 +48735,7 @@ } }, { - "accuracy": 0.9983874682802707, + "accuracy": 0.9983870283467695, "total_bits": 512046144, "gate_proj": { "group_size": { @@ -48777,7 +48777,7 @@ ], "model.layers.25.self_attn": [ { - "accuracy": 0.9237724244594574, + "accuracy": 0.923765018582344, "total_bits": 30308928, "q_proj": { "group_size": { @@ -48841,7 +48841,7 @@ } }, { - "accuracy": 0.9273674637079239, + "accuracy": 0.9273531660437584, "total_bits": 31455808, "q_proj": { "group_size": { @@ -48905,7 +48905,7 @@ } }, { - "accuracy": 0.9392730295658112, + "accuracy": 0.9392255060374737, "total_bits": 33412832, "q_proj": { "group_size": { @@ -48969,7 +48969,7 @@ } }, { - "accuracy": 0.9596496224403381, + "accuracy": 0.9596178978681564, "total_bits": 37983200, "q_proj": { "group_size": { @@ -49033,7 +49033,7 @@ } }, { - "accuracy": 0.9613975808024406, + "accuracy": 0.9613914974033833, "total_bits": 44838176, "q_proj": { "group_size": { @@ -49097,7 +49097,7 @@ } }, { - "accuracy": 0.9620046243071556, + "accuracy": 0.962019756436348, "total_bits": 44912768, "q_proj": { "group_size": { @@ -49161,7 +49161,7 @@ } }, { - "accuracy": 0.9788154270499945, + "accuracy": 0.9787868969142437, "total_bits": 57355552, "q_proj": { "group_size": { @@ -49213,7 +49213,7 @@ } }, { - "accuracy": 0.9793564602732658, + "accuracy": 0.9793211314827204, "total_bits": 57430144, "q_proj": { "group_size": { @@ -49265,7 +49265,7 @@ } }, { - "accuracy": 0.980896295979619, + "accuracy": 0.9808873273432255, "total_bits": 57950464, "q_proj": { "group_size": { @@ -49317,7 +49317,7 @@ } }, { - "accuracy": 0.9818288143724203, + "accuracy": 0.9818263165652752, "total_bits": 58692736, "q_proj": { "group_size": { @@ -49369,7 +49369,7 @@ } }, { - "accuracy": 0.9807142727077007, + "accuracy": 0.9806932359933853, "total_bits": 59068544, "q_proj": { "group_size": { @@ -49433,7 +49433,7 @@ } }, { - "accuracy": 0.9820475969463587, + "accuracy": 0.9820628892630339, "total_bits": 59588864, "q_proj": { "group_size": { @@ -49497,7 +49497,7 @@ } }, { - "accuracy": 0.9845238020643592, + "accuracy": 0.9845330221578479, "total_bits": 61536832, "q_proj": { "group_size": { @@ -49558,7 +49558,7 @@ } }, { - "accuracy": 0.9857827695086598, + "accuracy": 0.9857928091660142, "total_bits": 62354560, "q_proj": { "group_size": { @@ -49619,7 +49619,7 @@ } }, { - "accuracy": 0.9914994724094868, + "accuracy": 0.9915020493790507, "total_bits": 75246880, "q_proj": { "group_size": { @@ -49680,7 +49680,7 @@ } }, { - "accuracy": 0.9928717431612313, + "accuracy": 0.9928759732283652, "total_bits": 76510336, "q_proj": { "group_size": { @@ -49741,7 +49741,7 @@ } }, { - "accuracy": 0.9944902677088976, + "accuracy": 0.9944881168194115, "total_bits": 85667104, "q_proj": { "group_size": { @@ -49793,7 +49793,7 @@ } }, { - "accuracy": 0.9964965777471662, + "accuracy": 0.9964962496887892, "total_bits": 91722880, "q_proj": { "group_size": { @@ -49845,7 +49845,7 @@ } }, { - "accuracy": 0.9985775835812092, + "accuracy": 0.998579174396582, "total_bits": 113978656, "q_proj": { "group_size": { @@ -49899,7 +49899,7 @@ ], "model.layers.25.mlp": [ { - "accuracy": 0.9394260719418526, + "accuracy": 0.9394301772117615, "total_bits": 142969344, "gate_proj": { "group_size": { @@ -49951,7 +49951,7 @@ } }, { - "accuracy": 0.9412130787968636, + "accuracy": 0.9411459490656853, "total_bits": 148277760, "gate_proj": { "group_size": { @@ -50003,7 +50003,7 @@ } }, { - "accuracy": 0.9476935565471649, + "accuracy": 0.9477050378918648, "total_bits": 165462912, "gate_proj": { "group_size": { @@ -50052,7 +50052,7 @@ } }, { - "accuracy": 0.9500809907913208, + "accuracy": 0.9500880539417267, "total_bits": 185590656, "gate_proj": { "group_size": { @@ -50101,7 +50101,7 @@ } }, { - "accuracy": 0.9688832182437181, + "accuracy": 0.96889528632164, "total_bits": 209798784, "gate_proj": { "group_size": { @@ -50153,7 +50153,7 @@ } }, { - "accuracy": 0.9714504927396774, + "accuracy": 0.9714055731892586, "total_bits": 214864128, "gate_proj": { "group_size": { @@ -50205,7 +50205,7 @@ } }, { - "accuracy": 0.9744708389043808, + "accuracy": 0.9744217358529568, "total_bits": 230963904, "gate_proj": { "group_size": { @@ -50254,7 +50254,7 @@ } }, { - "accuracy": 0.9832967892289162, + "accuracy": 0.9833166711032391, "total_bits": 263770272, "gate_proj": { "group_size": { @@ -50297,7 +50297,7 @@ } }, { - "accuracy": 0.9849021304398775, + "accuracy": 0.9849346242845058, "total_bits": 267653376, "gate_proj": { "group_size": { @@ -50340,7 +50340,7 @@ } }, { - "accuracy": 0.9840464647859335, + "accuracy": 0.9840444251894951, "total_bits": 272393856, "gate_proj": { "group_size": { @@ -50392,7 +50392,7 @@ } }, { - "accuracy": 0.9860300803557038, + "accuracy": 0.9860321069136262, "total_bits": 277459200, "gate_proj": { "group_size": { @@ -50444,7 +50444,7 @@ } }, { - "accuracy": 0.9918431174010038, + "accuracy": 0.9918465595692396, "total_bits": 334988928, "gate_proj": { "group_size": { @@ -50496,7 +50496,7 @@ } }, { - "accuracy": 0.9930016789585352, + "accuracy": 0.9929989366792142, "total_bits": 340054272, "gate_proj": { "group_size": { @@ -50548,7 +50548,7 @@ } }, { - "accuracy": 0.9954412854276597, + "accuracy": 0.9954434814862907, "total_bits": 386967168, "gate_proj": { "group_size": { @@ -50591,7 +50591,7 @@ } }, { - "accuracy": 0.9958284390158951, + "accuracy": 0.9958340055309236, "total_bits": 400569408, "gate_proj": { "group_size": { @@ -50640,7 +50640,7 @@ } }, { - "accuracy": 0.9965037242509425, + "accuracy": 0.9965090290643275, "total_bits": 436548672, "gate_proj": { "group_size": { @@ -50686,7 +50686,7 @@ } }, { - "accuracy": 0.9987250744597986, + "accuracy": 0.9987249359255657, "total_bits": 512046144, "gate_proj": { "group_size": {