diff --git "a/measurement.json" "b/measurement.json" --- "a/measurement.json" +++ "b/measurement.json" @@ -2,7 +2,7 @@ "measurement": { "model.layers.0.self_attn": [ { - "accuracy": 0.9682983008679003, + "accuracy": 0.9682874407153577, "total_bits": 20322304, "q_proj": { "group_size": { @@ -66,7 +66,7 @@ } }, { - "accuracy": 0.9716265338938683, + "accuracy": 0.9716238399269059, "total_bits": 20977664, "q_proj": { "group_size": { @@ -130,7 +130,7 @@ } }, { - "accuracy": 0.9758414932293817, + "accuracy": 0.9758445249171928, "total_bits": 21419264, "q_proj": { "group_size": { @@ -194,7 +194,7 @@ } }, { - "accuracy": 0.9791492791846395, + "accuracy": 0.9791506784968078, "total_bits": 25481728, "q_proj": { "group_size": { @@ -258,7 +258,7 @@ } }, { - "accuracy": 0.9821789915440604, + "accuracy": 0.9821799445198849, "total_bits": 30051328, "q_proj": { "group_size": { @@ -322,7 +322,7 @@ } }, { - "accuracy": 0.9835021753096953, + "accuracy": 0.983504913339857, "total_bits": 30068480, "q_proj": { "group_size": { @@ -386,7 +386,7 @@ } }, { - "accuracy": 0.9831938220886514, + "accuracy": 0.9831941557931714, "total_bits": 38308864, "q_proj": { "group_size": { @@ -438,7 +438,7 @@ } }, { - "accuracy": 0.9845860572531819, + "accuracy": 0.9845845374511555, "total_bits": 38326016, "q_proj": { "group_size": { @@ -490,7 +490,7 @@ } }, { - "accuracy": 0.9875427457154728, + "accuracy": 0.9875404424383305, "total_bits": 38641152, "q_proj": { "group_size": { @@ -542,7 +542,7 @@ } }, { - "accuracy": 0.9877431174973026, + "accuracy": 0.9877446434111334, "total_bits": 39202816, "q_proj": { "group_size": { @@ -594,7 +594,7 @@ } }, { - "accuracy": 0.9908396730897948, + "accuracy": 0.9908262086682953, "total_bits": 39505664, "q_proj": { "group_size": { @@ -658,7 +658,7 @@ } }, { - "accuracy": 0.9923648509429768, + "accuracy": 0.9923634504666552, "total_bits": 39812608, "q_proj": { "group_size": { @@ -722,7 +722,7 @@ } }, { - "accuracy": 0.9911484192707576, + "accuracy": 0.9911214637686498, "total_bits": 40245248, "q_proj": { "group_size": { @@ -783,7 +783,7 @@ } }, { - "accuracy": 0.9928680540178902, + "accuracy": 0.9928679491858929, "total_bits": 40701952, "q_proj": { "group_size": { @@ -844,7 +844,7 @@ } }, { - "accuracy": 0.9947719568153843, + "accuracy": 0.99476970572141, "total_bits": 49384448, "q_proj": { "group_size": { @@ -905,7 +905,7 @@ } }, { - "accuracy": 0.9967667017335771, + "accuracy": 0.9967691240308341, "total_bits": 50139136, "q_proj": { "group_size": { @@ -966,7 +966,7 @@ } }, { - "accuracy": 0.9949336459685583, + "accuracy": 0.9949329298106022, "total_bits": 57183232, "q_proj": { "group_size": { @@ -1018,7 +1018,7 @@ } }, { - "accuracy": 0.9982713821955258, + "accuracy": 0.9982707447488792, "total_bits": 59125760, "q_proj": { "group_size": { @@ -1070,7 +1070,7 @@ } }, { - "accuracy": 0.9987349518269184, + "accuracy": 0.9987331730008009, "total_bits": 76057600, "q_proj": { "group_size": { @@ -1124,7 +1124,7 @@ ], "model.layers.0.mlp": [ { - "accuracy": 0.9384528608061373, + "accuracy": 0.938434915849939, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -1176,7 +1176,7 @@ } }, { - "accuracy": 0.9405098832212389, + "accuracy": 0.940501960227266, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -1228,7 +1228,7 @@ } }, { - "accuracy": 0.9507361555006355, + "accuracy": 0.9507351766806096, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -1277,7 +1277,7 @@ } }, { - "accuracy": 0.9542276696301997, + "accuracy": 0.9542373232543468, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -1326,7 +1326,7 @@ } }, { - "accuracy": 0.9704745137132704, + "accuracy": 0.9704789497191086, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -1378,7 +1378,7 @@ } }, { - "accuracy": 0.9727356568910182, + "accuracy": 0.9727522267494351, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -1430,7 +1430,7 @@ } }, { - "accuracy": 0.9773116145515814, + "accuracy": 0.977308277389966, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -1479,7 +1479,7 @@ } }, { - "accuracy": 0.9839919590158388, + "accuracy": 0.984003548452165, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -1522,7 +1522,7 @@ } }, { - "accuracy": 0.9855326557299122, + "accuracy": 0.9855335272150114, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -1565,7 +1565,7 @@ } }, { - "accuracy": 0.9850486510549672, + "accuracy": 0.985049948329106, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -1617,7 +1617,7 @@ } }, { - "accuracy": 0.9868802661658265, + "accuracy": 0.9868836476234719, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -1669,7 +1669,7 @@ } }, { - "accuracy": 0.992365266662091, + "accuracy": 0.9923667435068637, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -1721,7 +1721,7 @@ } }, { - "accuracy": 0.993443659186596, + "accuracy": 0.993445762025658, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -1773,7 +1773,7 @@ } }, { - "accuracy": 0.9956599612632999, + "accuracy": 0.9956614242837531, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -1816,7 +1816,7 @@ } }, { - "accuracy": 0.9961486826505279, + "accuracy": 0.9961501328798477, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -1865,7 +1865,7 @@ } }, { - "accuracy": 0.9971685604687082, + "accuracy": 0.9971702657348942, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -1911,7 +1911,7 @@ } }, { - "accuracy": 0.9987972777162213, + "accuracy": 0.9988014432165073, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -1953,7 +1953,7 @@ ], "model.layers.1.self_attn": [ { - "accuracy": 0.9108214639127254, + "accuracy": 0.9108511405065656, "total_bits": 20322304, "q_proj": { "group_size": { @@ -2017,7 +2017,7 @@ } }, { - "accuracy": 0.9232971454039216, + "accuracy": 0.923370539676398, "total_bits": 20977664, "q_proj": { "group_size": { @@ -2081,7 +2081,7 @@ } }, { - "accuracy": 0.9315698468126357, + "accuracy": 0.9315206478349864, "total_bits": 21419264, "q_proj": { "group_size": { @@ -2145,7 +2145,7 @@ } }, { - "accuracy": 0.9561206973157823, + "accuracy": 0.9561020527034998, "total_bits": 25481728, "q_proj": { "group_size": { @@ -2209,7 +2209,7 @@ } }, { - "accuracy": 0.9570822806563228, + "accuracy": 0.9570626576896757, "total_bits": 30051328, "q_proj": { "group_size": { @@ -2273,7 +2273,7 @@ } }, { - "accuracy": 0.9592409976758063, + "accuracy": 0.9592317920178175, "total_bits": 30068480, "q_proj": { "group_size": { @@ -2337,7 +2337,7 @@ } }, { - "accuracy": 0.9678784445859492, + "accuracy": 0.9679190741153434, "total_bits": 38308864, "q_proj": { "group_size": { @@ -2389,7 +2389,7 @@ } }, { - "accuracy": 0.9706547380192205, + "accuracy": 0.9706715542124584, "total_bits": 38326016, "q_proj": { "group_size": { @@ -2441,7 +2441,7 @@ } }, { - "accuracy": 0.9739332859171554, + "accuracy": 0.9739320183871314, "total_bits": 38641152, "q_proj": { "group_size": { @@ -2493,7 +2493,7 @@ } }, { - "accuracy": 0.9753870061831549, + "accuracy": 0.9753995828796178, "total_bits": 39202816, "q_proj": { "group_size": { @@ -2545,7 +2545,7 @@ } }, { - "accuracy": 0.9789500897750258, + "accuracy": 0.9789510484552011, "total_bits": 39505664, "q_proj": { "group_size": { @@ -2609,7 +2609,7 @@ } }, { - "accuracy": 0.980843193596229, + "accuracy": 0.9808439775370061, "total_bits": 39812608, "q_proj": { "group_size": { @@ -2673,7 +2673,7 @@ } }, { - "accuracy": 0.9811316981213167, + "accuracy": 0.98113038984593, "total_bits": 40245248, "q_proj": { "group_size": { @@ -2734,7 +2734,7 @@ } }, { - "accuracy": 0.9832416973658837, + "accuracy": 0.9832428406807594, "total_bits": 40701952, "q_proj": { "group_size": { @@ -2795,7 +2795,7 @@ } }, { - "accuracy": 0.9883767399587668, + "accuracy": 0.9883782229735516, "total_bits": 49384448, "q_proj": { "group_size": { @@ -2856,7 +2856,7 @@ } }, { - "accuracy": 0.9915346478228457, + "accuracy": 0.9915355073753744, "total_bits": 50139136, "q_proj": { "group_size": { @@ -2917,7 +2917,7 @@ } }, { - "accuracy": 0.9903387152589858, + "accuracy": 0.9903375284629874, "total_bits": 57183232, "q_proj": { "group_size": { @@ -2969,7 +2969,7 @@ } }, { - "accuracy": 0.9952386601362377, + "accuracy": 0.9952398307796102, "total_bits": 59125760, "q_proj": { "group_size": { @@ -3021,7 +3021,7 @@ } }, { - "accuracy": 0.9973312688525766, + "accuracy": 0.9973314737580949, "total_bits": 76057600, "q_proj": { "group_size": { @@ -3075,7 +3075,7 @@ ], "model.layers.1.mlp": [ { - "accuracy": 0.8793770750053227, + "accuracy": 0.8793256003409624, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -3127,7 +3127,7 @@ } }, { - "accuracy": 0.8823806294240057, + "accuracy": 0.8824421516619623, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -3179,7 +3179,7 @@ } }, { - "accuracy": 0.9030057615600526, + "accuracy": 0.9030293147079647, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -3228,7 +3228,7 @@ } }, { - "accuracy": 0.9090581187047064, + "accuracy": 0.9090742925181985, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -3277,7 +3277,7 @@ } }, { - "accuracy": 0.9400753302033991, + "accuracy": 0.9400730272755027, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -3329,7 +3329,7 @@ } }, { - "accuracy": 0.944974705344066, + "accuracy": 0.9449704205617309, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -3381,7 +3381,7 @@ } }, { - "accuracy": 0.953436266630888, + "accuracy": 0.9534328070003539, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -3430,7 +3430,7 @@ } }, { - "accuracy": 0.9691391321830451, + "accuracy": 0.9691335337702185, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -3473,7 +3473,7 @@ } }, { - "accuracy": 0.9719762564636767, + "accuracy": 0.9719835316063836, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -3516,7 +3516,7 @@ } }, { - "accuracy": 0.969587788102217, + "accuracy": 0.9695805793162435, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -3568,7 +3568,7 @@ } }, { - "accuracy": 0.9734254346694797, + "accuracy": 0.9734432843979448, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -3620,7 +3620,7 @@ } }, { - "accuracy": 0.9845075445482507, + "accuracy": 0.9844993405858986, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -3672,7 +3672,7 @@ } }, { - "accuracy": 0.9867773523437791, + "accuracy": 0.9867757280007936, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -3724,7 +3724,7 @@ } }, { - "accuracy": 0.9916443115798756, + "accuracy": 0.9916464776615612, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -3767,7 +3767,7 @@ } }, { - "accuracy": 0.9921156048367266, + "accuracy": 0.9921119355421979, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -3816,7 +3816,7 @@ } }, { - "accuracy": 0.9938288204139099, + "accuracy": 0.9938303573580924, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -3862,7 +3862,7 @@ } }, { - "accuracy": 0.9977631597430445, + "accuracy": 0.997766035143286, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -3904,7 +3904,7 @@ ], "model.layers.2.self_attn": [ { - "accuracy": 0.9108831738121808, + "accuracy": 0.9109318256378174, "total_bits": 20322304, "q_proj": { "group_size": { @@ -3968,7 +3968,7 @@ } }, { - "accuracy": 0.9188321116380394, + "accuracy": 0.9188620522618294, "total_bits": 20977664, "q_proj": { "group_size": { @@ -4032,7 +4032,7 @@ } }, { - "accuracy": 0.9258095030672848, + "accuracy": 0.9258248675614595, "total_bits": 21419264, "q_proj": { "group_size": { @@ -4096,7 +4096,7 @@ } }, { - "accuracy": 0.9540007621981204, + "accuracy": 0.9539957451634109, "total_bits": 25481728, "q_proj": { "group_size": { @@ -4160,7 +4160,7 @@ } }, { - "accuracy": 0.9557981574907899, + "accuracy": 0.9558035505469888, "total_bits": 30051328, "q_proj": { "group_size": { @@ -4224,7 +4224,7 @@ } }, { - "accuracy": 0.9572184963617474, + "accuracy": 0.9572357737924904, "total_bits": 30068480, "q_proj": { "group_size": { @@ -4288,7 +4288,7 @@ } }, { - "accuracy": 0.9715723822591826, + "accuracy": 0.9715711995959282, "total_bits": 38308864, "q_proj": { "group_size": { @@ -4340,7 +4340,7 @@ } }, { - "accuracy": 0.9736771958414465, + "accuracy": 0.973668051417917, "total_bits": 38326016, "q_proj": { "group_size": { @@ -4392,7 +4392,7 @@ } }, { - "accuracy": 0.9759140233509243, + "accuracy": 0.9759049126878381, "total_bits": 38641152, "q_proj": { "group_size": { @@ -4444,7 +4444,7 @@ } }, { - "accuracy": 0.9773596292361617, + "accuracy": 0.9773663431406021, "total_bits": 39202816, "q_proj": { "group_size": { @@ -4496,7 +4496,7 @@ } }, { - "accuracy": 0.9781920240493491, + "accuracy": 0.9781929469900206, "total_bits": 39505664, "q_proj": { "group_size": { @@ -4560,7 +4560,7 @@ } }, { - "accuracy": 0.9797302876831964, + "accuracy": 0.9797207546653226, "total_bits": 39812608, "q_proj": { "group_size": { @@ -4624,7 +4624,7 @@ } }, { - "accuracy": 0.9810420385329053, + "accuracy": 0.981040223967284, "total_bits": 40245248, "q_proj": { "group_size": { @@ -4685,7 +4685,7 @@ } }, { - "accuracy": 0.9825765965506434, + "accuracy": 0.9825644714292139, "total_bits": 40701952, "q_proj": { "group_size": { @@ -4746,7 +4746,7 @@ } }, { - "accuracy": 0.9890098834293894, + "accuracy": 0.9890050991089083, "total_bits": 49384448, "q_proj": { "group_size": { @@ -4807,7 +4807,7 @@ } }, { - "accuracy": 0.9910462911357172, + "accuracy": 0.991049351345282, "total_bits": 50139136, "q_proj": { "group_size": { @@ -4868,7 +4868,7 @@ } }, { - "accuracy": 0.9923304296680726, + "accuracy": 0.9923324783449061, "total_bits": 57183232, "q_proj": { "group_size": { @@ -4920,7 +4920,7 @@ } }, { - "accuracy": 0.9949429729313124, + "accuracy": 0.9949421468481887, "total_bits": 59125760, "q_proj": { "group_size": { @@ -4972,7 +4972,7 @@ } }, { - "accuracy": 0.9978999279046548, + "accuracy": 0.9979008423906635, "total_bits": 76057600, "q_proj": { "group_size": { @@ -5026,7 +5026,7 @@ ], "model.layers.2.mlp": [ { - "accuracy": 0.840625281445682, + "accuracy": 0.8508858843706548, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -5078,7 +5078,7 @@ } }, { - "accuracy": 0.8434935556724668, + "accuracy": 0.8228671383112669, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -5130,7 +5130,7 @@ } }, { - "accuracy": 0.842301519587636, + "accuracy": 0.8238817453384399, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -5179,7 +5179,7 @@ } }, { - "accuracy": 0.8428694028407335, + "accuracy": 0.8244084091857076, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -5228,7 +5228,7 @@ } }, { - "accuracy": 0.9608602949883789, + "accuracy": 0.9603659544372931, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -5280,7 +5280,7 @@ } }, { - "accuracy": 0.9743879720335826, + "accuracy": 0.9714144087629393, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -5332,7 +5332,7 @@ } }, { - "accuracy": 0.9768655257066712, + "accuracy": 0.9736919869901612, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -5381,7 +5381,7 @@ } }, { - "accuracy": 0.9835631273454055, + "accuracy": 0.9804451974923722, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -5424,7 +5424,7 @@ } }, { - "accuracy": 0.9841959786135703, + "accuracy": 0.9853532239794731, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -5467,7 +5467,7 @@ } }, { - "accuracy": 0.9873136784299277, + "accuracy": 0.9876259589218535, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -5519,7 +5519,7 @@ } }, { - "accuracy": 0.9881969522102736, + "accuracy": 0.9875553772435524, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -5571,7 +5571,7 @@ } }, { - "accuracy": 0.993532494554529, + "accuracy": 0.9937278879806399, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -5623,7 +5623,7 @@ } }, { - "accuracy": 0.9945291330222972, + "accuracy": 0.9945026718487497, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -5675,7 +5675,7 @@ } }, { - "accuracy": 0.9960147560341284, + "accuracy": 0.994713309512008, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -5718,7 +5718,7 @@ } }, { - "accuracy": 0.9961775908013806, + "accuracy": 0.9957495419075713, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -5767,7 +5767,7 @@ } }, { - "accuracy": 0.9966542667534668, + "accuracy": 0.9961803438491188, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -5813,7 +5813,7 @@ } }, { - "accuracy": 0.9975590130779892, + "accuracy": 0.9975739220244577, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -5855,7 +5855,7 @@ ], "model.layers.3.self_attn": [ { - "accuracy": 0.9736474718665704, + "accuracy": 0.9727510105585679, "total_bits": 20322304, "q_proj": { "group_size": { @@ -5919,7 +5919,7 @@ } }, { - "accuracy": 0.9758290975587443, + "accuracy": 0.9753560880199075, "total_bits": 20977664, "q_proj": { "group_size": { @@ -5983,7 +5983,7 @@ } }, { - "accuracy": 0.9801487566437572, + "accuracy": 0.9801863346947357, "total_bits": 21419264, "q_proj": { "group_size": { @@ -6047,7 +6047,7 @@ } }, { - "accuracy": 0.9847445175400935, + "accuracy": 0.9849272505380213, "total_bits": 25481728, "q_proj": { "group_size": { @@ -6111,7 +6111,7 @@ } }, { - "accuracy": 0.9864065214060247, + "accuracy": 0.9866183617850766, "total_bits": 30051328, "q_proj": { "group_size": { @@ -6175,7 +6175,7 @@ } }, { - "accuracy": 0.9875185675336979, + "accuracy": 0.9868732392205857, "total_bits": 30068480, "q_proj": { "group_size": { @@ -6239,7 +6239,7 @@ } }, { - "accuracy": 0.9914771775947884, + "accuracy": 0.9914904434699565, "total_bits": 38308864, "q_proj": { "group_size": { @@ -6291,7 +6291,7 @@ } }, { - "accuracy": 0.9916240855236538, + "accuracy": 0.9916756358579732, "total_bits": 38326016, "q_proj": { "group_size": { @@ -6343,7 +6343,7 @@ } }, { - "accuracy": 0.9925482680846471, + "accuracy": 0.9925506020954344, "total_bits": 38641152, "q_proj": { "group_size": { @@ -6395,7 +6395,7 @@ } }, { - "accuracy": 0.9926470368518494, + "accuracy": 0.9927375791594386, "total_bits": 39202816, "q_proj": { "group_size": { @@ -6447,7 +6447,7 @@ } }, { - "accuracy": 0.9926109578809701, + "accuracy": 0.9929143660410773, "total_bits": 39505664, "q_proj": { "group_size": { @@ -6511,7 +6511,7 @@ } }, { - "accuracy": 0.9933838602155447, + "accuracy": 0.9931017690978479, "total_bits": 39812608, "q_proj": { "group_size": { @@ -6575,7 +6575,7 @@ } }, { - "accuracy": 0.9947964096791111, + "accuracy": 0.9946609666803852, "total_bits": 40245248, "q_proj": { "group_size": { @@ -6636,7 +6636,7 @@ } }, { - "accuracy": 0.9952841958438512, + "accuracy": 0.9953527827456128, "total_bits": 40701952, "q_proj": { "group_size": { @@ -6697,7 +6697,7 @@ } }, { - "accuracy": 0.9970442751364317, + "accuracy": 0.9970253725332441, "total_bits": 49384448, "q_proj": { "group_size": { @@ -6758,7 +6758,7 @@ } }, { - "accuracy": 0.9975447617907776, + "accuracy": 0.9975086720369291, "total_bits": 50139136, "q_proj": { "group_size": { @@ -6819,7 +6819,7 @@ } }, { - "accuracy": 0.9975781371322228, + "accuracy": 0.9975524558394682, "total_bits": 57183232, "q_proj": { "group_size": { @@ -6871,7 +6871,7 @@ } }, { - "accuracy": 0.998904952481098, + "accuracy": 0.9989020308057661, "total_bits": 59125760, "q_proj": { "group_size": { @@ -6923,7 +6923,7 @@ } }, { - "accuracy": 0.9993530151950836, + "accuracy": 0.9993565694858262, "total_bits": 76057600, "q_proj": { "group_size": { @@ -6977,7 +6977,7 @@ ], "model.layers.3.mlp": [ { - "accuracy": 0.9503226869273931, + "accuracy": 0.9503053447697312, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -7029,7 +7029,7 @@ } }, { - "accuracy": 0.9516687479335815, + "accuracy": 0.9516650929581374, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -7081,7 +7081,7 @@ } }, { - "accuracy": 0.9591339628677815, + "accuracy": 0.9591238992288709, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -7130,7 +7130,7 @@ } }, { - "accuracy": 0.9615265524480492, + "accuracy": 0.9615170336328447, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -7179,7 +7179,7 @@ } }, { - "accuracy": 0.9748701251810417, + "accuracy": 0.9748653610004112, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -7231,7 +7231,7 @@ } }, { - "accuracy": 0.9768565815174952, + "accuracy": 0.9768592905020341, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -7283,7 +7283,7 @@ } }, { - "accuracy": 0.980164977372624, + "accuracy": 0.9801605626707897, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -7332,7 +7332,7 @@ } }, { - "accuracy": 0.9868724637199193, + "accuracy": 0.9868700111401267, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -7375,7 +7375,7 @@ } }, { - "accuracy": 0.9880873914808035, + "accuracy": 0.9880812272313051, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -7418,7 +7418,7 @@ } }, { - "accuracy": 0.9872069549164735, + "accuracy": 0.9872040670015849, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -7470,7 +7470,7 @@ } }, { - "accuracy": 0.9887989581911825, + "accuracy": 0.9887957595638, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -7522,7 +7522,7 @@ } }, { - "accuracy": 0.9934862754016649, + "accuracy": 0.9934866408002563, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -7574,7 +7574,7 @@ } }, { - "accuracy": 0.9944231532281265, + "accuracy": 0.9944198449666146, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -7626,7 +7626,7 @@ } }, { - "accuracy": 0.9964644734718604, + "accuracy": 0.9964635728247231, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -7669,7 +7669,7 @@ } }, { - "accuracy": 0.9966909741197014, + "accuracy": 0.9966915663680993, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -7718,7 +7718,7 @@ } }, { - "accuracy": 0.9973680579132633, + "accuracy": 0.9973676756344503, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -7764,7 +7764,7 @@ } }, { - "accuracy": 0.9990603479491256, + "accuracy": 0.9990612296351173, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -7806,7 +7806,7 @@ ], "model.layers.4.self_attn": [ { - "accuracy": 0.9443176258355379, + "accuracy": 0.9505113521590829, "total_bits": 20322304, "q_proj": { "group_size": { @@ -7870,7 +7870,7 @@ } }, { - "accuracy": 0.9480956732295454, + "accuracy": 0.9505069560837001, "total_bits": 20977664, "q_proj": { "group_size": { @@ -7934,7 +7934,7 @@ } }, { - "accuracy": 0.96754155959934, + "accuracy": 0.9683844344690442, "total_bits": 21419264, "q_proj": { "group_size": { @@ -7998,7 +7998,7 @@ } }, { - "accuracy": 0.9740229183807969, + "accuracy": 0.9744697749847546, "total_bits": 25481728, "q_proj": { "group_size": { @@ -8062,7 +8062,7 @@ } }, { - "accuracy": 0.9777639809763059, + "accuracy": 0.9775246130302548, "total_bits": 30051328, "q_proj": { "group_size": { @@ -8126,7 +8126,7 @@ } }, { - "accuracy": 0.9755148711847141, + "accuracy": 0.9768680022098124, "total_bits": 30068480, "q_proj": { "group_size": { @@ -8190,7 +8190,7 @@ } }, { - "accuracy": 0.9853574702283368, + "accuracy": 0.9853687543072738, "total_bits": 38308864, "q_proj": { "group_size": { @@ -8242,7 +8242,7 @@ } }, { - "accuracy": 0.9862714365590364, + "accuracy": 0.9871022676234134, "total_bits": 38326016, "q_proj": { "group_size": { @@ -8294,7 +8294,7 @@ } }, { - "accuracy": 0.9873043717816472, + "accuracy": 0.9873597125988454, "total_bits": 38641152, "q_proj": { "group_size": { @@ -8346,7 +8346,7 @@ } }, { - "accuracy": 0.9876295399153605, + "accuracy": 0.9877094957628287, "total_bits": 39202816, "q_proj": { "group_size": { @@ -8398,7 +8398,7 @@ } }, { - "accuracy": 0.9881749196210876, + "accuracy": 0.9873825625400059, "total_bits": 39505664, "q_proj": { "group_size": { @@ -8462,7 +8462,7 @@ } }, { - "accuracy": 0.988841739599593, + "accuracy": 0.9885187454638071, "total_bits": 39812608, "q_proj": { "group_size": { @@ -8526,7 +8526,7 @@ } }, { - "accuracy": 0.9912818209850229, + "accuracy": 0.9911124990903772, "total_bits": 40245248, "q_proj": { "group_size": { @@ -8587,7 +8587,7 @@ } }, { - "accuracy": 0.9923008258629125, + "accuracy": 0.9922324632061645, "total_bits": 40701952, "q_proj": { "group_size": { @@ -8648,7 +8648,7 @@ } }, { - "accuracy": 0.9951733036432415, + "accuracy": 0.9949509919097181, "total_bits": 49384448, "q_proj": { "group_size": { @@ -8709,7 +8709,7 @@ } }, { - "accuracy": 0.9960373506182805, + "accuracy": 0.9959194401744753, "total_bits": 50139136, "q_proj": { "group_size": { @@ -8770,7 +8770,7 @@ } }, { - "accuracy": 0.9959649939992232, + "accuracy": 0.9957039124274161, "total_bits": 57183232, "q_proj": { "group_size": { @@ -8822,7 +8822,7 @@ } }, { - "accuracy": 0.9981779366498813, + "accuracy": 0.9981541812885553, "total_bits": 59125760, "q_proj": { "group_size": { @@ -8874,7 +8874,7 @@ } }, { - "accuracy": 0.9990017554337101, + "accuracy": 0.9989064547044109, "total_bits": 76057600, "q_proj": { "group_size": { @@ -8928,7 +8928,7 @@ ], "model.layers.4.mlp": [ { - "accuracy": 0.9381219202186912, + "accuracy": 0.9381555742584169, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -8980,7 +8980,7 @@ } }, { - "accuracy": 0.9398156930692494, + "accuracy": 0.9398268219083548, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -9032,7 +9032,7 @@ } }, { - "accuracy": 0.9491160199977458, + "accuracy": 0.9491222584620118, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -9081,7 +9081,7 @@ } }, { - "accuracy": 0.9520283334422857, + "accuracy": 0.9520410485565662, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -9130,7 +9130,7 @@ } }, { - "accuracy": 0.9685923740034923, + "accuracy": 0.9685996748739854, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -9182,7 +9182,7 @@ } }, { - "accuracy": 0.971025726874359, + "accuracy": 0.9710266159381717, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -9234,7 +9234,7 @@ } }, { - "accuracy": 0.9751350940205157, + "accuracy": 0.9751348763238639, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -9283,7 +9283,7 @@ } }, { - "accuracy": 0.9836475097690709, + "accuracy": 0.9836455206386745, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -9326,7 +9326,7 @@ } }, { - "accuracy": 0.9851255836547352, + "accuracy": 0.9851241566939279, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -9369,7 +9369,7 @@ } }, { - "accuracy": 0.9840292109875008, + "accuracy": 0.9840302344528027, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -9421,7 +9421,7 @@ } }, { - "accuracy": 0.9859674836625345, + "accuracy": 0.9859583526849747, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -9473,7 +9473,7 @@ } }, { - "accuracy": 0.9918705298041459, + "accuracy": 0.9918730374483857, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -9525,7 +9525,7 @@ } }, { - "accuracy": 0.9930100547790062, + "accuracy": 0.9930113837181125, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -9577,7 +9577,7 @@ } }, { - "accuracy": 0.995612055703532, + "accuracy": 0.9956115610257257, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -9620,7 +9620,7 @@ } }, { - "accuracy": 0.9958760176668875, + "accuracy": 0.9958746829361189, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -9669,7 +9669,7 @@ } }, { - "accuracy": 0.9967082659131847, + "accuracy": 0.9967091263679322, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -9715,7 +9715,7 @@ } }, { - "accuracy": 0.9988447303257999, + "accuracy": 0.9988452331308508, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -9757,7 +9757,7 @@ ], "model.layers.5.self_attn": [ { - "accuracy": 0.9465296540874988, + "accuracy": 0.9439493955578655, "total_bits": 20322304, "q_proj": { "group_size": { @@ -9821,7 +9821,7 @@ } }, { - "accuracy": 0.9399791315663606, + "accuracy": 0.9491862847935408, "total_bits": 20977664, "q_proj": { "group_size": { @@ -9885,7 +9885,7 @@ } }, { - "accuracy": 0.9649434428429231, + "accuracy": 0.9640327207744122, "total_bits": 21419264, "q_proj": { "group_size": { @@ -9949,7 +9949,7 @@ } }, { - "accuracy": 0.9709275431232527, + "accuracy": 0.9699463305296376, "total_bits": 25481728, "q_proj": { "group_size": { @@ -10013,7 +10013,7 @@ } }, { - "accuracy": 0.9735816894099116, + "accuracy": 0.9731963544618338, "total_bits": 30051328, "q_proj": { "group_size": { @@ -10077,7 +10077,7 @@ } }, { - "accuracy": 0.9746526911621913, + "accuracy": 0.9738411789294332, "total_bits": 30068480, "q_proj": { "group_size": { @@ -10141,7 +10141,7 @@ } }, { - "accuracy": 0.9841359436977655, + "accuracy": 0.9840768628637306, "total_bits": 38308864, "q_proj": { "group_size": { @@ -10193,7 +10193,7 @@ } }, { - "accuracy": 0.9845134740462527, + "accuracy": 0.9864005128620192, "total_bits": 38326016, "q_proj": { "group_size": { @@ -10245,7 +10245,7 @@ } }, { - "accuracy": 0.9865997735760175, + "accuracy": 0.9858329140697606, "total_bits": 38641152, "q_proj": { "group_size": { @@ -10297,7 +10297,7 @@ } }, { - "accuracy": 0.986946506309323, + "accuracy": 0.9860310146468692, "total_bits": 39202816, "q_proj": { "group_size": { @@ -10349,7 +10349,7 @@ } }, { - "accuracy": 0.9867051407927647, + "accuracy": 0.985195861547254, "total_bits": 39505664, "q_proj": { "group_size": { @@ -10413,7 +10413,7 @@ } }, { - "accuracy": 0.986678110959474, + "accuracy": 0.9863588069565594, "total_bits": 39812608, "q_proj": { "group_size": { @@ -10477,7 +10477,7 @@ } }, { - "accuracy": 0.9903565040440299, + "accuracy": 0.9904701206251048, "total_bits": 40245248, "q_proj": { "group_size": { @@ -10538,7 +10538,7 @@ } }, { - "accuracy": 0.9912592684850097, + "accuracy": 0.9916604193858802, "total_bits": 40701952, "q_proj": { "group_size": { @@ -10599,7 +10599,7 @@ } }, { - "accuracy": 0.9945314888900612, + "accuracy": 0.9946889041457325, "total_bits": 49384448, "q_proj": { "group_size": { @@ -10660,7 +10660,7 @@ } }, { - "accuracy": 0.9954941700561903, + "accuracy": 0.9956147490011062, "total_bits": 50139136, "q_proj": { "group_size": { @@ -10721,7 +10721,7 @@ } }, { - "accuracy": 0.9953118968114723, + "accuracy": 0.9954356452799402, "total_bits": 57183232, "q_proj": { "group_size": { @@ -10773,7 +10773,7 @@ } }, { - "accuracy": 0.9981462773575913, + "accuracy": 0.9981674393202411, "total_bits": 59125760, "q_proj": { "group_size": { @@ -10825,7 +10825,7 @@ } }, { - "accuracy": 0.9988067679005326, + "accuracy": 0.9988245204876876, "total_bits": 76057600, "q_proj": { "group_size": { @@ -10879,7 +10879,7 @@ ], "model.layers.5.mlp": [ { - "accuracy": 0.9266083212569356, + "accuracy": 0.9265897828154266, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -10931,7 +10931,7 @@ } }, { - "accuracy": 0.9286065436899662, + "accuracy": 0.9286236956249923, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -10983,7 +10983,7 @@ } }, { - "accuracy": 0.9396829379256815, + "accuracy": 0.939705518539995, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -11032,7 +11032,7 @@ } }, { - "accuracy": 0.9431348899379373, + "accuracy": 0.9431477903854102, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -11081,7 +11081,7 @@ } }, { - "accuracy": 0.9627713058143854, + "accuracy": 0.9627439859323204, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -11133,7 +11133,7 @@ } }, { - "accuracy": 0.9656413906486705, + "accuracy": 0.9656392872566357, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -11185,7 +11185,7 @@ } }, { - "accuracy": 0.9705372618045658, + "accuracy": 0.9705301222857088, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -11234,7 +11234,7 @@ } }, { - "accuracy": 0.9805802576011047, + "accuracy": 0.9805821948684752, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -11277,7 +11277,7 @@ } }, { - "accuracy": 0.9823318731505424, + "accuracy": 0.982332726707682, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -11320,7 +11320,7 @@ } }, { - "accuracy": 0.981048887479119, + "accuracy": 0.9810561769409105, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -11372,7 +11372,7 @@ } }, { - "accuracy": 0.9833684508921579, + "accuracy": 0.9833735114661977, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -11424,7 +11424,7 @@ } }, { - "accuracy": 0.990378886112012, + "accuracy": 0.9903801176114939, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -11476,7 +11476,7 @@ } }, { - "accuracy": 0.9917267852870282, + "accuracy": 0.9917245247925166, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -11528,7 +11528,7 @@ } }, { - "accuracy": 0.9947774146858137, + "accuracy": 0.9947774168103933, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -11571,7 +11571,7 @@ } }, { - "accuracy": 0.9951207306003198, + "accuracy": 0.9951203083910514, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -11620,7 +11620,7 @@ } }, { - "accuracy": 0.9961024023214122, + "accuracy": 0.9961022604547907, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -11666,7 +11666,7 @@ } }, { - "accuracy": 0.998621207450924, + "accuracy": 0.9986226341570728, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -11708,7 +11708,7 @@ ], "model.layers.6.self_attn": [ { - "accuracy": 0.9418419930152595, + "accuracy": 0.9455862352624536, "total_bits": 20322304, "q_proj": { "group_size": { @@ -11772,7 +11772,7 @@ } }, { - "accuracy": 0.9484909817110747, + "accuracy": 0.947748615173623, "total_bits": 20977664, "q_proj": { "group_size": { @@ -11836,7 +11836,7 @@ } }, { - "accuracy": 0.9587179007939994, + "accuracy": 0.9581296476535499, "total_bits": 21419264, "q_proj": { "group_size": { @@ -11900,7 +11900,7 @@ } }, { - "accuracy": 0.9661045121029019, + "accuracy": 0.9654256459325552, "total_bits": 25481728, "q_proj": { "group_size": { @@ -11964,7 +11964,7 @@ } }, { - "accuracy": 0.9726183342281729, + "accuracy": 0.971989750280045, "total_bits": 30051328, "q_proj": { "group_size": { @@ -12028,7 +12028,7 @@ } }, { - "accuracy": 0.9735796074382961, + "accuracy": 0.9739401262486354, "total_bits": 30068480, "q_proj": { "group_size": { @@ -12092,7 +12092,7 @@ } }, { - "accuracy": 0.9825016316026449, + "accuracy": 0.982845788821578, "total_bits": 38308864, "q_proj": { "group_size": { @@ -12144,7 +12144,7 @@ } }, { - "accuracy": 0.9834437241661362, + "accuracy": 0.9833603407023475, "total_bits": 38326016, "q_proj": { "group_size": { @@ -12196,7 +12196,7 @@ } }, { - "accuracy": 0.9851681603468023, + "accuracy": 0.9849820840754546, "total_bits": 38641152, "q_proj": { "group_size": { @@ -12248,7 +12248,7 @@ } }, { - "accuracy": 0.9856295348145068, + "accuracy": 0.9854893322335556, "total_bits": 39202816, "q_proj": { "group_size": { @@ -12300,7 +12300,7 @@ } }, { - "accuracy": 0.9851711338851601, + "accuracy": 0.9850116848829202, "total_bits": 39505664, "q_proj": { "group_size": { @@ -12364,7 +12364,7 @@ } }, { - "accuracy": 0.986586615035776, + "accuracy": 0.9862476548296399, "total_bits": 39812608, "q_proj": { "group_size": { @@ -12428,7 +12428,7 @@ } }, { - "accuracy": 0.9888801165507175, + "accuracy": 0.9884495650185272, "total_bits": 40245248, "q_proj": { "group_size": { @@ -12489,7 +12489,7 @@ } }, { - "accuracy": 0.9898250671103597, + "accuracy": 0.9897496405756101, "total_bits": 40701952, "q_proj": { "group_size": { @@ -12550,7 +12550,7 @@ } }, { - "accuracy": 0.9939268997695763, + "accuracy": 0.9939482012414373, "total_bits": 49384448, "q_proj": { "group_size": { @@ -12611,7 +12611,7 @@ } }, { - "accuracy": 0.9948269620945211, + "accuracy": 0.9948613537999336, "total_bits": 50139136, "q_proj": { "group_size": { @@ -12672,7 +12672,7 @@ } }, { - "accuracy": 0.9951100962352939, + "accuracy": 0.9951175312453415, "total_bits": 57183232, "q_proj": { "group_size": { @@ -12724,7 +12724,7 @@ } }, { - "accuracy": 0.997504429120454, + "accuracy": 0.9974744894425385, "total_bits": 59125760, "q_proj": { "group_size": { @@ -12776,7 +12776,7 @@ } }, { - "accuracy": 0.9987283626105636, + "accuracy": 0.9986800119731924, "total_bits": 76057600, "q_proj": { "group_size": { @@ -12830,7 +12830,7 @@ ], "model.layers.6.mlp": [ { - "accuracy": 0.9170122384093702, + "accuracy": 0.9170301384292543, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -12882,7 +12882,7 @@ } }, { - "accuracy": 0.9193421402014792, + "accuracy": 0.919331019744277, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -12934,7 +12934,7 @@ } }, { - "accuracy": 0.932212425628677, + "accuracy": 0.932229972910136, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -12983,7 +12983,7 @@ } }, { - "accuracy": 0.9363095683511347, + "accuracy": 0.9363063033670187, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -13032,7 +13032,7 @@ } }, { - "accuracy": 0.9577710141893476, + "accuracy": 0.9577465485781431, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -13084,7 +13084,7 @@ } }, { - "accuracy": 0.9611061662435532, + "accuracy": 0.9610988129861653, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -13136,7 +13136,7 @@ } }, { - "accuracy": 0.9667884936789051, + "accuracy": 0.9667723688762635, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -13185,7 +13185,7 @@ } }, { - "accuracy": 0.9779134966665879, + "accuracy": 0.9779056387487799, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -13228,7 +13228,7 @@ } }, { - "accuracy": 0.9799143364652991, + "accuracy": 0.9799105699639767, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -13271,7 +13271,7 @@ } }, { - "accuracy": 0.9784999802941456, + "accuracy": 0.9784922350663692, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -13323,7 +13323,7 @@ } }, { - "accuracy": 0.9811378001468256, + "accuracy": 0.9811363412300125, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -13375,7 +13375,7 @@ } }, { - "accuracy": 0.989061931555625, + "accuracy": 0.9890591687289998, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -13427,7 +13427,7 @@ } }, { - "accuracy": 0.9906022883369587, + "accuracy": 0.9906044090166688, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -13479,7 +13479,7 @@ } }, { - "accuracy": 0.9940370166732464, + "accuracy": 0.9940391734417062, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -13522,7 +13522,7 @@ } }, { - "accuracy": 0.9944562675664201, + "accuracy": 0.9944552840606775, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -13571,7 +13571,7 @@ } }, { - "accuracy": 0.995648256590357, + "accuracy": 0.9956490360928001, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -13617,7 +13617,7 @@ } }, { - "accuracy": 0.9984210256152437, + "accuracy": 0.9984224444415304, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -13659,7 +13659,7 @@ ], "model.layers.7.self_attn": [ { - "accuracy": 0.8989655710756779, + "accuracy": 0.8983123078942299, "total_bits": 20322304, "q_proj": { "group_size": { @@ -13723,7 +13723,7 @@ } }, { - "accuracy": 0.9094870276749134, + "accuracy": 0.911407018546015, "total_bits": 20977664, "q_proj": { "group_size": { @@ -13787,7 +13787,7 @@ } }, { - "accuracy": 0.9360942805651575, + "accuracy": 0.9333993026521057, "total_bits": 21419264, "q_proj": { "group_size": { @@ -13851,7 +13851,7 @@ } }, { - "accuracy": 0.9451489034108818, + "accuracy": 0.9419278849381953, "total_bits": 25481728, "q_proj": { "group_size": { @@ -13915,7 +13915,7 @@ } }, { - "accuracy": 0.9540366844739765, + "accuracy": 0.9542598675470799, "total_bits": 30051328, "q_proj": { "group_size": { @@ -13979,7 +13979,7 @@ } }, { - "accuracy": 0.9552278250921518, + "accuracy": 0.9568204355891794, "total_bits": 30068480, "q_proj": { "group_size": { @@ -14043,7 +14043,7 @@ } }, { - "accuracy": 0.9745677303289995, + "accuracy": 0.977223283261992, "total_bits": 38308864, "q_proj": { "group_size": { @@ -14095,7 +14095,7 @@ } }, { - "accuracy": 0.9745288434205577, + "accuracy": 0.975888021173887, "total_bits": 38326016, "q_proj": { "group_size": { @@ -14147,7 +14147,7 @@ } }, { - "accuracy": 0.9777406478533521, + "accuracy": 0.9783789886860177, "total_bits": 38641152, "q_proj": { "group_size": { @@ -14199,7 +14199,7 @@ } }, { - "accuracy": 0.9785657813772559, + "accuracy": 0.9788547960342839, "total_bits": 39202816, "q_proj": { "group_size": { @@ -14251,7 +14251,7 @@ } }, { - "accuracy": 0.9763187242206186, + "accuracy": 0.9757549887290224, "total_bits": 39505664, "q_proj": { "group_size": { @@ -14315,7 +14315,7 @@ } }, { - "accuracy": 0.978967959410511, + "accuracy": 0.979342598002404, "total_bits": 39812608, "q_proj": { "group_size": { @@ -14379,7 +14379,7 @@ } }, { - "accuracy": 0.9845154113136232, + "accuracy": 0.9841148174018599, "total_bits": 40245248, "q_proj": { "group_size": { @@ -14440,7 +14440,7 @@ } }, { - "accuracy": 0.9861942294519395, + "accuracy": 0.985871184442658, "total_bits": 40701952, "q_proj": { "group_size": { @@ -14501,7 +14501,7 @@ } }, { - "accuracy": 0.9913671567337587, + "accuracy": 0.9915930248680525, "total_bits": 49384448, "q_proj": { "group_size": { @@ -14562,7 +14562,7 @@ } }, { - "accuracy": 0.9926596416917164, + "accuracy": 0.9926986661739647, "total_bits": 50139136, "q_proj": { "group_size": { @@ -14623,7 +14623,7 @@ } }, { - "accuracy": 0.9927626944554504, + "accuracy": 0.9930413794936612, "total_bits": 57183232, "q_proj": { "group_size": { @@ -14675,7 +14675,7 @@ } }, { - "accuracy": 0.9968172224762384, + "accuracy": 0.9967936781322351, "total_bits": 59125760, "q_proj": { "group_size": { @@ -14727,7 +14727,7 @@ } }, { - "accuracy": 0.9980925641139038, + "accuracy": 0.9981576569844037, "total_bits": 76057600, "q_proj": { "group_size": { @@ -14781,7 +14781,7 @@ ], "model.layers.7.mlp": [ { - "accuracy": 0.8740640999749303, + "accuracy": 0.8761396110057831, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -14833,7 +14833,7 @@ } }, { - "accuracy": 0.8790809842757881, + "accuracy": 0.8773001343943179, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -14885,7 +14885,7 @@ } }, { - "accuracy": 0.8829639297910035, + "accuracy": 0.8859596261754632, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -14934,7 +14934,7 @@ } }, { - "accuracy": 0.8844086863100529, + "accuracy": 0.8874513003975153, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -14983,7 +14983,7 @@ } }, { - "accuracy": 0.9626284560654312, + "accuracy": 0.9649159100372344, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -15035,7 +15035,7 @@ } }, { - "accuracy": 0.9632150703109801, + "accuracy": 0.9641846157610416, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -15087,7 +15087,7 @@ } }, { - "accuracy": 0.9669195328606293, + "accuracy": 0.9680030718445778, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -15136,7 +15136,7 @@ } }, { - "accuracy": 0.9814709811471403, + "accuracy": 0.9814539876533672, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -15179,7 +15179,7 @@ } }, { - "accuracy": 0.9827554197399877, + "accuracy": 0.9827524308348075, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -15222,7 +15222,7 @@ } }, { - "accuracy": 0.9820675658993423, + "accuracy": 0.9823680627159774, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -15274,7 +15274,7 @@ } }, { - "accuracy": 0.9844704826246016, + "accuracy": 0.9839322321349755, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -15326,7 +15326,7 @@ } }, { - "accuracy": 0.9909601904219016, + "accuracy": 0.9909889902919531, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -15378,7 +15378,7 @@ } }, { - "accuracy": 0.9922629986249376, + "accuracy": 0.9922378689807374, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -15430,7 +15430,7 @@ } }, { - "accuracy": 0.9948913365660701, + "accuracy": 0.9948546060186345, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -15473,7 +15473,7 @@ } }, { - "accuracy": 0.9952513682947028, + "accuracy": 0.9953135109972209, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -15522,7 +15522,7 @@ } }, { - "accuracy": 0.9961311991792172, + "accuracy": 0.9962075788062066, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -15568,7 +15568,7 @@ } }, { - "accuracy": 0.9983171257918002, + "accuracy": 0.9983270965531119, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -15610,7 +15610,7 @@ ], "model.layers.8.self_attn": [ { - "accuracy": 0.9559460389427841, + "accuracy": 0.9549286474939436, "total_bits": 20322304, "q_proj": { "group_size": { @@ -15674,7 +15674,7 @@ } }, { - "accuracy": 0.9575134336482733, + "accuracy": 0.9581307489424944, "total_bits": 20977664, "q_proj": { "group_size": { @@ -15738,7 +15738,7 @@ } }, { - "accuracy": 0.961513358168304, + "accuracy": 0.9611671413294971, "total_bits": 21419264, "q_proj": { "group_size": { @@ -15802,7 +15802,7 @@ } }, { - "accuracy": 0.9684337473008782, + "accuracy": 0.9680541863199323, "total_bits": 25481728, "q_proj": { "group_size": { @@ -15866,7 +15866,7 @@ } }, { - "accuracy": 0.9756559787783772, + "accuracy": 0.9750149477040395, "total_bits": 30051328, "q_proj": { "group_size": { @@ -15930,7 +15930,7 @@ } }, { - "accuracy": 0.9769143615849316, + "accuracy": 0.9769023475237191, "total_bits": 30068480, "q_proj": { "group_size": { @@ -15994,7 +15994,7 @@ } }, { - "accuracy": 0.9822000450221822, + "accuracy": 0.9822686673142016, "total_bits": 38308864, "q_proj": { "group_size": { @@ -16046,7 +16046,7 @@ } }, { - "accuracy": 0.9835819063591771, + "accuracy": 0.9834700028295629, "total_bits": 38326016, "q_proj": { "group_size": { @@ -16098,7 +16098,7 @@ } }, { - "accuracy": 0.984664169489406, + "accuracy": 0.9847945614601485, "total_bits": 38641152, "q_proj": { "group_size": { @@ -16150,7 +16150,7 @@ } }, { - "accuracy": 0.9853839995339513, + "accuracy": 0.985567458672449, "total_bits": 39202816, "q_proj": { "group_size": { @@ -16202,7 +16202,7 @@ } }, { - "accuracy": 0.9862543563940562, + "accuracy": 0.9863774447585456, "total_bits": 39505664, "q_proj": { "group_size": { @@ -16266,7 +16266,7 @@ } }, { - "accuracy": 0.9877599139581434, + "accuracy": 0.9878150528529659, "total_bits": 39812608, "q_proj": { "group_size": { @@ -16330,7 +16330,7 @@ } }, { - "accuracy": 0.9896408215281554, + "accuracy": 0.9897127409349196, "total_bits": 40245248, "q_proj": { "group_size": { @@ -16391,7 +16391,7 @@ } }, { - "accuracy": 0.9907788153504953, + "accuracy": 0.990748614363838, "total_bits": 40701952, "q_proj": { "group_size": { @@ -16452,7 +16452,7 @@ } }, { - "accuracy": 0.9941072368528694, + "accuracy": 0.9941602927283384, "total_bits": 49384448, "q_proj": { "group_size": { @@ -16513,7 +16513,7 @@ } }, { - "accuracy": 0.9952677572437096, + "accuracy": 0.995237237541005, "total_bits": 50139136, "q_proj": { "group_size": { @@ -16574,7 +16574,7 @@ } }, { - "accuracy": 0.9952235055970959, + "accuracy": 0.9952759052976035, "total_bits": 57183232, "q_proj": { "group_size": { @@ -16626,7 +16626,7 @@ } }, { - "accuracy": 0.9970219443348469, + "accuracy": 0.9970202781551052, "total_bits": 59125760, "q_proj": { "group_size": { @@ -16678,7 +16678,7 @@ } }, { - "accuracy": 0.9987544280957081, + "accuracy": 0.9987503957090667, "total_bits": 76057600, "q_proj": { "group_size": { @@ -16732,7 +16732,7 @@ ], "model.layers.8.mlp": [ { - "accuracy": 0.9254459459334612, + "accuracy": 0.9254228402860463, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -16784,7 +16784,7 @@ } }, { - "accuracy": 0.927535941824317, + "accuracy": 0.9275152259506285, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -16836,7 +16836,7 @@ } }, { - "accuracy": 0.9381578795146197, + "accuracy": 0.9381464358884841, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -16885,7 +16885,7 @@ } }, { - "accuracy": 0.9415699113160372, + "accuracy": 0.9415542425122112, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -16934,7 +16934,7 @@ } }, { - "accuracy": 0.962083505699411, + "accuracy": 0.96208989713341, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -16986,7 +16986,7 @@ } }, { - "accuracy": 0.9650707013206556, + "accuracy": 0.9650762210367247, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -17038,7 +17038,7 @@ } }, { - "accuracy": 0.9698029174469411, + "accuracy": 0.9698117008665577, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -17087,7 +17087,7 @@ } }, { - "accuracy": 0.9802284634206444, + "accuracy": 0.980227192514576, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -17130,7 +17130,7 @@ } }, { - "accuracy": 0.9819698373321444, + "accuracy": 0.9819611018756405, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -17173,7 +17173,7 @@ } }, { - "accuracy": 0.9807284856215119, + "accuracy": 0.9807263038819656, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -17225,7 +17225,7 @@ } }, { - "accuracy": 0.9830856570624746, + "accuracy": 0.9830842994851992, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -17277,7 +17277,7 @@ } }, { - "accuracy": 0.9902120197657496, + "accuracy": 0.9902103608474135, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -17329,7 +17329,7 @@ } }, { - "accuracy": 0.9915785910561681, + "accuracy": 0.9915799244190566, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -17381,7 +17381,7 @@ } }, { - "accuracy": 0.9946554411144461, + "accuracy": 0.9946536683710292, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -17424,7 +17424,7 @@ } }, { - "accuracy": 0.9950274055881891, + "accuracy": 0.9950293049623724, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -17473,7 +17473,7 @@ } }, { - "accuracy": 0.9959887096483726, + "accuracy": 0.9959906810399843, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -17519,7 +17519,7 @@ } }, { - "accuracy": 0.9985474362547393, + "accuracy": 0.9985481850599172, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -17561,7 +17561,7 @@ ], "model.layers.9.self_attn": [ { - "accuracy": 0.9416354231070727, + "accuracy": 0.9429567465558648, "total_bits": 20322304, "q_proj": { "group_size": { @@ -17625,7 +17625,7 @@ } }, { - "accuracy": 0.944032930303365, + "accuracy": 0.9451392055489123, "total_bits": 20977664, "q_proj": { "group_size": { @@ -17689,7 +17689,7 @@ } }, { - "accuracy": 0.9539643882308155, + "accuracy": 0.9536743790376931, "total_bits": 21419264, "q_proj": { "group_size": { @@ -17753,7 +17753,7 @@ } }, { - "accuracy": 0.9652976144570857, + "accuracy": 0.9649963709525764, "total_bits": 25481728, "q_proj": { "group_size": { @@ -17817,7 +17817,7 @@ } }, { - "accuracy": 0.9721351037733257, + "accuracy": 0.9717296939343214, "total_bits": 30051328, "q_proj": { "group_size": { @@ -17881,7 +17881,7 @@ } }, { - "accuracy": 0.9718929268419743, + "accuracy": 0.9723781605716795, "total_bits": 30068480, "q_proj": { "group_size": { @@ -17945,7 +17945,7 @@ } }, { - "accuracy": 0.9830018813954666, + "accuracy": 0.983433022222016, "total_bits": 38308864, "q_proj": { "group_size": { @@ -17997,7 +17997,7 @@ } }, { - "accuracy": 0.9841009282972664, + "accuracy": 0.9840334347682074, "total_bits": 38326016, "q_proj": { "group_size": { @@ -18049,7 +18049,7 @@ } }, { - "accuracy": 0.9853055531857535, + "accuracy": 0.9854540803353302, "total_bits": 38641152, "q_proj": { "group_size": { @@ -18101,7 +18101,7 @@ } }, { - "accuracy": 0.9860099809593521, + "accuracy": 0.9861169052892365, "total_bits": 39202816, "q_proj": { "group_size": { @@ -18153,7 +18153,7 @@ } }, { - "accuracy": 0.985617536935024, + "accuracy": 0.9851709572831169, "total_bits": 39505664, "q_proj": { "group_size": { @@ -18217,7 +18217,7 @@ } }, { - "accuracy": 0.9865410620695911, + "accuracy": 0.9863768034265377, "total_bits": 39812608, "q_proj": { "group_size": { @@ -18281,7 +18281,7 @@ } }, { - "accuracy": 0.9883724692626856, + "accuracy": 0.9883650410920382, "total_bits": 40245248, "q_proj": { "group_size": { @@ -18342,7 +18342,7 @@ } }, { - "accuracy": 0.989411324437242, + "accuracy": 0.9894577771192417, "total_bits": 40701952, "q_proj": { "group_size": { @@ -18403,7 +18403,7 @@ } }, { - "accuracy": 0.9935562049795408, + "accuracy": 0.993505035788985, "total_bits": 49384448, "q_proj": { "group_size": { @@ -18464,7 +18464,7 @@ } }, { - "accuracy": 0.9946293067769147, + "accuracy": 0.9946799160679802, "total_bits": 50139136, "q_proj": { "group_size": { @@ -18525,7 +18525,7 @@ } }, { - "accuracy": 0.9954830832139123, + "accuracy": 0.9954471277887933, "total_bits": 57183232, "q_proj": { "group_size": { @@ -18577,7 +18577,7 @@ } }, { - "accuracy": 0.9972713361639762, + "accuracy": 0.9972719212528318, "total_bits": 59125760, "q_proj": { "group_size": { @@ -18629,7 +18629,7 @@ } }, { - "accuracy": 0.9987714422095451, + "accuracy": 0.9987652926429291, "total_bits": 76057600, "q_proj": { "group_size": { @@ -18683,7 +18683,7 @@ ], "model.layers.9.mlp": [ { - "accuracy": 0.9147394583560526, + "accuracy": 0.9147509448230267, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -18735,7 +18735,7 @@ } }, { - "accuracy": 0.9171580839902163, + "accuracy": 0.9171082079410553, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -18787,7 +18787,7 @@ } }, { - "accuracy": 0.9306429305579513, + "accuracy": 0.9306198828853667, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -18836,7 +18836,7 @@ } }, { - "accuracy": 0.9349638258572668, + "accuracy": 0.9349386191461235, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -18885,7 +18885,7 @@ } }, { - "accuracy": 0.9565607679542154, + "accuracy": 0.9565686315763742, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -18937,7 +18937,7 @@ } }, { - "accuracy": 0.9600150126498193, + "accuracy": 0.9600318800657988, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -18989,7 +18989,7 @@ } }, { - "accuracy": 0.9659549227217212, + "accuracy": 0.9659541936125606, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -19038,7 +19038,7 @@ } }, { - "accuracy": 0.9772516805678606, + "accuracy": 0.977248563314788, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -19081,7 +19081,7 @@ } }, { - "accuracy": 0.9793121941620484, + "accuracy": 0.9793144373688847, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -19124,7 +19124,7 @@ } }, { - "accuracy": 0.9778701895847917, + "accuracy": 0.9778778683394194, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -19176,7 +19176,7 @@ } }, { - "accuracy": 0.9806117045227438, + "accuracy": 0.9806100962450728, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -19228,7 +19228,7 @@ } }, { - "accuracy": 0.988735472841654, + "accuracy": 0.9887387556955218, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -19280,7 +19280,7 @@ } }, { - "accuracy": 0.9903422188945115, + "accuracy": 0.990345562750008, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -19332,7 +19332,7 @@ } }, { - "accuracy": 0.9938431880436838, + "accuracy": 0.993844908720348, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -19375,7 +19375,7 @@ } }, { - "accuracy": 0.9942859809088986, + "accuracy": 0.9942835884576198, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -19424,7 +19424,7 @@ } }, { - "accuracy": 0.9955427188251633, + "accuracy": 0.9955410496331751, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -19470,7 +19470,7 @@ } }, { - "accuracy": 0.9983650423309882, + "accuracy": 0.9983668145650881, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -19512,7 +19512,7 @@ ], "model.layers.10.self_attn": [ { - "accuracy": 0.9319141302257776, + "accuracy": 0.931745336856693, "total_bits": 20322304, "q_proj": { "group_size": { @@ -19576,7 +19576,7 @@ } }, { - "accuracy": 0.9316584276966751, + "accuracy": 0.933227461297065, "total_bits": 20977664, "q_proj": { "group_size": { @@ -19640,7 +19640,7 @@ } }, { - "accuracy": 0.9483856568112969, + "accuracy": 0.9463236778974533, "total_bits": 21419264, "q_proj": { "group_size": { @@ -19704,7 +19704,7 @@ } }, { - "accuracy": 0.9590357269626111, + "accuracy": 0.9562887218780816, "total_bits": 25481728, "q_proj": { "group_size": { @@ -19768,7 +19768,7 @@ } }, { - "accuracy": 0.9661238526459783, + "accuracy": 0.9640138891991228, "total_bits": 30051328, "q_proj": { "group_size": { @@ -19832,7 +19832,7 @@ } }, { - "accuracy": 0.9655432482250035, + "accuracy": 0.9654078390449286, "total_bits": 30068480, "q_proj": { "group_size": { @@ -19896,7 +19896,7 @@ } }, { - "accuracy": 0.9802206450840458, + "accuracy": 0.9800025676377118, "total_bits": 38308864, "q_proj": { "group_size": { @@ -19948,7 +19948,7 @@ } }, { - "accuracy": 0.981150999199599, + "accuracy": 0.9809808938298374, "total_bits": 38326016, "q_proj": { "group_size": { @@ -20000,7 +20000,7 @@ } }, { - "accuracy": 0.9814195855287835, + "accuracy": 0.982984897098504, "total_bits": 38641152, "q_proj": { "group_size": { @@ -20052,7 +20052,7 @@ } }, { - "accuracy": 0.9820654173381627, + "accuracy": 0.9836763916537166, "total_bits": 39202816, "q_proj": { "group_size": { @@ -20104,7 +20104,7 @@ } }, { - "accuracy": 0.9823487165849656, + "accuracy": 0.9824289524694905, "total_bits": 39505664, "q_proj": { "group_size": { @@ -20168,7 +20168,7 @@ } }, { - "accuracy": 0.9837641709018499, + "accuracy": 0.9842716010753065, "total_bits": 39812608, "q_proj": { "group_size": { @@ -20232,7 +20232,7 @@ } }, { - "accuracy": 0.9869146489072591, + "accuracy": 0.9866743630263954, "total_bits": 40245248, "q_proj": { "group_size": { @@ -20293,7 +20293,7 @@ } }, { - "accuracy": 0.9881504021468572, + "accuracy": 0.9881649905000813, "total_bits": 40701952, "q_proj": { "group_size": { @@ -20354,7 +20354,7 @@ } }, { - "accuracy": 0.9926356603682507, + "accuracy": 0.9925626869080588, "total_bits": 49384448, "q_proj": { "group_size": { @@ -20415,7 +20415,7 @@ } }, { - "accuracy": 0.9939555705932435, + "accuracy": 0.9938833882042672, "total_bits": 50139136, "q_proj": { "group_size": { @@ -20476,7 +20476,7 @@ } }, { - "accuracy": 0.994497589970706, + "accuracy": 0.9943855874880683, "total_bits": 57183232, "q_proj": { "group_size": { @@ -20528,7 +20528,7 @@ } }, { - "accuracy": 0.997064282768406, + "accuracy": 0.9970375800767215, "total_bits": 59125760, "q_proj": { "group_size": { @@ -20580,7 +20580,7 @@ } }, { - "accuracy": 0.9985515986700193, + "accuracy": 0.9985826273623388, "total_bits": 76057600, "q_proj": { "group_size": { @@ -20634,7 +20634,7 @@ ], "model.layers.10.mlp": [ { - "accuracy": 0.9102047909982502, + "accuracy": 0.910159241873771, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -20686,7 +20686,7 @@ } }, { - "accuracy": 0.9125166330486536, + "accuracy": 0.9125154716894031, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -20738,7 +20738,7 @@ } }, { - "accuracy": 0.9266794295981526, + "accuracy": 0.9267166322097182, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -20787,7 +20787,7 @@ } }, { - "accuracy": 0.931165544083342, + "accuracy": 0.9312075695488602, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -20836,7 +20836,7 @@ } }, { - "accuracy": 0.9541585731785744, + "accuracy": 0.9541657795198262, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -20888,7 +20888,7 @@ } }, { - "accuracy": 0.9577395590022206, + "accuracy": 0.957734810654074, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -20940,7 +20940,7 @@ } }, { - "accuracy": 0.9640628923662007, + "accuracy": 0.9640339047182351, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -20989,7 +20989,7 @@ } }, { - "accuracy": 0.9760932810604572, + "accuracy": 0.9760846185963601, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -21032,7 +21032,7 @@ } }, { - "accuracy": 0.9781909013399854, + "accuracy": 0.9781890087760985, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -21075,7 +21075,7 @@ } }, { - "accuracy": 0.9766133881639689, + "accuracy": 0.9766038857633248, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -21127,7 +21127,7 @@ } }, { - "accuracy": 0.9794723733793944, + "accuracy": 0.9794707818655297, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -21179,7 +21179,7 @@ } }, { - "accuracy": 0.9880858223186806, + "accuracy": 0.9880824790452607, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -21231,7 +21231,7 @@ } }, { - "accuracy": 0.9897657120018266, + "accuracy": 0.9897655069944449, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -21283,7 +21283,7 @@ } }, { - "accuracy": 0.993519727664534, + "accuracy": 0.9935211639676709, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -21326,7 +21326,7 @@ } }, { - "accuracy": 0.9939489615499042, + "accuracy": 0.9939489236276131, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -21375,7 +21375,7 @@ } }, { - "accuracy": 0.995243871002458, + "accuracy": 0.9952436523744836, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -21421,7 +21421,7 @@ } }, { - "accuracy": 0.9982818365315325, + "accuracy": 0.9982830558001297, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -21463,7 +21463,7 @@ ], "model.layers.11.self_attn": [ { - "accuracy": 0.9186715800315142, + "accuracy": 0.9193944581784308, "total_bits": 20322304, "q_proj": { "group_size": { @@ -21527,7 +21527,7 @@ } }, { - "accuracy": 0.9192318296991289, + "accuracy": 0.9219264411367476, "total_bits": 20977664, "q_proj": { "group_size": { @@ -21591,7 +21591,7 @@ } }, { - "accuracy": 0.9289245828986168, + "accuracy": 0.9327977206557989, "total_bits": 21419264, "q_proj": { "group_size": { @@ -21655,7 +21655,7 @@ } }, { - "accuracy": 0.94012306840159, + "accuracy": 0.9443284790031612, "total_bits": 25481728, "q_proj": { "group_size": { @@ -21719,7 +21719,7 @@ } }, { - "accuracy": 0.9588701003231108, + "accuracy": 0.958685678197071, "total_bits": 30051328, "q_proj": { "group_size": { @@ -21783,7 +21783,7 @@ } }, { - "accuracy": 0.9602867658250034, + "accuracy": 0.9583908643107861, "total_bits": 30068480, "q_proj": { "group_size": { @@ -21847,7 +21847,7 @@ } }, { - "accuracy": 0.9755191314034164, + "accuracy": 0.9762808877276257, "total_bits": 38308864, "q_proj": { "group_size": { @@ -21899,7 +21899,7 @@ } }, { - "accuracy": 0.9770979050081223, + "accuracy": 0.9768604940036312, "total_bits": 38326016, "q_proj": { "group_size": { @@ -21951,7 +21951,7 @@ } }, { - "accuracy": 0.9780628500739112, + "accuracy": 0.978629301651381, "total_bits": 38641152, "q_proj": { "group_size": { @@ -22003,7 +22003,7 @@ } }, { - "accuracy": 0.9791231205454096, + "accuracy": 0.9797957839909941, "total_bits": 39202816, "q_proj": { "group_size": { @@ -22055,7 +22055,7 @@ } }, { - "accuracy": 0.9787797750905156, + "accuracy": 0.9788612776901573, "total_bits": 39505664, "q_proj": { "group_size": { @@ -22119,7 +22119,7 @@ } }, { - "accuracy": 0.9808323411270976, + "accuracy": 0.9801522343186662, "total_bits": 39812608, "q_proj": { "group_size": { @@ -22183,7 +22183,7 @@ } }, { - "accuracy": 0.9835020124446601, + "accuracy": 0.9833284491905943, "total_bits": 40245248, "q_proj": { "group_size": { @@ -22244,7 +22244,7 @@ } }, { - "accuracy": 0.9848361291224137, + "accuracy": 0.9848593174247071, "total_bits": 40701952, "q_proj": { "group_size": { @@ -22305,7 +22305,7 @@ } }, { - "accuracy": 0.9909266772447154, + "accuracy": 0.990964210126549, "total_bits": 49384448, "q_proj": { "group_size": { @@ -22366,7 +22366,7 @@ } }, { - "accuracy": 0.992412802472245, + "accuracy": 0.9923749796871562, "total_bits": 50139136, "q_proj": { "group_size": { @@ -22427,7 +22427,7 @@ } }, { - "accuracy": 0.9936101068742573, + "accuracy": 0.9936505157675128, "total_bits": 57183232, "q_proj": { "group_size": { @@ -22479,7 +22479,7 @@ } }, { - "accuracy": 0.9961369811207987, + "accuracy": 0.9961516175972065, "total_bits": 59125760, "q_proj": { "group_size": { @@ -22531,7 +22531,7 @@ } }, { - "accuracy": 0.9983186637691688, + "accuracy": 0.9983322603147826, "total_bits": 76057600, "q_proj": { "group_size": { @@ -22585,7 +22585,7 @@ ], "model.layers.11.mlp": [ { - "accuracy": 0.9017781871370971, + "accuracy": 0.9017719221301377, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -22637,7 +22637,7 @@ } }, { - "accuracy": 0.9044851968064904, + "accuracy": 0.904380158521235, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -22689,7 +22689,7 @@ } }, { - "accuracy": 0.9200173448771238, + "accuracy": 0.9199405279941857, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -22738,7 +22738,7 @@ } }, { - "accuracy": 0.9249296132475138, + "accuracy": 0.9248409811407328, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -22787,7 +22787,7 @@ } }, { - "accuracy": 0.9497230714187026, + "accuracy": 0.9496908800210804, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -22839,7 +22839,7 @@ } }, { - "accuracy": 0.9537180438637733, + "accuracy": 0.9536907351575792, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -22891,7 +22891,7 @@ } }, { - "accuracy": 0.9606448367703706, + "accuracy": 0.9606239208951592, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -22940,7 +22940,7 @@ } }, { - "accuracy": 0.9737902890192345, + "accuracy": 0.9737881306791678, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -22983,7 +22983,7 @@ } }, { - "accuracy": 0.9761123352218419, + "accuracy": 0.9761083286721259, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -23026,7 +23026,7 @@ } }, { - "accuracy": 0.974334612255916, + "accuracy": 0.9743334165541455, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -23078,7 +23078,7 @@ } }, { - "accuracy": 0.977497496176511, + "accuracy": 0.977502096327953, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -23130,7 +23130,7 @@ } }, { - "accuracy": 0.9869243035209365, + "accuracy": 0.9869189038290642, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -23182,7 +23182,7 @@ } }, { - "accuracy": 0.9887873591505922, + "accuracy": 0.9887856573332101, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -23234,7 +23234,7 @@ } }, { - "accuracy": 0.9929000677075237, + "accuracy": 0.9928994898218662, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -23277,7 +23277,7 @@ } }, { - "accuracy": 0.9933506377565209, + "accuracy": 0.9933465466601774, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -23326,7 +23326,7 @@ } }, { - "accuracy": 0.9947574314428493, + "accuracy": 0.9947537815605756, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -23372,7 +23372,7 @@ } }, { - "accuracy": 0.9981139888404869, + "accuracy": 0.9981159281887813, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -23414,7 +23414,7 @@ ], "model.layers.12.self_attn": [ { - "accuracy": 0.9173749051988125, + "accuracy": 0.9136519706808031, "total_bits": 20322304, "q_proj": { "group_size": { @@ -23478,7 +23478,7 @@ } }, { - "accuracy": 0.9176692711189389, + "accuracy": 0.9187484430149198, "total_bits": 20977664, "q_proj": { "group_size": { @@ -23542,7 +23542,7 @@ } }, { - "accuracy": 0.9324247860349715, + "accuracy": 0.9335789647884667, "total_bits": 21419264, "q_proj": { "group_size": { @@ -23606,7 +23606,7 @@ } }, { - "accuracy": 0.9480586282443255, + "accuracy": 0.9491945174522698, "total_bits": 25481728, "q_proj": { "group_size": { @@ -23670,7 +23670,7 @@ } }, { - "accuracy": 0.9573442214168608, + "accuracy": 0.958149291574955, "total_bits": 30051328, "q_proj": { "group_size": { @@ -23734,7 +23734,7 @@ } }, { - "accuracy": 0.9590044033247977, + "accuracy": 0.9581987289711833, "total_bits": 30068480, "q_proj": { "group_size": { @@ -23798,7 +23798,7 @@ } }, { - "accuracy": 0.976537905051373, + "accuracy": 0.975914970273152, "total_bits": 38308864, "q_proj": { "group_size": { @@ -23850,7 +23850,7 @@ } }, { - "accuracy": 0.9773259893991053, + "accuracy": 0.9768855628790334, "total_bits": 38326016, "q_proj": { "group_size": { @@ -23902,7 +23902,7 @@ } }, { - "accuracy": 0.9793273204704747, + "accuracy": 0.9790347187081352, "total_bits": 38641152, "q_proj": { "group_size": { @@ -23954,7 +23954,7 @@ } }, { - "accuracy": 0.9804044821066782, + "accuracy": 0.9801103107165545, "total_bits": 39202816, "q_proj": { "group_size": { @@ -24006,7 +24006,7 @@ } }, { - "accuracy": 0.9790864794049412, + "accuracy": 0.9785985123598948, "total_bits": 39505664, "q_proj": { "group_size": { @@ -24070,7 +24070,7 @@ } }, { - "accuracy": 0.9801926102954894, + "accuracy": 0.9801784406881779, "total_bits": 39812608, "q_proj": { "group_size": { @@ -24134,7 +24134,7 @@ } }, { - "accuracy": 0.9832785943290219, + "accuracy": 0.9833301451290026, "total_bits": 40245248, "q_proj": { "group_size": { @@ -24195,7 +24195,7 @@ } }, { - "accuracy": 0.984603087999858, + "accuracy": 0.9846703224466182, "total_bits": 40701952, "q_proj": { "group_size": { @@ -24256,7 +24256,7 @@ } }, { - "accuracy": 0.9908451493247412, + "accuracy": 0.9907486748415977, "total_bits": 49384448, "q_proj": { "group_size": { @@ -24317,7 +24317,7 @@ } }, { - "accuracy": 0.9923665930400603, + "accuracy": 0.9922966239100788, "total_bits": 50139136, "q_proj": { "group_size": { @@ -24378,7 +24378,7 @@ } }, { - "accuracy": 0.9936538017936982, + "accuracy": 0.9936183106037788, "total_bits": 57183232, "q_proj": { "group_size": { @@ -24430,7 +24430,7 @@ } }, { - "accuracy": 0.9961093768797582, + "accuracy": 0.9960765455616638, "total_bits": 59125760, "q_proj": { "group_size": { @@ -24482,7 +24482,7 @@ } }, { - "accuracy": 0.9984034998924471, + "accuracy": 0.9983274860715028, "total_bits": 76057600, "q_proj": { "group_size": { @@ -24536,7 +24536,7 @@ ], "model.layers.12.mlp": [ { - "accuracy": 0.8923830925486982, + "accuracy": 0.8923376193270087, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -24588,7 +24588,7 @@ } }, { - "accuracy": 0.8955784854479134, + "accuracy": 0.8955522533506155, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -24640,7 +24640,7 @@ } }, { - "accuracy": 0.912928182631731, + "accuracy": 0.9128954568877816, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -24689,7 +24689,7 @@ } }, { - "accuracy": 0.9184820861555636, + "accuracy": 0.9184320941567421, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -24738,7 +24738,7 @@ } }, { - "accuracy": 0.94506647111848, + "accuracy": 0.9450353875290602, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -24790,7 +24790,7 @@ } }, { - "accuracy": 0.9494709430728108, + "accuracy": 0.9494706585537642, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -24842,7 +24842,7 @@ } }, { - "accuracy": 0.9571043117903173, + "accuracy": 0.9571018212009221, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -24891,7 +24891,7 @@ } }, { - "accuracy": 0.9710967171704397, + "accuracy": 0.9711021463153884, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -24934,7 +24934,7 @@ } }, { - "accuracy": 0.9736787973670289, + "accuracy": 0.9736879046540707, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -24977,7 +24977,7 @@ } }, { - "accuracy": 0.9719507985282689, + "accuracy": 0.9719566550338641, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -25029,7 +25029,7 @@ } }, { - "accuracy": 0.9754327209666371, + "accuracy": 0.9754247883101925, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -25081,7 +25081,7 @@ } }, { - "accuracy": 0.9857004482764751, + "accuracy": 0.9857010332052596, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -25133,7 +25133,7 @@ } }, { - "accuracy": 0.9877342993859202, + "accuracy": 0.9877379562822171, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -25185,7 +25185,7 @@ } }, { - "accuracy": 0.9921337319246959, + "accuracy": 0.9921366873313673, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -25228,7 +25228,7 @@ } }, { - "accuracy": 0.9927305307064671, + "accuracy": 0.9927341164730024, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -25277,7 +25277,7 @@ } }, { - "accuracy": 0.9943514695332851, + "accuracy": 0.9943532862816937, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -25323,7 +25323,7 @@ } }, { - "accuracy": 0.9978919023124035, + "accuracy": 0.9978937211999437, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -25365,7 +25365,7 @@ ], "model.layers.13.self_attn": [ { - "accuracy": 0.9176904456689954, + "accuracy": 0.9179154583252966, "total_bits": 20322304, "q_proj": { "group_size": { @@ -25429,7 +25429,7 @@ } }, { - "accuracy": 0.9200131385587156, + "accuracy": 0.9185350835323334, "total_bits": 20977664, "q_proj": { "group_size": { @@ -25493,7 +25493,7 @@ } }, { - "accuracy": 0.9300591102801263, + "accuracy": 0.9300135960802436, "total_bits": 21419264, "q_proj": { "group_size": { @@ -25557,7 +25557,7 @@ } }, { - "accuracy": 0.9446402131579816, + "accuracy": 0.9443755131214857, "total_bits": 25481728, "q_proj": { "group_size": { @@ -25621,7 +25621,7 @@ } }, { - "accuracy": 0.9562090737745166, + "accuracy": 0.9563196916133165, "total_bits": 30051328, "q_proj": { "group_size": { @@ -25685,7 +25685,7 @@ } }, { - "accuracy": 0.9567139367572963, + "accuracy": 0.9574573277495801, "total_bits": 30068480, "q_proj": { "group_size": { @@ -25749,7 +25749,7 @@ } }, { - "accuracy": 0.9752687093568966, + "accuracy": 0.9752349962946028, "total_bits": 38308864, "q_proj": { "group_size": { @@ -25801,7 +25801,7 @@ } }, { - "accuracy": 0.9758301599649712, + "accuracy": 0.9761181246722117, "total_bits": 38326016, "q_proj": { "group_size": { @@ -25853,7 +25853,7 @@ } }, { - "accuracy": 0.9781466921558604, + "accuracy": 0.9782854713266715, "total_bits": 38641152, "q_proj": { "group_size": { @@ -25905,7 +25905,7 @@ } }, { - "accuracy": 0.979085453087464, + "accuracy": 0.9793351907283068, "total_bits": 39202816, "q_proj": { "group_size": { @@ -25957,7 +25957,7 @@ } }, { - "accuracy": 0.9783055998850614, + "accuracy": 0.978713070275262, "total_bits": 39505664, "q_proj": { "group_size": { @@ -26021,7 +26021,7 @@ } }, { - "accuracy": 0.9798258004011586, + "accuracy": 0.9799865727545694, "total_bits": 39812608, "q_proj": { "group_size": { @@ -26085,7 +26085,7 @@ } }, { - "accuracy": 0.9825452725635841, + "accuracy": 0.9824670746456832, "total_bits": 40245248, "q_proj": { "group_size": { @@ -26146,7 +26146,7 @@ } }, { - "accuracy": 0.9836509863380343, + "accuracy": 0.9840942462324165, "total_bits": 40701952, "q_proj": { "group_size": { @@ -26207,7 +26207,7 @@ } }, { - "accuracy": 0.990372569358442, + "accuracy": 0.9904396518832073, "total_bits": 49384448, "q_proj": { "group_size": { @@ -26268,7 +26268,7 @@ } }, { - "accuracy": 0.9918290077475831, + "accuracy": 0.991957164806081, "total_bits": 50139136, "q_proj": { "group_size": { @@ -26329,7 +26329,7 @@ } }, { - "accuracy": 0.9935184890055098, + "accuracy": 0.9935693005973008, "total_bits": 57183232, "q_proj": { "group_size": { @@ -26381,7 +26381,7 @@ } }, { - "accuracy": 0.9958510975411627, + "accuracy": 0.9956800245854538, "total_bits": 59125760, "q_proj": { "group_size": { @@ -26433,7 +26433,7 @@ } }, { - "accuracy": 0.9982690347533207, + "accuracy": 0.9983127164086909, "total_bits": 76057600, "q_proj": { "group_size": { @@ -26487,7 +26487,7 @@ ], "model.layers.13.mlp": [ { - "accuracy": 0.8881213283166289, + "accuracy": 0.8881413475610316, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -26539,7 +26539,7 @@ } }, { - "accuracy": 0.8913228893652558, + "accuracy": 0.8913296032696962, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -26591,7 +26591,7 @@ } }, { - "accuracy": 0.9091641381382942, + "accuracy": 0.9091385877691209, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -26640,7 +26640,7 @@ } }, { - "accuracy": 0.9148844359442592, + "accuracy": 0.9148472370579839, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -26689,7 +26689,7 @@ } }, { - "accuracy": 0.9427451903466135, + "accuracy": 0.9427352503407747, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -26741,7 +26741,7 @@ } }, { - "accuracy": 0.9474930218420923, + "accuracy": 0.9475003182888031, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -26793,7 +26793,7 @@ } }, { - "accuracy": 0.9552864958532155, + "accuracy": 0.9553025520872325, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -26842,7 +26842,7 @@ } }, { - "accuracy": 0.9698741511674598, + "accuracy": 0.9698639699490741, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -26885,7 +26885,7 @@ } }, { - "accuracy": 0.9725958183407784, + "accuracy": 0.9725840607425198, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -26928,7 +26928,7 @@ } }, { - "accuracy": 0.9707917935447767, + "accuracy": 0.9707706491462886, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -26980,7 +26980,7 @@ } }, { - "accuracy": 0.9744679839350283, + "accuracy": 0.9744554769713432, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -27032,7 +27032,7 @@ } }, { - "accuracy": 0.9851057628402486, + "accuracy": 0.9850956918671727, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -27084,7 +27084,7 @@ } }, { - "accuracy": 0.9872484983643517, + "accuracy": 0.9872497273026966, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -27136,7 +27136,7 @@ } }, { - "accuracy": 0.991783278179355, + "accuracy": 0.9917794451466762, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -27179,7 +27179,7 @@ } }, { - "accuracy": 0.9924297987308819, + "accuracy": 0.9924305994354654, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -27228,7 +27228,7 @@ } }, { - "accuracy": 0.9940613291983027, + "accuracy": 0.9940630609635264, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -27274,7 +27274,7 @@ } }, { - "accuracy": 0.997787944826996, + "accuracy": 0.9977892612514552, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -27316,7 +27316,7 @@ ], "model.layers.14.self_attn": [ { - "accuracy": 0.9095291160047054, + "accuracy": 0.9107716847211123, "total_bits": 20322304, "q_proj": { "group_size": { @@ -27380,7 +27380,7 @@ } }, { - "accuracy": 0.916604476980865, + "accuracy": 0.9153270763345063, "total_bits": 20977664, "q_proj": { "group_size": { @@ -27444,7 +27444,7 @@ } }, { - "accuracy": 0.929648453835398, + "accuracy": 0.929239088203758, "total_bits": 21419264, "q_proj": { "group_size": { @@ -27508,7 +27508,7 @@ } }, { - "accuracy": 0.9462574280332774, + "accuracy": 0.9458540149498731, "total_bits": 25481728, "q_proj": { "group_size": { @@ -27572,7 +27572,7 @@ } }, { - "accuracy": 0.9556420429144055, + "accuracy": 0.9558859334792942, "total_bits": 30051328, "q_proj": { "group_size": { @@ -27636,7 +27636,7 @@ } }, { - "accuracy": 0.9570662553887814, + "accuracy": 0.9568213103339076, "total_bits": 30068480, "q_proj": { "group_size": { @@ -27700,7 +27700,7 @@ } }, { - "accuracy": 0.9738057117210701, + "accuracy": 0.9737680342514068, "total_bits": 38308864, "q_proj": { "group_size": { @@ -27752,7 +27752,7 @@ } }, { - "accuracy": 0.9744380716001615, + "accuracy": 0.9743268551537767, "total_bits": 38326016, "q_proj": { "group_size": { @@ -27804,7 +27804,7 @@ } }, { - "accuracy": 0.9764348154421896, + "accuracy": 0.9764261088566855, "total_bits": 38641152, "q_proj": { "group_size": { @@ -27856,7 +27856,7 @@ } }, { - "accuracy": 0.9776771338656545, + "accuracy": 0.9776871927315369, "total_bits": 39202816, "q_proj": { "group_size": { @@ -27908,7 +27908,7 @@ } }, { - "accuracy": 0.9777979067293927, + "accuracy": 0.9778663711622357, "total_bits": 39505664, "q_proj": { "group_size": { @@ -27972,7 +27972,7 @@ } }, { - "accuracy": 0.9799313422990963, + "accuracy": 0.9794364429544657, "total_bits": 39812608, "q_proj": { "group_size": { @@ -28036,7 +28036,7 @@ } }, { - "accuracy": 0.9821182899177074, + "accuracy": 0.9822900348808616, "total_bits": 40245248, "q_proj": { "group_size": { @@ -28097,7 +28097,7 @@ } }, { - "accuracy": 0.9835141007788479, + "accuracy": 0.9835491182748228, "total_bits": 40701952, "q_proj": { "group_size": { @@ -28158,7 +28158,7 @@ } }, { - "accuracy": 0.9900213863002136, + "accuracy": 0.9899146651732735, "total_bits": 49384448, "q_proj": { "group_size": { @@ -28219,7 +28219,7 @@ } }, { - "accuracy": 0.9917286091367714, + "accuracy": 0.9917932482203469, "total_bits": 50139136, "q_proj": { "group_size": { @@ -28280,7 +28280,7 @@ } }, { - "accuracy": 0.9931586720049381, + "accuracy": 0.9930848326184787, "total_bits": 57183232, "q_proj": { "group_size": { @@ -28332,7 +28332,7 @@ } }, { - "accuracy": 0.9955504036333878, + "accuracy": 0.9955458572658245, "total_bits": 59125760, "q_proj": { "group_size": { @@ -28384,7 +28384,7 @@ } }, { - "accuracy": 0.9982048964957357, + "accuracy": 0.998172156556393, "total_bits": 76057600, "q_proj": { "group_size": { @@ -28438,7 +28438,7 @@ ], "model.layers.14.mlp": [ { - "accuracy": 0.8856116477400064, + "accuracy": 0.8856581686995924, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -28490,7 +28490,7 @@ } }, { - "accuracy": 0.8888828433118761, + "accuracy": 0.8888984327204525, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -28542,7 +28542,7 @@ } }, { - "accuracy": 0.9069123398512602, + "accuracy": 0.9069627402350307, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -28591,7 +28591,7 @@ } }, { - "accuracy": 0.9128925623372197, + "accuracy": 0.912942417897284, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -28640,7 +28640,7 @@ } }, { - "accuracy": 0.941304479027167, + "accuracy": 0.9413316885475069, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -28692,7 +28692,7 @@ } }, { - "accuracy": 0.9461523101199418, + "accuracy": 0.9461551073472947, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -28744,7 +28744,7 @@ } }, { - "accuracy": 0.9542014615144581, + "accuracy": 0.9541904476936907, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -28793,7 +28793,7 @@ } }, { - "accuracy": 0.9689613208174706, + "accuracy": 0.9689564873697236, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -28836,7 +28836,7 @@ } }, { - "accuracy": 0.9718211867148057, + "accuracy": 0.9718167996034026, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -28879,7 +28879,7 @@ } }, { - "accuracy": 0.9700623671524227, + "accuracy": 0.9700558942276984, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -28931,7 +28931,7 @@ } }, { - "accuracy": 0.9738100699614733, + "accuracy": 0.9738077285001054, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -28983,7 +28983,7 @@ } }, { - "accuracy": 0.9847462885081768, + "accuracy": 0.984742330852896, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -29035,7 +29035,7 @@ } }, { - "accuracy": 0.9869353998801671, + "accuracy": 0.9869330606306903, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -29087,7 +29087,7 @@ } }, { - "accuracy": 0.9915596575010568, + "accuracy": 0.9915604586130939, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -29130,7 +29130,7 @@ } }, { - "accuracy": 0.9922743932402227, + "accuracy": 0.9922754485742189, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -29179,7 +29179,7 @@ } }, { - "accuracy": 0.994001913262764, + "accuracy": 0.9940043366223108, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -29225,7 +29225,7 @@ } }, { - "accuracy": 0.9977399868221255, + "accuracy": 0.9977415750472574, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -29267,7 +29267,7 @@ ], "model.layers.15.self_attn": [ { - "accuracy": 0.8960956558585167, + "accuracy": 0.8969894922338426, "total_bits": 20322304, "q_proj": { "group_size": { @@ -29331,7 +29331,7 @@ } }, { - "accuracy": 0.9011814347468317, + "accuracy": 0.9027267415076494, "total_bits": 20977664, "q_proj": { "group_size": { @@ -29395,7 +29395,7 @@ } }, { - "accuracy": 0.9211668102070689, + "accuracy": 0.9212047667242587, "total_bits": 21419264, "q_proj": { "group_size": { @@ -29459,7 +29459,7 @@ } }, { - "accuracy": 0.9372404778841883, + "accuracy": 0.9372139172628522, "total_bits": 25481728, "q_proj": { "group_size": { @@ -29523,7 +29523,7 @@ } }, { - "accuracy": 0.9480563276447356, + "accuracy": 0.947562956949696, "total_bits": 30051328, "q_proj": { "group_size": { @@ -29587,7 +29587,7 @@ } }, { - "accuracy": 0.9493570134509355, + "accuracy": 0.9495445881038904, "total_bits": 30068480, "q_proj": { "group_size": { @@ -29651,7 +29651,7 @@ } }, { - "accuracy": 0.9693998964503407, + "accuracy": 0.9686730967368931, "total_bits": 38308864, "q_proj": { "group_size": { @@ -29703,7 +29703,7 @@ } }, { - "accuracy": 0.9699793298495933, + "accuracy": 0.9693887827452272, "total_bits": 38326016, "q_proj": { "group_size": { @@ -29755,7 +29755,7 @@ } }, { - "accuracy": 0.9737294832011685, + "accuracy": 0.9734829242806882, "total_bits": 38641152, "q_proj": { "group_size": { @@ -29807,7 +29807,7 @@ } }, { - "accuracy": 0.9749459268059582, + "accuracy": 0.9747996828518808, "total_bits": 39202816, "q_proj": { "group_size": { @@ -29859,7 +29859,7 @@ } }, { - "accuracy": 0.9744235388934612, + "accuracy": 0.97373071545735, "total_bits": 39505664, "q_proj": { "group_size": { @@ -29923,7 +29923,7 @@ } }, { - "accuracy": 0.9762074698228389, + "accuracy": 0.9763597372220829, "total_bits": 39812608, "q_proj": { "group_size": { @@ -29987,7 +29987,7 @@ } }, { - "accuracy": 0.9795820181025192, + "accuracy": 0.9797644936479628, "total_bits": 40245248, "q_proj": { "group_size": { @@ -30048,7 +30048,7 @@ } }, { - "accuracy": 0.9818856550846249, + "accuracy": 0.9818511276971549, "total_bits": 40701952, "q_proj": { "group_size": { @@ -30109,7 +30109,7 @@ } }, { - "accuracy": 0.9887084455695003, + "accuracy": 0.988578466232866, "total_bits": 49384448, "q_proj": { "group_size": { @@ -30170,7 +30170,7 @@ } }, { - "accuracy": 0.9908410778734833, + "accuracy": 0.9907873802585527, "total_bits": 50139136, "q_proj": { "group_size": { @@ -30231,7 +30231,7 @@ } }, { - "accuracy": 0.9918821430765092, + "accuracy": 0.9917124712374061, "total_bits": 57183232, "q_proj": { "group_size": { @@ -30283,7 +30283,7 @@ } }, { - "accuracy": 0.9952785526693333, + "accuracy": 0.9953176533745136, "total_bits": 59125760, "q_proj": { "group_size": { @@ -30335,7 +30335,7 @@ } }, { - "accuracy": 0.9978439158585388, + "accuracy": 0.9977985790756065, "total_bits": 76057600, "q_proj": { "group_size": { @@ -30389,7 +30389,7 @@ ], "model.layers.15.mlp": [ { - "accuracy": 0.8757463633082807, + "accuracy": 0.8757757884450257, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -30441,7 +30441,7 @@ } }, { - "accuracy": 0.8795227808877826, + "accuracy": 0.8794931443408132, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -30493,7 +30493,7 @@ } }, { - "accuracy": 0.8993062707595527, + "accuracy": 0.8993033794686198, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -30542,7 +30542,7 @@ } }, { - "accuracy": 0.9060351783409715, + "accuracy": 0.9060217761434615, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -30591,7 +30591,7 @@ } }, { - "accuracy": 0.9363452955149114, + "accuracy": 0.9363326502498239, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -30643,7 +30643,7 @@ } }, { - "accuracy": 0.941579197300598, + "accuracy": 0.9415606025140733, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -30695,7 +30695,7 @@ } }, { - "accuracy": 0.9505553806666285, + "accuracy": 0.9505282503087074, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -30744,7 +30744,7 @@ } }, { - "accuracy": 0.9661785268690437, + "accuracy": 0.9661882345099002, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -30787,7 +30787,7 @@ } }, { - "accuracy": 0.9692711803363636, + "accuracy": 0.969285067403689, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -30830,7 +30830,7 @@ } }, { - "accuracy": 0.9674788797274232, + "accuracy": 0.9674791201250628, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -30882,7 +30882,7 @@ } }, { - "accuracy": 0.9715715986676514, + "accuracy": 0.971582017140463, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -30934,7 +30934,7 @@ } }, { - "accuracy": 0.9834197586169466, + "accuracy": 0.9834182569175027, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -30986,7 +30986,7 @@ } }, { - "accuracy": 0.9858121484867297, + "accuracy": 0.9858089934568852, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -31038,7 +31038,7 @@ } }, { - "accuracy": 0.9907642401522025, + "accuracy": 0.9907644363120198, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -31081,7 +31081,7 @@ } }, { - "accuracy": 0.9915993981121574, + "accuracy": 0.991599121276522, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -31130,7 +31130,7 @@ } }, { - "accuracy": 0.9935358766233549, + "accuracy": 0.9935369456070475, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -31176,7 +31176,7 @@ } }, { - "accuracy": 0.9974906315765111, + "accuracy": 0.9974924484267831, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -31218,7 +31218,7 @@ ], "model.layers.16.self_attn": [ { - "accuracy": 0.9075210015289485, + "accuracy": 0.9082380309700966, "total_bits": 20322304, "q_proj": { "group_size": { @@ -31282,7 +31282,7 @@ } }, { - "accuracy": 0.9090233980678022, + "accuracy": 0.9121404173783958, "total_bits": 20977664, "q_proj": { "group_size": { @@ -31346,7 +31346,7 @@ } }, { - "accuracy": 0.926638713106513, + "accuracy": 0.9277786235325038, "total_bits": 21419264, "q_proj": { "group_size": { @@ -31410,7 +31410,7 @@ } }, { - "accuracy": 0.9405981756281108, + "accuracy": 0.9420057216193527, "total_bits": 25481728, "q_proj": { "group_size": { @@ -31474,7 +31474,7 @@ } }, { - "accuracy": 0.952345586149022, + "accuracy": 0.9525234028697014, "total_bits": 30051328, "q_proj": { "group_size": { @@ -31538,7 +31538,7 @@ } }, { - "accuracy": 0.9531309120357037, + "accuracy": 0.9548692796379328, "total_bits": 30068480, "q_proj": { "group_size": { @@ -31602,7 +31602,7 @@ } }, { - "accuracy": 0.9726142945000902, + "accuracy": 0.9729025661945343, "total_bits": 38308864, "q_proj": { "group_size": { @@ -31654,7 +31654,7 @@ } }, { - "accuracy": 0.9741090836469084, + "accuracy": 0.9746258014347404, "total_bits": 38326016, "q_proj": { "group_size": { @@ -31706,7 +31706,7 @@ } }, { - "accuracy": 0.9761942652985454, + "accuracy": 0.9762138307560235, "total_bits": 38641152, "q_proj": { "group_size": { @@ -31758,7 +31758,7 @@ } }, { - "accuracy": 0.9774578559445217, + "accuracy": 0.9770606078673154, "total_bits": 39202816, "q_proj": { "group_size": { @@ -31810,7 +31810,7 @@ } }, { - "accuracy": 0.9768870737170801, + "accuracy": 0.976882538292557, "total_bits": 39505664, "q_proj": { "group_size": { @@ -31874,7 +31874,7 @@ } }, { - "accuracy": 0.9781158120604232, + "accuracy": 0.9778225866612047, "total_bits": 39812608, "q_proj": { "group_size": { @@ -31938,7 +31938,7 @@ } }, { - "accuracy": 0.9819771151524037, + "accuracy": 0.9818001367384568, "total_bits": 40245248, "q_proj": { "group_size": { @@ -31999,7 +31999,7 @@ } }, { - "accuracy": 0.9830977199599147, + "accuracy": 0.9828822681447491, "total_bits": 40701952, "q_proj": { "group_size": { @@ -32060,7 +32060,7 @@ } }, { - "accuracy": 0.9899077902082354, + "accuracy": 0.9899290261673741, "total_bits": 49384448, "q_proj": { "group_size": { @@ -32121,7 +32121,7 @@ } }, { - "accuracy": 0.9916064245044254, + "accuracy": 0.9917734954797197, "total_bits": 50139136, "q_proj": { "group_size": { @@ -32182,7 +32182,7 @@ } }, { - "accuracy": 0.9927945938543417, + "accuracy": 0.9928468686994165, "total_bits": 57183232, "q_proj": { "group_size": { @@ -32234,7 +32234,7 @@ } }, { - "accuracy": 0.9958008275134489, + "accuracy": 0.9958058236807119, "total_bits": 59125760, "q_proj": { "group_size": { @@ -32286,7 +32286,7 @@ } }, { - "accuracy": 0.9981787492506555, + "accuracy": 0.998137492017122, "total_bits": 76057600, "q_proj": { "group_size": { @@ -32340,7 +32340,7 @@ ], "model.layers.16.mlp": [ { - "accuracy": 0.8707250105217099, + "accuracy": 0.870710012037307, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -32392,7 +32392,7 @@ } }, { - "accuracy": 0.8745106346905231, + "accuracy": 0.8744872231036425, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -32444,7 +32444,7 @@ } }, { - "accuracy": 0.8954619406722486, + "accuracy": 0.8954966012388468, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -32493,7 +32493,7 @@ } }, { - "accuracy": 0.9026182843372226, + "accuracy": 0.9026583167724311, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -32542,7 +32542,7 @@ } }, { - "accuracy": 0.9338920915033668, + "accuracy": 0.9338845473248512, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -32594,7 +32594,7 @@ } }, { - "accuracy": 0.9393174995202571, + "accuracy": 0.9393400480039418, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -32646,7 +32646,7 @@ } }, { - "accuracy": 0.9486013525165617, + "accuracy": 0.9486405709758401, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -32695,7 +32695,7 @@ } }, { - "accuracy": 0.9647956977132708, + "accuracy": 0.9648088419344276, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -32738,7 +32738,7 @@ } }, { - "accuracy": 0.9681419640546665, + "accuracy": 0.9681426691822708, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -32781,7 +32781,7 @@ } }, { - "accuracy": 0.9662699493346736, + "accuracy": 0.9662436044309288, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -32833,7 +32833,7 @@ } }, { - "accuracy": 0.9704979130765423, + "accuracy": 0.970503983204253, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -32885,7 +32885,7 @@ } }, { - "accuracy": 0.9827976264059544, + "accuracy": 0.9827967949677259, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -32937,7 +32937,7 @@ } }, { - "accuracy": 0.985281364817638, + "accuracy": 0.9852806397830136, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -32989,7 +32989,7 @@ } }, { - "accuracy": 0.990441148460377, + "accuracy": 0.9904438178054988, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -33032,7 +33032,7 @@ } }, { - "accuracy": 0.9912717372062616, + "accuracy": 0.9912758679129183, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -33081,7 +33081,7 @@ } }, { - "accuracy": 0.9933044076897204, + "accuracy": 0.9933096571476199, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -33127,7 +33127,7 @@ } }, { - "accuracy": 0.9974210811924422, + "accuracy": 0.997423453751253, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -33169,7 +33169,7 @@ ], "model.layers.17.self_attn": [ { - "accuracy": 0.9153526779264212, + "accuracy": 0.9123064079321921, "total_bits": 20322304, "q_proj": { "group_size": { @@ -33233,7 +33233,7 @@ } }, { - "accuracy": 0.9189303005114198, + "accuracy": 0.9163885992020369, "total_bits": 20977664, "q_proj": { "group_size": { @@ -33297,7 +33297,7 @@ } }, { - "accuracy": 0.931039173156023, + "accuracy": 0.9304717793129385, "total_bits": 21419264, "q_proj": { "group_size": { @@ -33361,7 +33361,7 @@ } }, { - "accuracy": 0.946169487433508, + "accuracy": 0.9457204439677298, "total_bits": 25481728, "q_proj": { "group_size": { @@ -33425,7 +33425,7 @@ } }, { - "accuracy": 0.9562859626021236, + "accuracy": 0.9561849331948906, "total_bits": 30051328, "q_proj": { "group_size": { @@ -33489,7 +33489,7 @@ } }, { - "accuracy": 0.9575782786123455, + "accuracy": 0.9566359755117446, "total_bits": 30068480, "q_proj": { "group_size": { @@ -33553,7 +33553,7 @@ } }, { - "accuracy": 0.9736042366130278, + "accuracy": 0.9740906710503623, "total_bits": 38308864, "q_proj": { "group_size": { @@ -33605,7 +33605,7 @@ } }, { - "accuracy": 0.9744416913017631, + "accuracy": 0.9744484331458807, "total_bits": 38326016, "q_proj": { "group_size": { @@ -33657,7 +33657,7 @@ } }, { - "accuracy": 0.9770701255183667, + "accuracy": 0.9772818374913186, "total_bits": 38641152, "q_proj": { "group_size": { @@ -33709,7 +33709,7 @@ } }, { - "accuracy": 0.9780390695668757, + "accuracy": 0.978236723691225, "total_bits": 39202816, "q_proj": { "group_size": { @@ -33761,7 +33761,7 @@ } }, { - "accuracy": 0.9779655180172995, + "accuracy": 0.97689908684697, "total_bits": 39505664, "q_proj": { "group_size": { @@ -33825,7 +33825,7 @@ } }, { - "accuracy": 0.9796391371637583, + "accuracy": 0.9795279368991032, "total_bits": 39812608, "q_proj": { "group_size": { @@ -33889,7 +33889,7 @@ } }, { - "accuracy": 0.9821417613420635, + "accuracy": 0.98225297476165, "total_bits": 40245248, "q_proj": { "group_size": { @@ -33950,7 +33950,7 @@ } }, { - "accuracy": 0.9835524157388136, + "accuracy": 0.9835034856805578, "total_bits": 40701952, "q_proj": { "group_size": { @@ -34011,7 +34011,7 @@ } }, { - "accuracy": 0.9898466859012842, + "accuracy": 0.9899880553712137, "total_bits": 49384448, "q_proj": { "group_size": { @@ -34072,7 +34072,7 @@ } }, { - "accuracy": 0.9916954462532885, + "accuracy": 0.9917687639826909, "total_bits": 50139136, "q_proj": { "group_size": { @@ -34133,7 +34133,7 @@ } }, { - "accuracy": 0.992595004150644, + "accuracy": 0.992849877657136, "total_bits": 57183232, "q_proj": { "group_size": { @@ -34185,7 +34185,7 @@ } }, { - "accuracy": 0.9956898246018682, + "accuracy": 0.9956645138736349, "total_bits": 59125760, "q_proj": { "group_size": { @@ -34237,7 +34237,7 @@ } }, { - "accuracy": 0.9980364417788223, + "accuracy": 0.9980730263341684, "total_bits": 76057600, "q_proj": { "group_size": { @@ -34291,7 +34291,7 @@ ], "model.layers.17.mlp": [ { - "accuracy": 0.8728603753261268, + "accuracy": 0.8728781985118985, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -34343,7 +34343,7 @@ } }, { - "accuracy": 0.8762580277398229, + "accuracy": 0.876280159689486, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -34395,7 +34395,7 @@ } }, { - "accuracy": 0.8967053289525211, + "accuracy": 0.8967352961190045, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -34444,7 +34444,7 @@ } }, { - "accuracy": 0.9035036060959101, + "accuracy": 0.9035190902650356, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -34493,7 +34493,7 @@ } }, { - "accuracy": 0.9348402414470911, + "accuracy": 0.9348068400286138, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -34545,7 +34545,7 @@ } }, { - "accuracy": 0.9400133183225989, + "accuracy": 0.9400173944886774, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -34597,7 +34597,7 @@ } }, { - "accuracy": 0.9491435112431645, + "accuracy": 0.9491662157233804, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -34646,7 +34646,7 @@ } }, { - "accuracy": 0.965498898178339, + "accuracy": 0.9654821592848748, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -34689,7 +34689,7 @@ } }, { - "accuracy": 0.9687769180163741, + "accuracy": 0.9687824887223542, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -34732,7 +34732,7 @@ } }, { - "accuracy": 0.9667592031182721, + "accuracy": 0.9667529048165306, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -34784,7 +34784,7 @@ } }, { - "accuracy": 0.9708633943228051, + "accuracy": 0.9708699659677222, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -34836,7 +34836,7 @@ } }, { - "accuracy": 0.9830579466070049, + "accuracy": 0.9830639206338674, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -34888,7 +34888,7 @@ } }, { - "accuracy": 0.9854786905343644, + "accuracy": 0.9854768795194104, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -34940,7 +34940,7 @@ } }, { - "accuracy": 0.9906953814788722, + "accuracy": 0.9906972449389286, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -34983,7 +34983,7 @@ } }, { - "accuracy": 0.9914268311404157, + "accuracy": 0.9914270240697078, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -35032,7 +35032,7 @@ } }, { - "accuracy": 0.9933539273042697, + "accuracy": 0.9933541154896375, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -35078,7 +35078,7 @@ } }, { - "accuracy": 0.9975086938648019, + "accuracy": 0.9975105525954859, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -35120,7 +35120,7 @@ ], "model.layers.18.self_attn": [ { - "accuracy": 0.9103264245204628, + "accuracy": 0.9088634215295315, "total_bits": 20322304, "q_proj": { "group_size": { @@ -35184,7 +35184,7 @@ } }, { - "accuracy": 0.913609532173723, + "accuracy": 0.9153703120537102, "total_bits": 20977664, "q_proj": { "group_size": { @@ -35248,7 +35248,7 @@ } }, { - "accuracy": 0.9246024615131319, + "accuracy": 0.9253094680607319, "total_bits": 21419264, "q_proj": { "group_size": { @@ -35312,7 +35312,7 @@ } }, { - "accuracy": 0.9399101524613798, + "accuracy": 0.9410159010440111, "total_bits": 25481728, "q_proj": { "group_size": { @@ -35376,7 +35376,7 @@ } }, { - "accuracy": 0.952972172293812, + "accuracy": 0.953566029900685, "total_bits": 30051328, "q_proj": { "group_size": { @@ -35440,7 +35440,7 @@ } }, { - "accuracy": 0.954062441829592, + "accuracy": 0.9547900941688567, "total_bits": 30068480, "q_proj": { "group_size": { @@ -35504,7 +35504,7 @@ } }, { - "accuracy": 0.9705156976124272, + "accuracy": 0.9709254525369033, "total_bits": 38308864, "q_proj": { "group_size": { @@ -35556,7 +35556,7 @@ } }, { - "accuracy": 0.9714527239557356, + "accuracy": 0.972082293825224, "total_bits": 38326016, "q_proj": { "group_size": { @@ -35608,7 +35608,7 @@ } }, { - "accuracy": 0.9747130553005263, + "accuracy": 0.9741814552107826, "total_bits": 38641152, "q_proj": { "group_size": { @@ -35660,7 +35660,7 @@ } }, { - "accuracy": 0.9758984125219285, + "accuracy": 0.9754220984177664, "total_bits": 39202816, "q_proj": { "group_size": { @@ -35712,7 +35712,7 @@ } }, { - "accuracy": 0.97633627417963, + "accuracy": 0.9760375062469393, "total_bits": 39505664, "q_proj": { "group_size": { @@ -35776,7 +35776,7 @@ } }, { - "accuracy": 0.9781932511832565, + "accuracy": 0.9775549359619617, "total_bits": 39812608, "q_proj": { "group_size": { @@ -35840,7 +35840,7 @@ } }, { - "accuracy": 0.9803400166565552, + "accuracy": 0.9803462373092771, "total_bits": 40245248, "q_proj": { "group_size": { @@ -35901,7 +35901,7 @@ } }, { - "accuracy": 0.9822616456076503, + "accuracy": 0.9822041114093736, "total_bits": 40701952, "q_proj": { "group_size": { @@ -35962,7 +35962,7 @@ } }, { - "accuracy": 0.9889336972264573, + "accuracy": 0.9889042469440028, "total_bits": 49384448, "q_proj": { "group_size": { @@ -36023,7 +36023,7 @@ } }, { - "accuracy": 0.9910705528454855, + "accuracy": 0.9911492743995041, "total_bits": 50139136, "q_proj": { "group_size": { @@ -36084,7 +36084,7 @@ } }, { - "accuracy": 0.9917217692127451, + "accuracy": 0.9917807224555872, "total_bits": 57183232, "q_proj": { "group_size": { @@ -36136,7 +36136,7 @@ } }, { - "accuracy": 0.9951845193863846, + "accuracy": 0.9951703978586011, "total_bits": 59125760, "q_proj": { "group_size": { @@ -36188,7 +36188,7 @@ } }, { - "accuracy": 0.9977679173025535, + "accuracy": 0.9977872487943387, "total_bits": 76057600, "q_proj": { "group_size": { @@ -36242,7 +36242,7 @@ ], "model.layers.18.mlp": [ { - "accuracy": 0.8708415194414556, + "accuracy": 0.8708666283637285, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -36294,7 +36294,7 @@ } }, { - "accuracy": 0.8742274958640337, + "accuracy": 0.8742867028340697, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -36346,7 +36346,7 @@ } }, { - "accuracy": 0.8939676131121814, + "accuracy": 0.8940495727583766, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -36395,7 +36395,7 @@ } }, { - "accuracy": 0.9005825412459671, + "accuracy": 0.900671096984297, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -36444,7 +36444,7 @@ } }, { - "accuracy": 0.9338501647580415, + "accuracy": 0.9338334542699158, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -36496,7 +36496,7 @@ } }, { - "accuracy": 0.9389537025708705, + "accuracy": 0.9389386961702257, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -36548,7 +36548,7 @@ } }, { - "accuracy": 0.9479271811433136, + "accuracy": 0.9479005362372845, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -36597,7 +36597,7 @@ } }, { - "accuracy": 0.9651007237844169, + "accuracy": 0.9650991873349994, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -36640,7 +36640,7 @@ } }, { - "accuracy": 0.9683221388841048, + "accuracy": 0.9683199158171192, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -36683,7 +36683,7 @@ } }, { - "accuracy": 0.9662486690795049, + "accuracy": 0.9662623617332429, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -36735,7 +36735,7 @@ } }, { - "accuracy": 0.970382378436625, + "accuracy": 0.9703731988556683, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -36787,7 +36787,7 @@ } }, { - "accuracy": 0.9828338834340684, + "accuracy": 0.9828364161076024, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -36839,7 +36839,7 @@ } }, { - "accuracy": 0.9852446754230186, + "accuracy": 0.9852500431588851, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -36891,7 +36891,7 @@ } }, { - "accuracy": 0.9906159875681624, + "accuracy": 0.9906109553994611, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -36934,7 +36934,7 @@ } }, { - "accuracy": 0.9913037064252421, + "accuracy": 0.9913024957058951, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -36983,7 +36983,7 @@ } }, { - "accuracy": 0.9931552672060207, + "accuracy": 0.9931536499934737, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -37029,7 +37029,7 @@ } }, { - "accuracy": 0.9974773659923812, + "accuracy": 0.9974787205865141, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -37071,7 +37071,7 @@ ], "model.layers.19.self_attn": [ { - "accuracy": 0.91381651815027, + "accuracy": 0.9176479880698025, "total_bits": 20322304, "q_proj": { "group_size": { @@ -37135,7 +37135,7 @@ } }, { - "accuracy": 0.9172278349287808, + "accuracy": 0.9197240476496518, "total_bits": 20977664, "q_proj": { "group_size": { @@ -37199,7 +37199,7 @@ } }, { - "accuracy": 0.9367378961760551, + "accuracy": 0.9376092075835913, "total_bits": 21419264, "q_proj": { "group_size": { @@ -37263,7 +37263,7 @@ } }, { - "accuracy": 0.9482615378219634, + "accuracy": 0.9494412580970675, "total_bits": 25481728, "q_proj": { "group_size": { @@ -37327,7 +37327,7 @@ } }, { - "accuracy": 0.9578437705058604, + "accuracy": 0.9588730656541884, "total_bits": 30051328, "q_proj": { "group_size": { @@ -37391,7 +37391,7 @@ } }, { - "accuracy": 0.9583659318741411, + "accuracy": 0.9594525077845901, "total_bits": 30068480, "q_proj": { "group_size": { @@ -37455,7 +37455,7 @@ } }, { - "accuracy": 0.9727135031716898, + "accuracy": 0.9734676006482914, "total_bits": 38308864, "q_proj": { "group_size": { @@ -37507,7 +37507,7 @@ } }, { - "accuracy": 0.9750595226651058, + "accuracy": 0.9746841629967093, "total_bits": 38326016, "q_proj": { "group_size": { @@ -37559,7 +37559,7 @@ } }, { - "accuracy": 0.9770815862575546, + "accuracy": 0.9769488971214741, "total_bits": 38641152, "q_proj": { "group_size": { @@ -37611,7 +37611,7 @@ } }, { - "accuracy": 0.9780753076775, + "accuracy": 0.9778047652216628, "total_bits": 39202816, "q_proj": { "group_size": { @@ -37663,7 +37663,7 @@ } }, { - "accuracy": 0.9783113790908828, + "accuracy": 0.9784690069500357, "total_bits": 39505664, "q_proj": { "group_size": { @@ -37727,7 +37727,7 @@ } }, { - "accuracy": 0.980536918505095, + "accuracy": 0.980993464589119, "total_bits": 39812608, "q_proj": { "group_size": { @@ -37791,7 +37791,7 @@ } }, { - "accuracy": 0.9827054542256519, + "accuracy": 0.9825513790128753, "total_bits": 40245248, "q_proj": { "group_size": { @@ -37852,7 +37852,7 @@ } }, { - "accuracy": 0.9847821660223417, + "accuracy": 0.9846148652723059, "total_bits": 40701952, "q_proj": { "group_size": { @@ -37913,7 +37913,7 @@ } }, { - "accuracy": 0.9898612038814463, + "accuracy": 0.9900583295966499, "total_bits": 49384448, "q_proj": { "group_size": { @@ -37974,7 +37974,7 @@ } }, { - "accuracy": 0.9919800390198361, + "accuracy": 0.9919769621046726, "total_bits": 50139136, "q_proj": { "group_size": { @@ -38035,7 +38035,7 @@ } }, { - "accuracy": 0.9917078913131263, + "accuracy": 0.9918994125619065, "total_bits": 57183232, "q_proj": { "group_size": { @@ -38087,7 +38087,7 @@ } }, { - "accuracy": 0.9959743874933338, + "accuracy": 0.9959455616772175, "total_bits": 59125760, "q_proj": { "group_size": { @@ -38139,7 +38139,7 @@ } }, { - "accuracy": 0.9977810490236152, + "accuracy": 0.9978194363793591, "total_bits": 76057600, "q_proj": { "group_size": { @@ -38193,7 +38193,7 @@ ], "model.layers.19.mlp": [ { - "accuracy": 0.8663804107345641, + "accuracy": 0.8664225754328072, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -38245,7 +38245,7 @@ } }, { - "accuracy": 0.8698392519727349, + "accuracy": 0.8698052424006164, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -38297,7 +38297,7 @@ } }, { - "accuracy": 0.8900767364539206, + "accuracy": 0.8901418377645314, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -38346,7 +38346,7 @@ } }, { - "accuracy": 0.8968699816614389, + "accuracy": 0.8969293641857803, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -38395,7 +38395,7 @@ } }, { - "accuracy": 0.9313416024670005, + "accuracy": 0.9313398345839232, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -38447,7 +38447,7 @@ } }, { - "accuracy": 0.9366983594372869, + "accuracy": 0.936706930398941, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -38499,7 +38499,7 @@ } }, { - "accuracy": 0.9459799854084849, + "accuracy": 0.9459720670711249, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -38548,7 +38548,7 @@ } }, { - "accuracy": 0.9638793664053082, + "accuracy": 0.9638726895209402, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -38591,7 +38591,7 @@ } }, { - "accuracy": 0.9672302826074883, + "accuracy": 0.9672257042257115, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -38634,7 +38634,7 @@ } }, { - "accuracy": 0.965055137174204, + "accuracy": 0.9650480181444436, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -38686,7 +38686,7 @@ } }, { - "accuracy": 0.969295253045857, + "accuracy": 0.9692801123019308, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -38738,7 +38738,7 @@ } }, { - "accuracy": 0.9822289427975193, + "accuracy": 0.9822135223075747, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -38790,7 +38790,7 @@ } }, { - "accuracy": 0.9847121201455593, + "accuracy": 0.9847081050393172, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -38842,7 +38842,7 @@ } }, { - "accuracy": 0.9903098595677875, + "accuracy": 0.9903073518071324, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -38885,7 +38885,7 @@ } }, { - "accuracy": 0.9909830195247196, + "accuracy": 0.9909829886746593, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -38934,7 +38934,7 @@ } }, { - "accuracy": 0.9928994243964553, + "accuracy": 0.9929009438201319, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -38980,7 +38980,7 @@ } }, { - "accuracy": 0.9973993370658718, + "accuracy": 0.9974026714044157, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -39022,7 +39022,7 @@ ], "model.layers.20.self_attn": [ { - "accuracy": 0.9226470687426627, + "accuracy": 0.919053936842829, "total_bits": 20322304, "q_proj": { "group_size": { @@ -39086,7 +39086,7 @@ } }, { - "accuracy": 0.9225568282417953, + "accuracy": 0.9231919501908123, "total_bits": 20977664, "q_proj": { "group_size": { @@ -39150,7 +39150,7 @@ } }, { - "accuracy": 0.9419956349302083, + "accuracy": 0.9416922819800675, "total_bits": 21419264, "q_proj": { "group_size": { @@ -39214,7 +39214,7 @@ } }, { - "accuracy": 0.9531588517129421, + "accuracy": 0.9527852539904416, "total_bits": 25481728, "q_proj": { "group_size": { @@ -39278,7 +39278,7 @@ } }, { - "accuracy": 0.9609904403332621, + "accuracy": 0.9605993672739714, "total_bits": 30051328, "q_proj": { "group_size": { @@ -39342,7 +39342,7 @@ } }, { - "accuracy": 0.962792478967458, + "accuracy": 0.9608008908107877, "total_bits": 30068480, "q_proj": { "group_size": { @@ -39406,7 +39406,7 @@ } }, { - "accuracy": 0.9758201267104596, + "accuracy": 0.9760824019322172, "total_bits": 38308864, "q_proj": { "group_size": { @@ -39458,7 +39458,7 @@ } }, { - "accuracy": 0.976430531241931, + "accuracy": 0.9765508801210672, "total_bits": 38326016, "q_proj": { "group_size": { @@ -39510,7 +39510,7 @@ } }, { - "accuracy": 0.9788923836313188, + "accuracy": 0.9790359369944781, "total_bits": 38641152, "q_proj": { "group_size": { @@ -39562,7 +39562,7 @@ } }, { - "accuracy": 0.9793093597982079, + "accuracy": 0.9795548697002232, "total_bits": 39202816, "q_proj": { "group_size": { @@ -39614,7 +39614,7 @@ } }, { - "accuracy": 0.9796468628337607, + "accuracy": 0.9799470123834908, "total_bits": 39505664, "q_proj": { "group_size": { @@ -39678,7 +39678,7 @@ } }, { - "accuracy": 0.9815771167632192, + "accuracy": 0.9812144176103175, "total_bits": 39812608, "q_proj": { "group_size": { @@ -39742,7 +39742,7 @@ } }, { - "accuracy": 0.9845800460898317, + "accuracy": 0.9844042120384984, "total_bits": 40245248, "q_proj": { "group_size": { @@ -39803,7 +39803,7 @@ } }, { - "accuracy": 0.9861196175334044, + "accuracy": 0.9864334944286384, "total_bits": 40701952, "q_proj": { "group_size": { @@ -39864,7 +39864,7 @@ } }, { - "accuracy": 0.9916834983741865, + "accuracy": 0.9916316523449495, "total_bits": 49384448, "q_proj": { "group_size": { @@ -39925,7 +39925,7 @@ } }, { - "accuracy": 0.992955818248447, + "accuracy": 0.9930807327327784, "total_bits": 50139136, "q_proj": { "group_size": { @@ -39986,7 +39986,7 @@ } }, { - "accuracy": 0.9934278220171109, + "accuracy": 0.9934231227671262, "total_bits": 57183232, "q_proj": { "group_size": { @@ -40038,7 +40038,7 @@ } }, { - "accuracy": 0.996440913353581, + "accuracy": 0.9965193888783688, "total_bits": 59125760, "q_proj": { "group_size": { @@ -40090,7 +40090,7 @@ } }, { - "accuracy": 0.9982685764698545, + "accuracy": 0.9983226815747912, "total_bits": 76057600, "q_proj": { "group_size": { @@ -40144,7 +40144,7 @@ ], "model.layers.20.mlp": [ { - "accuracy": 0.8603538069874048, + "accuracy": 0.8603928601369262, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -40196,7 +40196,7 @@ } }, { - "accuracy": 0.8641403624787927, + "accuracy": 0.8641671189107001, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -40248,7 +40248,7 @@ } }, { - "accuracy": 0.8846050030551851, + "accuracy": 0.8845889158546925, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -40297,7 +40297,7 @@ } }, { - "accuracy": 0.8913812898099422, + "accuracy": 0.8913620258681476, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -40346,7 +40346,7 @@ } }, { - "accuracy": 0.9281160836108029, + "accuracy": 0.9280672203749418, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -40398,7 +40398,7 @@ } }, { - "accuracy": 0.9339064590167254, + "accuracy": 0.9338786187581718, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -40450,7 +40450,7 @@ } }, { - "accuracy": 0.94321479042992, + "accuracy": 0.9432024005800486, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -40499,7 +40499,7 @@ } }, { - "accuracy": 0.9621658476535231, + "accuracy": 0.9621703654993325, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -40542,7 +40542,7 @@ } }, { - "accuracy": 0.9657112886197865, + "accuracy": 0.9657243186375126, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -40585,7 +40585,7 @@ } }, { - "accuracy": 0.9633610309101641, + "accuracy": 0.9633581631351262, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -40637,7 +40637,7 @@ } }, { - "accuracy": 0.9679203201085329, + "accuracy": 0.9679346160264686, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -40689,7 +40689,7 @@ } }, { - "accuracy": 0.9813444587634876, + "accuracy": 0.981346708140336, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -40741,7 +40741,7 @@ } }, { - "accuracy": 0.9840119720320217, + "accuracy": 0.9840151931275614, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -40793,7 +40793,7 @@ } }, { - "accuracy": 0.989789031620603, + "accuracy": 0.989788303966634, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -40836,7 +40836,7 @@ } }, { - "accuracy": 0.9905532479169779, + "accuracy": 0.9905513109406456, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -40885,7 +40885,7 @@ } }, { - "accuracy": 0.9924720326380339, + "accuracy": 0.9924696069501806, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -40931,7 +40931,7 @@ } }, { - "accuracy": 0.9972619387554005, + "accuracy": 0.9972656247846317, "total_bits": 278220352, "gate_proj": { "group_size": { @@ -40973,7 +40973,7 @@ ], "model.layers.21.self_attn": [ { - "accuracy": 0.9182253973558545, + "accuracy": 0.9183254987001419, "total_bits": 20322304, "q_proj": { "group_size": { @@ -41037,7 +41037,7 @@ } }, { - "accuracy": 0.9243325092829764, + "accuracy": 0.9249476795084774, "total_bits": 20977664, "q_proj": { "group_size": { @@ -41101,7 +41101,7 @@ } }, { - "accuracy": 0.9369929884560406, + "accuracy": 0.9377971803769469, "total_bits": 21419264, "q_proj": { "group_size": { @@ -41165,7 +41165,7 @@ } }, { - "accuracy": 0.9504585885442793, + "accuracy": 0.9513013726100326, "total_bits": 25481728, "q_proj": { "group_size": { @@ -41229,7 +41229,7 @@ } }, { - "accuracy": 0.9591148681938648, + "accuracy": 0.9601939956191927, "total_bits": 30051328, "q_proj": { "group_size": { @@ -41293,7 +41293,7 @@ } }, { - "accuracy": 0.9612603934947401, + "accuracy": 0.9612989106681198, "total_bits": 30068480, "q_proj": { "group_size": { @@ -41357,7 +41357,7 @@ } }, { - "accuracy": 0.9768199414247647, + "accuracy": 0.9766241102479398, "total_bits": 38308864, "q_proj": { "group_size": { @@ -41409,7 +41409,7 @@ } }, { - "accuracy": 0.9775638175196946, + "accuracy": 0.9777308126213029, "total_bits": 38326016, "q_proj": { "group_size": { @@ -41461,7 +41461,7 @@ } }, { - "accuracy": 0.9790954444324598, + "accuracy": 0.9793567762244493, "total_bits": 38641152, "q_proj": { "group_size": { @@ -41513,7 +41513,7 @@ } }, { - "accuracy": 0.9794533755630255, + "accuracy": 0.9800748381530866, "total_bits": 39202816, "q_proj": { "group_size": { @@ -41565,7 +41565,7 @@ } }, { - "accuracy": 0.9799003408988938, + "accuracy": 0.9803644901840016, "total_bits": 39505664, "q_proj": { "group_size": { @@ -41629,7 +41629,7 @@ } }, { - "accuracy": 0.9812384465476498, + "accuracy": 0.9816934096161276, "total_bits": 39812608, "q_proj": { "group_size": { @@ -41693,7 +41693,7 @@ } }, { - "accuracy": 0.9845880307839252, + "accuracy": 0.9846250819973648, "total_bits": 40245248, "q_proj": { "group_size": { @@ -41754,7 +41754,7 @@ } }, { - "accuracy": 0.9859071526443586, + "accuracy": 0.9856326691806316, "total_bits": 40701952, "q_proj": { "group_size": { @@ -41815,7 +41815,7 @@ } }, { - "accuracy": 0.9912090235156938, + "accuracy": 0.9912999818916433, "total_bits": 49384448, "q_proj": { "group_size": { @@ -41876,7 +41876,7 @@ } }, { - "accuracy": 0.9928324061038438, + "accuracy": 0.9928109946486074, "total_bits": 50139136, "q_proj": { "group_size": { @@ -41937,7 +41937,7 @@ } }, { - "accuracy": 0.9936406589695252, + "accuracy": 0.9937434990715701, "total_bits": 57183232, "q_proj": { "group_size": { @@ -41989,7 +41989,7 @@ } }, { - "accuracy": 0.9962718351453077, + "accuracy": 0.9962626121123321, "total_bits": 59125760, "q_proj": { "group_size": { @@ -42041,7 +42041,7 @@ } }, { - "accuracy": 0.998356145391881, + "accuracy": 0.9983449484207085, "total_bits": 76057600, "q_proj": { "group_size": { @@ -42095,7 +42095,7 @@ ], "model.layers.21.mlp": [ { - "accuracy": 0.8678224682807922, + "accuracy": 0.8677523634396493, "total_bits": 77888880, "gate_proj": { "group_size": { @@ -42147,7 +42147,7 @@ } }, { - "accuracy": 0.871506676543504, + "accuracy": 0.8714931388385594, "total_bits": 80772464, "gate_proj": { "group_size": { @@ -42199,7 +42199,7 @@ } }, { - "accuracy": 0.8884445764124393, + "accuracy": 0.888358716852963, "total_bits": 90172672, "gate_proj": { "group_size": { @@ -42248,7 +42248,7 @@ } }, { - "accuracy": 0.8937292587943375, + "accuracy": 0.8936427589505911, "total_bits": 101117184, "gate_proj": { "group_size": { @@ -42297,7 +42297,7 @@ } }, { - "accuracy": 0.931507452391088, + "accuracy": 0.9315323932096362, "total_bits": 113848208, "gate_proj": { "group_size": { @@ -42349,7 +42349,7 @@ } }, { - "accuracy": 0.9377884943969548, + "accuracy": 0.937734718201682, "total_bits": 116734208, "gate_proj": { "group_size": { @@ -42401,7 +42401,7 @@ } }, { - "accuracy": 0.9450552228372544, + "accuracy": 0.9449923397041857, "total_bits": 125469072, "gate_proj": { "group_size": { @@ -42450,7 +42450,7 @@ } }, { - "accuracy": 0.9632573653943837, + "accuracy": 0.9632590070832521, "total_bits": 143308944, "gate_proj": { "group_size": { @@ -42493,7 +42493,7 @@ } }, { - "accuracy": 0.9666756325168535, + "accuracy": 0.9666628061095253, "total_bits": 145422592, "gate_proj": { "group_size": { @@ -42536,7 +42536,7 @@ } }, { - "accuracy": 0.9644941638689488, + "accuracy": 0.9644571125973016, "total_bits": 147861392, "gate_proj": { "group_size": { @@ -42588,7 +42588,7 @@ } }, { - "accuracy": 0.9690807153237984, + "accuracy": 0.969106458243914, "total_bits": 150747392, "gate_proj": { "group_size": { @@ -42640,7 +42640,7 @@ } }, { - "accuracy": 0.9814384198980406, + "accuracy": 0.9814396995352581, "total_bits": 181874576, "gate_proj": { "group_size": { @@ -42692,7 +42692,7 @@ } }, { - "accuracy": 0.9843641832121648, + "accuracy": 0.9843679514015093, "total_bits": 184760576, "gate_proj": { "group_size": { @@ -42744,7 +42744,7 @@ } }, { - "accuracy": 0.989396913908422, + "accuracy": 0.9894372876733541, "total_bits": 210251664, "gate_proj": { "group_size": { @@ -42787,7 +42787,7 @@ } }, { - "accuracy": 0.9905827934853733, + "accuracy": 0.9905733634368517, "total_bits": 218451520, "gate_proj": { "group_size": { @@ -42836,7 +42836,7 @@ } }, { - "accuracy": 0.9920948224607855, + "accuracy": 0.9920839264523238, "total_bits": 237850176, "gate_proj": { "group_size": { @@ -42882,7 +42882,7 @@ } }, { - "accuracy": 0.9971556706441334, + "accuracy": 0.9971576091047609, "total_bits": 278220352, "gate_proj": { "group_size": {