diff --git "a/measurement.json" "b/measurement.json" --- "a/measurement.json" +++ "b/measurement.json" @@ -2,7 +2,7 @@ "measurement": { "model.layers.0.self_attn": [ { - "accuracy": 0.8838959559798241, + "accuracy": 0.8551338267953772, "total_bits": 89665536, "q_proj": { "group_size": { @@ -66,7 +66,7 @@ } }, { - "accuracy": 0.896147120547922, + "accuracy": 0.8733699164892498, "total_bits": 92221440, "q_proj": { "group_size": { @@ -130,7 +130,7 @@ } }, { - "accuracy": 0.9175817986067972, + "accuracy": 0.8909268571357978, "total_bits": 95758848, "q_proj": { "group_size": { @@ -194,7 +194,7 @@ } }, { - "accuracy": 0.9393696539888257, + "accuracy": 0.9217061457273207, "total_bits": 112272384, "q_proj": { "group_size": { @@ -258,7 +258,7 @@ } }, { - "accuracy": 0.9440036225867898, + "accuracy": 0.9276937558070609, "total_bits": 132913152, "q_proj": { "group_size": { @@ -322,7 +322,7 @@ } }, { - "accuracy": 0.9433559140092448, + "accuracy": 0.9277610974876505, "total_bits": 132980224, "q_proj": { "group_size": { @@ -386,7 +386,7 @@ } }, { - "accuracy": 0.9553854636063701, + "accuracy": 0.9431704225900926, "total_bits": 169613312, "q_proj": { "group_size": { @@ -438,7 +438,7 @@ } }, { - "accuracy": 0.9551399912881224, + "accuracy": 0.9436987848266175, "total_bits": 169745920, "q_proj": { "group_size": { @@ -490,7 +490,7 @@ } }, { - "accuracy": 0.9623956184246039, + "accuracy": 0.9541762590800461, "total_bits": 171195392, "q_proj": { "group_size": { @@ -542,7 +542,7 @@ } }, { - "accuracy": 0.9641238191214047, + "accuracy": 0.9562624773304713, "total_bits": 173563904, "q_proj": { "group_size": { @@ -594,7 +594,7 @@ } }, { - "accuracy": 0.9725993960899743, + "accuracy": 0.9643672986054107, "total_bits": 174923264, "q_proj": { "group_size": { @@ -658,7 +658,7 @@ } }, { - "accuracy": 0.9745138308131381, + "accuracy": 0.9676855945665586, "total_bits": 175750144, "q_proj": { "group_size": { @@ -722,7 +722,7 @@ } }, { - "accuracy": 0.9755942204869107, + "accuracy": 0.9683421806089187, "total_bits": 179253248, "q_proj": { "group_size": { @@ -783,7 +783,7 @@ } }, { - "accuracy": 0.9775272706817639, + "accuracy": 0.9718343669450596, "total_bits": 181592064, "q_proj": { "group_size": { @@ -844,7 +844,7 @@ } }, { - "accuracy": 0.9868796370237282, + "accuracy": 0.9825963614214408, "total_bits": 220469248, "q_proj": { "group_size": { @@ -905,7 +905,7 @@ } }, { - "accuracy": 0.9890970591161596, + "accuracy": 0.9858642875363952, "total_bits": 223535104, "q_proj": { "group_size": { @@ -966,7 +966,7 @@ } }, { - "accuracy": 0.9889701738414404, + "accuracy": 0.9853400478237554, "total_bits": 253499392, "q_proj": { "group_size": { @@ -1018,7 +1018,7 @@ } }, { - "accuracy": 0.9942832984226314, + "accuracy": 0.9922555782342035, "total_bits": 265838592, "q_proj": { "group_size": { @@ -1070,7 +1070,7 @@ } }, { - "accuracy": 0.9969293696830344, + "accuracy": 0.9958325235393682, "total_bits": 337385472, "q_proj": { "group_size": { @@ -1124,7 +1124,7 @@ ], "model.layers.0.mlp": [ { - "accuracy": 0.8157823964169151, + "accuracy": 0.8078629633313731, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -1176,7 +1176,7 @@ } }, { - "accuracy": 0.8214181253784582, + "accuracy": 0.8133499347849896, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -1228,7 +1228,7 @@ } }, { - "accuracy": 0.8489965176896045, + "accuracy": 0.844286215148474, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -1277,7 +1277,7 @@ } }, { - "accuracy": 0.8576634851725478, + "accuracy": 0.8541672006249428, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -1326,7 +1326,7 @@ } }, { - "accuracy": 0.9089305730242478, + "accuracy": 0.9041820619451373, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -1378,7 +1378,7 @@ } }, { - "accuracy": 0.9164342676338396, + "accuracy": 0.9119999181283147, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -1430,7 +1430,7 @@ } }, { - "accuracy": 0.9282353559606954, + "accuracy": 0.9253550120874455, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -1479,7 +1479,7 @@ } }, { - "accuracy": 0.9523349684712134, + "accuracy": 0.9497876184943476, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -1522,7 +1522,7 @@ } }, { - "accuracy": 0.9568782968348578, + "accuracy": 0.9546097371923297, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -1565,7 +1565,7 @@ } }, { - "accuracy": 0.9536851126896708, + "accuracy": 0.951205326342269, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -1617,7 +1617,7 @@ } }, { - "accuracy": 0.959543928798092, + "accuracy": 0.9573620824437392, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -1669,7 +1669,7 @@ } }, { - "accuracy": 0.9763227719813585, + "accuracy": 0.9750397348482358, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -1721,7 +1721,7 @@ } }, { - "accuracy": 0.9797908355923075, + "accuracy": 0.97869657185909, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -1773,7 +1773,7 @@ } }, { - "accuracy": 0.9870342655401481, + "accuracy": 0.9863262546101683, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -1816,7 +1816,7 @@ } }, { - "accuracy": 0.9879123883714017, + "accuracy": 0.987281944308626, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -1865,7 +1865,7 @@ } }, { - "accuracy": 0.9905281746514926, + "accuracy": 0.9902545911456017, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -1911,7 +1911,7 @@ } }, { - "accuracy": 0.9964610531950664, + "accuracy": 0.9962879017019939, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -1953,7 +1953,7 @@ ], "model.layers.1.self_attn": [ { - "accuracy": 0.873729416414311, + "accuracy": 0.8568857798450872, "total_bits": 89665536, "q_proj": { "group_size": { @@ -2017,7 +2017,7 @@ } }, { - "accuracy": 0.8840516735064357, + "accuracy": 0.8691579346594057, "total_bits": 92221440, "q_proj": { "group_size": { @@ -2081,7 +2081,7 @@ } }, { - "accuracy": 0.8936097402321665, + "accuracy": 0.881192290077084, "total_bits": 95758848, "q_proj": { "group_size": { @@ -2145,7 +2145,7 @@ } }, { - "accuracy": 0.9302691970216601, + "accuracy": 0.9243471567568026, "total_bits": 112272384, "q_proj": { "group_size": { @@ -2209,7 +2209,7 @@ } }, { - "accuracy": 0.9358116282444251, + "accuracy": 0.9284957635559534, "total_bits": 132913152, "q_proj": { "group_size": { @@ -2273,7 +2273,7 @@ } }, { - "accuracy": 0.9375250337547377, + "accuracy": 0.9295562272401232, "total_bits": 132980224, "q_proj": { "group_size": { @@ -2337,7 +2337,7 @@ } }, { - "accuracy": 0.9544171105678144, + "accuracy": 0.9507480451935216, "total_bits": 169613312, "q_proj": { "group_size": { @@ -2389,7 +2389,7 @@ } }, { - "accuracy": 0.9567160626971408, + "accuracy": 0.9527322036263189, "total_bits": 169745920, "q_proj": { "group_size": { @@ -2441,7 +2441,7 @@ } }, { - "accuracy": 0.9603348081245234, + "accuracy": 0.9564735854142591, "total_bits": 171195392, "q_proj": { "group_size": { @@ -2493,7 +2493,7 @@ } }, { - "accuracy": 0.9627624292318758, + "accuracy": 0.9589888078993872, "total_bits": 173563904, "q_proj": { "group_size": { @@ -2545,7 +2545,7 @@ } }, { - "accuracy": 0.9679131528460666, + "accuracy": 0.9638312317823109, "total_bits": 174923264, "q_proj": { "group_size": { @@ -2609,7 +2609,7 @@ } }, { - "accuracy": 0.9701808158700403, + "accuracy": 0.9661258317922291, "total_bits": 175750144, "q_proj": { "group_size": { @@ -2673,7 +2673,7 @@ } }, { - "accuracy": 0.971465162540737, + "accuracy": 0.9680543750720589, "total_bits": 179253248, "q_proj": { "group_size": { @@ -2734,7 +2734,7 @@ } }, { - "accuracy": 0.9741276444769219, + "accuracy": 0.9706894384795114, "total_bits": 181592064, "q_proj": { "group_size": { @@ -2795,7 +2795,7 @@ } }, { - "accuracy": 0.9831139367858046, + "accuracy": 0.9818780322216059, "total_bits": 220469248, "q_proj": { "group_size": { @@ -2856,7 +2856,7 @@ } }, { - "accuracy": 0.9865419897986086, + "accuracy": 0.9849732829944083, "total_bits": 223535104, "q_proj": { "group_size": { @@ -2917,7 +2917,7 @@ } }, { - "accuracy": 0.9867124832480362, + "accuracy": 0.9864370079318944, "total_bits": 253499392, "q_proj": { "group_size": { @@ -2969,7 +2969,7 @@ } }, { - "accuracy": 0.9925015786613681, + "accuracy": 0.991542876305941, "total_bits": 265838592, "q_proj": { "group_size": { @@ -3021,7 +3021,7 @@ } }, { - "accuracy": 0.9963161236189894, + "accuracy": 0.9963689157371655, "total_bits": 337385472, "q_proj": { "group_size": { @@ -3075,7 +3075,7 @@ ], "model.layers.1.mlp": [ { - "accuracy": 0.9052229947165439, + "accuracy": 0.8859159040607905, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -3127,7 +3127,7 @@ } }, { - "accuracy": 0.9411061168893388, + "accuracy": 0.9340497320027727, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -3179,7 +3179,7 @@ } }, { - "accuracy": 0.9422329687758496, + "accuracy": 0.934241257215801, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -3228,7 +3228,7 @@ } }, { - "accuracy": 0.9429085944828234, + "accuracy": 0.9349827199782196, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -3277,7 +3277,7 @@ } }, { - "accuracy": 0.9799367725162914, + "accuracy": 0.9792390784346744, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -3329,7 +3329,7 @@ } }, { - "accuracy": 0.9854210519574975, + "accuracy": 0.9845926615556604, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -3381,7 +3381,7 @@ } }, { - "accuracy": 0.9875190489386257, + "accuracy": 0.9869137745056498, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -3430,7 +3430,7 @@ } }, { - "accuracy": 0.9916378201083526, + "accuracy": 0.9912057959131504, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -3473,7 +3473,7 @@ } }, { - "accuracy": 0.9925511500209963, + "accuracy": 0.9923221149579867, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -3516,7 +3516,7 @@ } }, { - "accuracy": 0.9922057429916764, + "accuracy": 0.9915538006707242, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -3568,7 +3568,7 @@ } }, { - "accuracy": 0.9925746305747644, + "accuracy": 0.9928785573053909, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -3620,7 +3620,7 @@ } }, { - "accuracy": 0.9960009308262286, + "accuracy": 0.9958921397766588, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -3672,7 +3672,7 @@ } }, { - "accuracy": 0.9962143495948496, + "accuracy": 0.9962745776743089, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -3724,7 +3724,7 @@ } }, { - "accuracy": 0.9976411774068287, + "accuracy": 0.9975251450423935, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -3767,7 +3767,7 @@ } }, { - "accuracy": 0.9979003679044055, + "accuracy": 0.9977877197456301, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -3816,7 +3816,7 @@ } }, { - "accuracy": 0.9983435699740719, + "accuracy": 0.9982760117303482, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -3862,7 +3862,7 @@ } }, { - "accuracy": 0.9989042300485859, + "accuracy": 0.9989709607723757, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -3904,7 +3904,7 @@ ], "model.layers.2.self_attn": [ { - "accuracy": 0.9778485428541899, + "accuracy": 0.9784636181828222, "total_bits": 89665536, "q_proj": { "group_size": { @@ -3968,7 +3968,7 @@ } }, { - "accuracy": 0.978873814113046, + "accuracy": 0.979402962091722, "total_bits": 92221440, "q_proj": { "group_size": { @@ -4032,7 +4032,7 @@ } }, { - "accuracy": 0.9806304232364422, + "accuracy": 0.9818074703216553, "total_bits": 95758848, "q_proj": { "group_size": { @@ -4096,7 +4096,7 @@ } }, { - "accuracy": 0.9834804827543465, + "accuracy": 0.9841136410342235, "total_bits": 112272384, "q_proj": { "group_size": { @@ -4160,7 +4160,7 @@ } }, { - "accuracy": 0.9881575262468112, + "accuracy": 0.987477179028486, "total_bits": 132913152, "q_proj": { "group_size": { @@ -4224,7 +4224,7 @@ } }, { - "accuracy": 0.9876864149088138, + "accuracy": 0.9875245276152304, "total_bits": 132980224, "q_proj": { "group_size": { @@ -4288,7 +4288,7 @@ } }, { - "accuracy": 0.9920548180755424, + "accuracy": 0.9910468665000639, "total_bits": 169613312, "q_proj": { "group_size": { @@ -4340,7 +4340,7 @@ } }, { - "accuracy": 0.9921387106327242, + "accuracy": 0.9921955850808636, "total_bits": 169745920, "q_proj": { "group_size": { @@ -4392,7 +4392,7 @@ } }, { - "accuracy": 0.9926909372014435, + "accuracy": 0.991913566561906, "total_bits": 171195392, "q_proj": { "group_size": { @@ -4444,7 +4444,7 @@ } }, { - "accuracy": 0.9929471172294334, + "accuracy": 0.992210047196989, "total_bits": 173563904, "q_proj": { "group_size": { @@ -4496,7 +4496,7 @@ } }, { - "accuracy": 0.9929930443238271, + "accuracy": 0.992774043158677, "total_bits": 174923264, "q_proj": { "group_size": { @@ -4560,7 +4560,7 @@ } }, { - "accuracy": 0.9933495364200912, + "accuracy": 0.9924662259015206, "total_bits": 175750144, "q_proj": { "group_size": { @@ -4624,7 +4624,7 @@ } }, { - "accuracy": 0.9948340031857553, + "accuracy": 0.9946202190936004, "total_bits": 179253248, "q_proj": { "group_size": { @@ -4685,7 +4685,7 @@ } }, { - "accuracy": 0.9951991248434704, + "accuracy": 0.9949076533513633, "total_bits": 181592064, "q_proj": { "group_size": { @@ -4746,7 +4746,7 @@ } }, { - "accuracy": 0.9971235895798983, + "accuracy": 0.9970136258113933, "total_bits": 220469248, "q_proj": { "group_size": { @@ -4807,7 +4807,7 @@ } }, { - "accuracy": 0.9974903866133996, + "accuracy": 0.9975276898568202, "total_bits": 223535104, "q_proj": { "group_size": { @@ -4868,7 +4868,7 @@ } }, { - "accuracy": 0.9977074651611283, + "accuracy": 0.997475139808988, "total_bits": 253499392, "q_proj": { "group_size": { @@ -4920,7 +4920,7 @@ } }, { - "accuracy": 0.9988952218309829, + "accuracy": 0.9989368900240055, "total_bits": 265838592, "q_proj": { "group_size": { @@ -4972,7 +4972,7 @@ } }, { - "accuracy": 0.9993557605132657, + "accuracy": 0.9993269720580429, "total_bits": 337385472, "q_proj": { "group_size": { @@ -5026,7 +5026,7 @@ ], "model.layers.2.mlp": [ { - "accuracy": 0.963683731657894, + "accuracy": 0.9605733213063917, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -5078,7 +5078,7 @@ } }, { - "accuracy": 0.9647432022580975, + "accuracy": 0.9617722071707249, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -5130,7 +5130,7 @@ } }, { - "accuracy": 0.969874828367641, + "accuracy": 0.9672769135550449, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -5179,7 +5179,7 @@ } }, { - "accuracy": 0.9714735899316637, + "accuracy": 0.9689953029155731, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -5228,7 +5228,7 @@ } }, { - "accuracy": 0.9816295561429701, + "accuracy": 0.9800168797863942, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -5280,7 +5280,7 @@ } }, { - "accuracy": 0.9830398863965744, + "accuracy": 0.9815624053344915, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -5332,7 +5332,7 @@ } }, { - "accuracy": 0.9852980317940053, + "accuracy": 0.9840028328134826, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -5381,7 +5381,7 @@ } }, { - "accuracy": 0.9904022783678221, + "accuracy": 0.9895428748017079, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -5424,7 +5424,7 @@ } }, { - "accuracy": 0.9912414738271189, + "accuracy": 0.990459648916792, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -5467,7 +5467,7 @@ } }, { - "accuracy": 0.9906415854531684, + "accuracy": 0.9898142145799571, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -5519,7 +5519,7 @@ } }, { - "accuracy": 0.9917709064228755, + "accuracy": 0.9910451381614334, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -5571,7 +5571,7 @@ } }, { - "accuracy": 0.9952364674352697, + "accuracy": 0.9948111472553328, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -5623,7 +5623,7 @@ } }, { - "accuracy": 0.995897007530163, + "accuracy": 0.9955334415487749, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -5675,7 +5675,7 @@ } }, { - "accuracy": 0.9974010585880789, + "accuracy": 0.9971662092292192, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -5718,7 +5718,7 @@ } }, { - "accuracy": 0.9975764343613073, + "accuracy": 0.9973614702344333, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -5767,7 +5767,7 @@ } }, { - "accuracy": 0.9980377088374409, + "accuracy": 0.9978592684063571, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -5813,7 +5813,7 @@ } }, { - "accuracy": 0.999301058099311, + "accuracy": 0.9992317291754788, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -5855,7 +5855,7 @@ ], "model.layers.3.self_attn": [ { - "accuracy": 0.949321816626348, + "accuracy": 0.945514768950249, "total_bits": 89665536, "q_proj": { "group_size": { @@ -5919,7 +5919,7 @@ } }, { - "accuracy": 0.9523889604759843, + "accuracy": 0.9495002888143063, "total_bits": 92221440, "q_proj": { "group_size": { @@ -5983,7 +5983,7 @@ } }, { - "accuracy": 0.9586663481436277, + "accuracy": 0.9598797216619316, "total_bits": 95758848, "q_proj": { "group_size": { @@ -6047,7 +6047,7 @@ } }, { - "accuracy": 0.9620552257095513, + "accuracy": 0.9629466613068393, "total_bits": 112272384, "q_proj": { "group_size": { @@ -6111,7 +6111,7 @@ } }, { - "accuracy": 0.9763696851502908, + "accuracy": 0.9747597301672948, "total_bits": 132913152, "q_proj": { "group_size": { @@ -6175,7 +6175,7 @@ } }, { - "accuracy": 0.9764881043841964, + "accuracy": 0.9751808379629725, "total_bits": 132980224, "q_proj": { "group_size": { @@ -6239,7 +6239,7 @@ } }, { - "accuracy": 0.9871843974351099, + "accuracy": 0.986498030637832, "total_bits": 169613312, "q_proj": { "group_size": { @@ -6291,7 +6291,7 @@ } }, { - "accuracy": 0.9883011298646268, + "accuracy": 0.9875455365859365, "total_bits": 169745920, "q_proj": { "group_size": { @@ -6343,7 +6343,7 @@ } }, { - "accuracy": 0.989135164375368, + "accuracy": 0.9886499606072903, "total_bits": 171195392, "q_proj": { "group_size": { @@ -6395,7 +6395,7 @@ } }, { - "accuracy": 0.9893392246510637, + "accuracy": 0.9888809921317979, "total_bits": 173563904, "q_proj": { "group_size": { @@ -6447,7 +6447,7 @@ } }, { - "accuracy": 0.9888136354520133, + "accuracy": 0.9875724345053497, "total_bits": 174923264, "q_proj": { "group_size": { @@ -6511,7 +6511,7 @@ } }, { - "accuracy": 0.9898777146774688, + "accuracy": 0.9888290691826689, "total_bits": 175750144, "q_proj": { "group_size": { @@ -6575,7 +6575,7 @@ } }, { - "accuracy": 0.9924751180714291, + "accuracy": 0.992328321046539, "total_bits": 179253248, "q_proj": { "group_size": { @@ -6636,7 +6636,7 @@ } }, { - "accuracy": 0.9930084294786579, + "accuracy": 0.9929471696775994, "total_bits": 181592064, "q_proj": { "group_size": { @@ -6697,7 +6697,7 @@ } }, { - "accuracy": 0.9958171848771408, + "accuracy": 0.9957813784529111, "total_bits": 220469248, "q_proj": { "group_size": { @@ -6758,7 +6758,7 @@ } }, { - "accuracy": 0.9965589083853716, + "accuracy": 0.9964809180727523, "total_bits": 223535104, "q_proj": { "group_size": { @@ -6819,7 +6819,7 @@ } }, { - "accuracy": 0.996675236579521, + "accuracy": 0.9963845002930611, "total_bits": 253499392, "q_proj": { "group_size": { @@ -6871,7 +6871,7 @@ } }, { - "accuracy": 0.9985293466413981, + "accuracy": 0.9985229569658833, "total_bits": 265838592, "q_proj": { "group_size": { @@ -6923,7 +6923,7 @@ } }, { - "accuracy": 0.9991085240464216, + "accuracy": 0.9990528322707274, "total_bits": 337385472, "q_proj": { "group_size": { @@ -6977,7 +6977,7 @@ ], "model.layers.3.mlp": [ { - "accuracy": 0.9504249517462755, + "accuracy": 0.9465131538086816, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -7029,7 +7029,7 @@ } }, { - "accuracy": 0.9518397824936792, + "accuracy": 0.9480867315279811, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -7081,7 +7081,7 @@ } }, { - "accuracy": 0.9591200077220013, + "accuracy": 0.955652790046052, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -7130,7 +7130,7 @@ } }, { - "accuracy": 0.9613179435071192, + "accuracy": 0.9579513204333029, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -7179,7 +7179,7 @@ } }, { - "accuracy": 0.9748480219982172, + "accuracy": 0.9728319195932463, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -7231,7 +7231,7 @@ } }, { - "accuracy": 0.9768061021244839, + "accuracy": 0.9749433507064456, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -7283,7 +7283,7 @@ } }, { - "accuracy": 0.9799343796544954, + "accuracy": 0.9782121604014384, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -7332,7 +7332,7 @@ } }, { - "accuracy": 0.9869387187063694, + "accuracy": 0.9858414913576684, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -7375,7 +7375,7 @@ } }, { - "accuracy": 0.9880472763784622, + "accuracy": 0.9870498525468927, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -7418,7 +7418,7 @@ } }, { - "accuracy": 0.9871924571496876, + "accuracy": 0.986164881406646, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -7470,7 +7470,7 @@ } }, { - "accuracy": 0.9887480674997756, + "accuracy": 0.9878415154587281, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -7522,7 +7522,7 @@ } }, { - "accuracy": 0.9934847178427797, + "accuracy": 0.9929598860785758, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -7574,7 +7574,7 @@ } }, { - "accuracy": 0.9943949701754671, + "accuracy": 0.9939405463979041, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -7626,7 +7626,7 @@ } }, { - "accuracy": 0.9964648414966896, + "accuracy": 0.9961690912880984, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -7669,7 +7669,7 @@ } }, { - "accuracy": 0.9966820932581628, + "accuracy": 0.9964200250902459, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -7718,7 +7718,7 @@ } }, { - "accuracy": 0.9973165744695028, + "accuracy": 0.9970839632013323, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -7764,7 +7764,7 @@ } }, { - "accuracy": 0.9990641862356202, + "accuracy": 0.9989839393621016, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -7806,7 +7806,7 @@ ], "model.layers.4.self_attn": [ { - "accuracy": 0.9442645130973113, + "accuracy": 0.9397523248274076, "total_bits": 89665536, "q_proj": { "group_size": { @@ -7870,7 +7870,7 @@ } }, { - "accuracy": 0.947693897901397, + "accuracy": 0.9423347350798155, "total_bits": 92221440, "q_proj": { "group_size": { @@ -7934,7 +7934,7 @@ } }, { - "accuracy": 0.9557674564421177, + "accuracy": 0.9526160363303988, "total_bits": 95758848, "q_proj": { "group_size": { @@ -7998,7 +7998,7 @@ } }, { - "accuracy": 0.96068250015378, + "accuracy": 0.9578955967567468, "total_bits": 112272384, "q_proj": { "group_size": { @@ -8062,7 +8062,7 @@ } }, { - "accuracy": 0.9754620161103574, + "accuracy": 0.9698168594194087, "total_bits": 132913152, "q_proj": { "group_size": { @@ -8126,7 +8126,7 @@ } }, { - "accuracy": 0.9758979768345231, + "accuracy": 0.9712330932287794, "total_bits": 132980224, "q_proj": { "group_size": { @@ -8190,7 +8190,7 @@ } }, { - "accuracy": 0.9854180766269565, + "accuracy": 0.9841421904336465, "total_bits": 169613312, "q_proj": { "group_size": { @@ -8242,7 +8242,7 @@ } }, { - "accuracy": 0.9860718849752295, + "accuracy": 0.9839555725063148, "total_bits": 169745920, "q_proj": { "group_size": { @@ -8294,7 +8294,7 @@ } }, { - "accuracy": 0.9873312846022216, + "accuracy": 0.9852670263989192, "total_bits": 171195392, "q_proj": { "group_size": { @@ -8346,7 +8346,7 @@ } }, { - "accuracy": 0.9876361977014887, + "accuracy": 0.9859834677098613, "total_bits": 173563904, "q_proj": { "group_size": { @@ -8398,7 +8398,7 @@ } }, { - "accuracy": 0.9873475398084051, + "accuracy": 0.9856850100485118, "total_bits": 174923264, "q_proj": { "group_size": { @@ -8462,7 +8462,7 @@ } }, { - "accuracy": 0.9882597574768098, + "accuracy": 0.9870418010181502, "total_bits": 175750144, "q_proj": { "group_size": { @@ -8526,7 +8526,7 @@ } }, { - "accuracy": 0.990622558483952, + "accuracy": 0.9897374921037179, "total_bits": 179253248, "q_proj": { "group_size": { @@ -8587,7 +8587,7 @@ } }, { - "accuracy": 0.9916581241168866, + "accuracy": 0.9905317399748846, "total_bits": 181592064, "q_proj": { "group_size": { @@ -8648,7 +8648,7 @@ } }, { - "accuracy": 0.994972226136413, + "accuracy": 0.9944959184350936, "total_bits": 220469248, "q_proj": { "group_size": { @@ -8709,7 +8709,7 @@ } }, { - "accuracy": 0.9956853995957461, + "accuracy": 0.9951955334185377, "total_bits": 223535104, "q_proj": { "group_size": { @@ -8770,7 +8770,7 @@ } }, { - "accuracy": 0.9959400214475432, + "accuracy": 0.9955848034128154, "total_bits": 253499392, "q_proj": { "group_size": { @@ -8822,7 +8822,7 @@ } }, { - "accuracy": 0.9980314925656115, + "accuracy": 0.9978667292805192, "total_bits": 265838592, "q_proj": { "group_size": { @@ -8874,7 +8874,7 @@ } }, { - "accuracy": 0.998916647737037, + "accuracy": 0.998791545660137, "total_bits": 337385472, "q_proj": { "group_size": { @@ -8928,7 +8928,7 @@ ], "model.layers.4.mlp": [ { - "accuracy": 0.9375299619216668, + "accuracy": 0.9341896542985189, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -8980,7 +8980,7 @@ } }, { - "accuracy": 0.9394980553341539, + "accuracy": 0.9362509362399578, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -9032,7 +9032,7 @@ } }, { - "accuracy": 0.9494428656211025, + "accuracy": 0.946533562125344, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -9081,7 +9081,7 @@ } }, { - "accuracy": 0.9522974602878094, + "accuracy": 0.9495758124087986, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -9130,7 +9130,7 @@ } }, { - "accuracy": 0.9686641776444096, + "accuracy": 0.9668482229309647, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -9182,7 +9182,7 @@ } }, { - "accuracy": 0.9711432516770927, + "accuracy": 0.9694663428358341, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -9234,7 +9234,7 @@ } }, { - "accuracy": 0.9752039851522759, + "accuracy": 0.9737474844840012, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -9283,7 +9283,7 @@ } }, { - "accuracy": 0.9837143177068547, + "accuracy": 0.9826763792845764, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -9326,7 +9326,7 @@ } }, { - "accuracy": 0.9850748951889967, + "accuracy": 0.9841496786592823, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -9369,7 +9369,7 @@ } }, { - "accuracy": 0.9840410123824289, + "accuracy": 0.9831150794695867, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -9421,7 +9421,7 @@ } }, { - "accuracy": 0.9859999646677783, + "accuracy": 0.985180498345902, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -9473,7 +9473,7 @@ } }, { - "accuracy": 0.9918716525609949, + "accuracy": 0.9913982396553221, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -9525,7 +9525,7 @@ } }, { - "accuracy": 0.9930249779534183, + "accuracy": 0.9926125704506902, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -9577,7 +9577,7 @@ } }, { - "accuracy": 0.995568137309563, + "accuracy": 0.9952827439349341, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -9620,7 +9620,7 @@ } }, { - "accuracy": 0.995866280772086, + "accuracy": 0.9956222809483543, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -9669,7 +9669,7 @@ } }, { - "accuracy": 0.9967203077271973, + "accuracy": 0.996517781499087, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -9715,7 +9715,7 @@ } }, { - "accuracy": 0.9988276754769398, + "accuracy": 0.9987409716521046, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -9757,7 +9757,7 @@ ], "model.layers.5.self_attn": [ { - "accuracy": 0.9478426473705392, + "accuracy": 0.9412755552483232, "total_bits": 89665536, "q_proj": { "group_size": { @@ -9821,7 +9821,7 @@ } }, { - "accuracy": 0.9477628679259827, + "accuracy": 0.9447065431036448, "total_bits": 92221440, "q_proj": { "group_size": { @@ -9885,7 +9885,7 @@ } }, { - "accuracy": 0.9560026687226797, + "accuracy": 0.9526618415195691, "total_bits": 95758848, "q_proj": { "group_size": { @@ -9949,7 +9949,7 @@ } }, { - "accuracy": 0.9609302935239515, + "accuracy": 0.9585961715171212, "total_bits": 112272384, "q_proj": { "group_size": { @@ -10013,7 +10013,7 @@ } }, { - "accuracy": 0.9732114939313186, + "accuracy": 0.9718421852510226, "total_bits": 132913152, "q_proj": { "group_size": { @@ -10077,7 +10077,7 @@ } }, { - "accuracy": 0.9731872834657368, + "accuracy": 0.9730496496746415, "total_bits": 132980224, "q_proj": { "group_size": { @@ -10141,7 +10141,7 @@ } }, { - "accuracy": 0.9857967468958936, + "accuracy": 0.9849364037968611, "total_bits": 169613312, "q_proj": { "group_size": { @@ -10193,7 +10193,7 @@ } }, { - "accuracy": 0.9860525785602237, + "accuracy": 0.9850907399760265, "total_bits": 169745920, "q_proj": { "group_size": { @@ -10245,7 +10245,7 @@ } }, { - "accuracy": 0.9872025809691924, + "accuracy": 0.9860523644540655, "total_bits": 171195392, "q_proj": { "group_size": { @@ -10297,7 +10297,7 @@ } }, { - "accuracy": 0.9878684500918576, + "accuracy": 0.9869589876677645, "total_bits": 173563904, "q_proj": { "group_size": { @@ -10349,7 +10349,7 @@ } }, { - "accuracy": 0.9872042004411158, + "accuracy": 0.9860099015855476, "total_bits": 174923264, "q_proj": { "group_size": { @@ -10413,7 +10413,7 @@ } }, { - "accuracy": 0.988138643436526, + "accuracy": 0.9872240720708904, "total_bits": 175750144, "q_proj": { "group_size": { @@ -10477,7 +10477,7 @@ } }, { - "accuracy": 0.9904673427931572, + "accuracy": 0.989546793709068, "total_bits": 179253248, "q_proj": { "group_size": { @@ -10538,7 +10538,7 @@ } }, { - "accuracy": 0.991657407341623, + "accuracy": 0.9907753007780564, "total_bits": 181592064, "q_proj": { "group_size": { @@ -10599,7 +10599,7 @@ } }, { - "accuracy": 0.9950607832717268, + "accuracy": 0.9945431699682223, "total_bits": 220469248, "q_proj": { "group_size": { @@ -10660,7 +10660,7 @@ } }, { - "accuracy": 0.9958379331387972, + "accuracy": 0.9953609075348236, "total_bits": 223535104, "q_proj": { "group_size": { @@ -10721,7 +10721,7 @@ } }, { - "accuracy": 0.9961820691088704, + "accuracy": 0.9959546408101329, "total_bits": 253499392, "q_proj": { "group_size": { @@ -10773,7 +10773,7 @@ } }, { - "accuracy": 0.997976019868235, + "accuracy": 0.9976584949457136, "total_bits": 265838592, "q_proj": { "group_size": { @@ -10825,7 +10825,7 @@ } }, { - "accuracy": 0.9990085205675936, + "accuracy": 0.9989140179731246, "total_bits": 337385472, "q_proj": { "group_size": { @@ -10879,7 +10879,7 @@ ], "model.layers.5.mlp": [ { - "accuracy": 0.9264793931261489, + "accuracy": 0.9215240878494162, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -10931,7 +10931,7 @@ } }, { - "accuracy": 0.9288466717851789, + "accuracy": 0.9240283817052841, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -10983,7 +10983,7 @@ } }, { - "accuracy": 0.9403523685116517, + "accuracy": 0.9363689455938966, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -11032,7 +11032,7 @@ } }, { - "accuracy": 0.9436239251180699, + "accuracy": 0.9399521829266297, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -11081,7 +11081,7 @@ } }, { - "accuracy": 0.9631616506529481, + "accuracy": 0.9605779392938865, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -11133,7 +11133,7 @@ } }, { - "accuracy": 0.9660527241465292, + "accuracy": 0.9636814887390325, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -11185,7 +11185,7 @@ } }, { - "accuracy": 0.9707509006716704, + "accuracy": 0.96879299024218, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -11234,7 +11234,7 @@ } }, { - "accuracy": 0.9808605029982956, + "accuracy": 0.9794552991852948, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -11277,7 +11277,7 @@ } }, { - "accuracy": 0.9824351825212178, + "accuracy": 0.981168132079275, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -11320,7 +11320,7 @@ } }, { - "accuracy": 0.9812328574786845, + "accuracy": 0.97992213972305, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -11372,7 +11372,7 @@ } }, { - "accuracy": 0.9835323596765336, + "accuracy": 0.9823739239455838, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -11424,7 +11424,7 @@ } }, { - "accuracy": 0.9904467083856856, + "accuracy": 0.989777511132783, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -11476,7 +11476,7 @@ } }, { - "accuracy": 0.9917935944456411, + "accuracy": 0.9912125934405547, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -11528,7 +11528,7 @@ } }, { - "accuracy": 0.9947831295185575, + "accuracy": 0.9944078904135447, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -11571,7 +11571,7 @@ } }, { - "accuracy": 0.9951379354307918, + "accuracy": 0.9947981049894894, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -11620,7 +11620,7 @@ } }, { - "accuracy": 0.9961133202243793, + "accuracy": 0.9958619757457391, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -11666,7 +11666,7 @@ } }, { - "accuracy": 0.9986082243573803, + "accuracy": 0.9985021076557276, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -11708,7 +11708,7 @@ ], "model.layers.6.self_attn": [ { - "accuracy": 0.9426956278713126, + "accuracy": 0.939269758956997, "total_bits": 89665536, "q_proj": { "group_size": { @@ -11772,7 +11772,7 @@ } }, { - "accuracy": 0.9467800592905596, + "accuracy": 0.9410147437531697, "total_bits": 92221440, "q_proj": { "group_size": { @@ -11836,7 +11836,7 @@ } }, { - "accuracy": 0.9561439956489363, + "accuracy": 0.9508871602776804, "total_bits": 95758848, "q_proj": { "group_size": { @@ -11900,7 +11900,7 @@ } }, { - "accuracy": 0.9645767875603939, + "accuracy": 0.9604994780138919, "total_bits": 112272384, "q_proj": { "group_size": { @@ -11964,7 +11964,7 @@ } }, { - "accuracy": 0.9722918794539414, + "accuracy": 0.9703341028408, "total_bits": 132913152, "q_proj": { "group_size": { @@ -12028,7 +12028,7 @@ } }, { - "accuracy": 0.9732542194818196, + "accuracy": 0.9708823141102728, "total_bits": 132980224, "q_proj": { "group_size": { @@ -12092,7 +12092,7 @@ } }, { - "accuracy": 0.9851027573703935, + "accuracy": 0.9834798977857357, "total_bits": 169613312, "q_proj": { "group_size": { @@ -12144,7 +12144,7 @@ } }, { - "accuracy": 0.9851342911684984, + "accuracy": 0.9843510202083149, "total_bits": 169745920, "q_proj": { "group_size": { @@ -12196,7 +12196,7 @@ } }, { - "accuracy": 0.9866078067080755, + "accuracy": 0.9854518298647905, "total_bits": 171195392, "q_proj": { "group_size": { @@ -12248,7 +12248,7 @@ } }, { - "accuracy": 0.9871764593806706, + "accuracy": 0.9861718885306465, "total_bits": 173563904, "q_proj": { "group_size": { @@ -12300,7 +12300,7 @@ } }, { - "accuracy": 0.9859767018474246, + "accuracy": 0.9852286001765415, "total_bits": 174923264, "q_proj": { "group_size": { @@ -12364,7 +12364,7 @@ } }, { - "accuracy": 0.9870459780979314, + "accuracy": 0.9860753640042323, "total_bits": 175750144, "q_proj": { "group_size": { @@ -12428,7 +12428,7 @@ } }, { - "accuracy": 0.9894579400945651, + "accuracy": 0.9885002706984156, "total_bits": 179253248, "q_proj": { "group_size": { @@ -12489,7 +12489,7 @@ } }, { - "accuracy": 0.9905543601091363, + "accuracy": 0.9894275164819861, "total_bits": 181592064, "q_proj": { "group_size": { @@ -12550,7 +12550,7 @@ } }, { - "accuracy": 0.994442265039604, + "accuracy": 0.993872737487484, "total_bits": 220469248, "q_proj": { "group_size": { @@ -12611,7 +12611,7 @@ } }, { - "accuracy": 0.9952558595932236, + "accuracy": 0.9948142126055532, "total_bits": 223535104, "q_proj": { "group_size": { @@ -12672,7 +12672,7 @@ } }, { - "accuracy": 0.9960484887522302, + "accuracy": 0.9957414959483829, "total_bits": 253499392, "q_proj": { "group_size": { @@ -12724,7 +12724,7 @@ } }, { - "accuracy": 0.9976551770110076, + "accuracy": 0.9974020329291785, "total_bits": 265838592, "q_proj": { "group_size": { @@ -12776,7 +12776,7 @@ } }, { - "accuracy": 0.9989677787403037, + "accuracy": 0.9988838529404204, "total_bits": 337385472, "q_proj": { "group_size": { @@ -12830,7 +12830,7 @@ ], "model.layers.6.mlp": [ { - "accuracy": 0.9187966230276384, + "accuracy": 0.9143470423786264, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -12882,7 +12882,7 @@ } }, { - "accuracy": 0.9212499721661994, + "accuracy": 0.9169298984894627, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -12934,7 +12934,7 @@ } }, { - "accuracy": 0.934231987321063, + "accuracy": 0.9307079168134614, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -12983,7 +12983,7 @@ } }, { - "accuracy": 0.9379115506614509, + "accuracy": 0.9346397350493231, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -13032,7 +13032,7 @@ } }, { - "accuracy": 0.959186074765105, + "accuracy": 0.95692395360062, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -13084,7 +13084,7 @@ } }, { - "accuracy": 0.9623984370968843, + "accuracy": 0.960309278808142, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -13136,7 +13136,7 @@ } }, { - "accuracy": 0.9677002445647591, + "accuracy": 0.9659540031693483, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -13185,7 +13185,7 @@ } }, { - "accuracy": 0.978826585127727, + "accuracy": 0.977623405523206, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -13228,7 +13228,7 @@ } }, { - "accuracy": 0.980553730243915, + "accuracy": 0.9794559329748154, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -13271,7 +13271,7 @@ } }, { - "accuracy": 0.9791661083306137, + "accuracy": 0.9780155413440967, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -13323,7 +13323,7 @@ } }, { - "accuracy": 0.981709912958506, + "accuracy": 0.9806954817552316, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -13375,7 +13375,7 @@ } }, { - "accuracy": 0.9893726436911445, + "accuracy": 0.9887898729525899, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -13427,7 +13427,7 @@ } }, { - "accuracy": 0.9908787846124094, + "accuracy": 0.9903690686057273, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -13479,7 +13479,7 @@ } }, { - "accuracy": 0.994223457467007, + "accuracy": 0.9939004592107314, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -13522,7 +13522,7 @@ } }, { - "accuracy": 0.9945841832821699, + "accuracy": 0.994289485419071, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -13571,7 +13571,7 @@ } }, { - "accuracy": 0.9957072965212559, + "accuracy": 0.9954848532368871, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -13617,7 +13617,7 @@ } }, { - "accuracy": 0.9984760147850275, + "accuracy": 0.9983886381684753, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -13659,7 +13659,7 @@ ], "model.layers.7.self_attn": [ { - "accuracy": 0.9367876839088767, + "accuracy": 0.9334858781413028, "total_bits": 89665536, "q_proj": { "group_size": { @@ -13723,7 +13723,7 @@ } }, { - "accuracy": 0.9395746192649791, + "accuracy": 0.9355627480698259, "total_bits": 92221440, "q_proj": { "group_size": { @@ -13787,7 +13787,7 @@ } }, { - "accuracy": 0.9492401402247579, + "accuracy": 0.9447977629147077, "total_bits": 95758848, "q_proj": { "group_size": { @@ -13851,7 +13851,7 @@ } }, { - "accuracy": 0.9600960441717976, + "accuracy": 0.9563836555339789, "total_bits": 112272384, "q_proj": { "group_size": { @@ -13915,7 +13915,7 @@ } }, { - "accuracy": 0.9689697388951716, + "accuracy": 0.9667966822652441, "total_bits": 132913152, "q_proj": { "group_size": { @@ -13979,7 +13979,7 @@ } }, { - "accuracy": 0.9693979847391969, + "accuracy": 0.9674794872928607, "total_bits": 132980224, "q_proj": { "group_size": { @@ -14043,7 +14043,7 @@ } }, { - "accuracy": 0.9828039001869527, + "accuracy": 0.981636960843676, "total_bits": 169613312, "q_proj": { "group_size": { @@ -14095,7 +14095,7 @@ } }, { - "accuracy": 0.9834778770118168, + "accuracy": 0.9818388979489866, "total_bits": 169745920, "q_proj": { "group_size": { @@ -14147,7 +14147,7 @@ } }, { - "accuracy": 0.9843875017311228, + "accuracy": 0.9835617234440226, "total_bits": 171195392, "q_proj": { "group_size": { @@ -14199,7 +14199,7 @@ } }, { - "accuracy": 0.9851596544153596, + "accuracy": 0.984449803927227, "total_bits": 173563904, "q_proj": { "group_size": { @@ -14251,7 +14251,7 @@ } }, { - "accuracy": 0.984584570617268, + "accuracy": 0.9832110116748434, "total_bits": 174923264, "q_proj": { "group_size": { @@ -14315,7 +14315,7 @@ } }, { - "accuracy": 0.985552386478766, + "accuracy": 0.9847622281920753, "total_bits": 175750144, "q_proj": { "group_size": { @@ -14379,7 +14379,7 @@ } }, { - "accuracy": 0.9876001916433635, + "accuracy": 0.9868362697429562, "total_bits": 179253248, "q_proj": { "group_size": { @@ -14440,7 +14440,7 @@ } }, { - "accuracy": 0.988760414729385, + "accuracy": 0.9878616500155706, "total_bits": 181592064, "q_proj": { "group_size": { @@ -14501,7 +14501,7 @@ } }, { - "accuracy": 0.993323949802863, + "accuracy": 0.9928730591445377, "total_bits": 220469248, "q_proj": { "group_size": { @@ -14562,7 +14562,7 @@ } }, { - "accuracy": 0.9943080702796578, + "accuracy": 0.9939244512811696, "total_bits": 223535104, "q_proj": { "group_size": { @@ -14623,7 +14623,7 @@ } }, { - "accuracy": 0.9955731232552544, + "accuracy": 0.9953156891156381, "total_bits": 253499392, "q_proj": { "group_size": { @@ -14675,7 +14675,7 @@ } }, { - "accuracy": 0.9970722506067863, + "accuracy": 0.9968795916678286, "total_bits": 265838592, "q_proj": { "group_size": { @@ -14727,7 +14727,7 @@ } }, { - "accuracy": 0.9988120670865388, + "accuracy": 0.9987448153980566, "total_bits": 337385472, "q_proj": { "group_size": { @@ -14781,7 +14781,7 @@ ], "model.layers.7.mlp": [ { - "accuracy": 0.9131226184728899, + "accuracy": 0.910364681952878, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -14833,7 +14833,7 @@ } }, { - "accuracy": 0.9156442043420515, + "accuracy": 0.9130439742615348, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -14885,7 +14885,7 @@ } }, { - "accuracy": 0.9299352000418463, + "accuracy": 0.927672556160312, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -14934,7 +14934,7 @@ } }, { - "accuracy": 0.9339723606642923, + "accuracy": 0.9318286582435432, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -14983,7 +14983,7 @@ } }, { - "accuracy": 0.9561350736767054, + "accuracy": 0.9547163499029059, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -15035,7 +15035,7 @@ } }, { - "accuracy": 0.9597003249157416, + "accuracy": 0.9584245108264058, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -15087,7 +15087,7 @@ } }, { - "accuracy": 0.9655053725368098, + "accuracy": 0.9643782377243042, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -15136,7 +15136,7 @@ } }, { - "accuracy": 0.9772174473067647, + "accuracy": 0.9764540369965529, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -15179,7 +15179,7 @@ } }, { - "accuracy": 0.9791567553520987, + "accuracy": 0.9784491668994489, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -15222,7 +15222,7 @@ } }, { - "accuracy": 0.9775949697941542, + "accuracy": 0.9768619110905811, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -15274,7 +15274,7 @@ } }, { - "accuracy": 0.9803560542825022, + "accuracy": 0.9797288301940027, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -15326,7 +15326,7 @@ } }, { - "accuracy": 0.988556227744802, + "accuracy": 0.9881840256091795, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -15378,7 +15378,7 @@ } }, { - "accuracy": 0.990187862005673, + "accuracy": 0.989874165260086, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -15430,7 +15430,7 @@ } }, { - "accuracy": 0.9937816925689971, + "accuracy": 0.9935673973277995, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -15473,7 +15473,7 @@ } }, { - "accuracy": 0.9941651814519182, + "accuracy": 0.993975379283687, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -15522,7 +15522,7 @@ } }, { - "accuracy": 0.995445772625604, + "accuracy": 0.9952983743829751, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -15568,7 +15568,7 @@ } }, { - "accuracy": 0.9983620519112599, + "accuracy": 0.9982971500813667, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -15610,7 +15610,7 @@ ], "model.layers.8.self_attn": [ { - "accuracy": 0.9307058775111249, + "accuracy": 0.9276927342932475, "total_bits": 89665536, "q_proj": { "group_size": { @@ -15674,7 +15674,7 @@ } }, { - "accuracy": 0.93483770854379, + "accuracy": 0.9292974299506137, "total_bits": 92221440, "q_proj": { "group_size": { @@ -15738,7 +15738,7 @@ } }, { - "accuracy": 0.9437413127406648, + "accuracy": 0.9396416805684566, "total_bits": 95758848, "q_proj": { "group_size": { @@ -15802,7 +15802,7 @@ } }, { - "accuracy": 0.9557121358811855, + "accuracy": 0.9526345129860074, "total_bits": 112272384, "q_proj": { "group_size": { @@ -15866,7 +15866,7 @@ } }, { - "accuracy": 0.9655123960814977, + "accuracy": 0.9621112007451684, "total_bits": 132913152, "q_proj": { "group_size": { @@ -15930,7 +15930,7 @@ } }, { - "accuracy": 0.9662100747227669, + "accuracy": 0.9630721219276127, "total_bits": 132980224, "q_proj": { "group_size": { @@ -15994,7 +15994,7 @@ } }, { - "accuracy": 0.9812625166714976, + "accuracy": 0.9794316591792985, "total_bits": 169613312, "q_proj": { "group_size": { @@ -16046,7 +16046,7 @@ } }, { - "accuracy": 0.9816401607700085, + "accuracy": 0.9800019029920038, "total_bits": 169745920, "q_proj": { "group_size": { @@ -16098,7 +16098,7 @@ } }, { - "accuracy": 0.9828299809443323, + "accuracy": 0.9815118122159651, "total_bits": 171195392, "q_proj": { "group_size": { @@ -16150,7 +16150,7 @@ } }, { - "accuracy": 0.9838107355723256, + "accuracy": 0.9824583628459981, "total_bits": 173563904, "q_proj": { "group_size": { @@ -16202,7 +16202,7 @@ } }, { - "accuracy": 0.982891378041945, + "accuracy": 0.9811670321873144, "total_bits": 174923264, "q_proj": { "group_size": { @@ -16266,7 +16266,7 @@ } }, { - "accuracy": 0.9841919016387117, + "accuracy": 0.9825930311099479, "total_bits": 175750144, "q_proj": { "group_size": { @@ -16330,7 +16330,7 @@ } }, { - "accuracy": 0.9863905014568254, + "accuracy": 0.9853010161436702, "total_bits": 179253248, "q_proj": { "group_size": { @@ -16391,7 +16391,7 @@ } }, { - "accuracy": 0.9874883442136803, + "accuracy": 0.9864208882086372, "total_bits": 181592064, "q_proj": { "group_size": { @@ -16452,7 +16452,7 @@ } }, { - "accuracy": 0.9925591436606881, + "accuracy": 0.9919603881426156, "total_bits": 220469248, "q_proj": { "group_size": { @@ -16513,7 +16513,7 @@ } }, { - "accuracy": 0.9936445126506058, + "accuracy": 0.9931313756020054, "total_bits": 223535104, "q_proj": { "group_size": { @@ -16574,7 +16574,7 @@ } }, { - "accuracy": 0.9950577928194482, + "accuracy": 0.994558430570913, "total_bits": 253499392, "q_proj": { "group_size": { @@ -16626,7 +16626,7 @@ } }, { - "accuracy": 0.9967101436157367, + "accuracy": 0.9964824280775103, "total_bits": 265838592, "q_proj": { "group_size": { @@ -16678,7 +16678,7 @@ } }, { - "accuracy": 0.9986815969766069, + "accuracy": 0.9985868175342483, "total_bits": 337385472, "q_proj": { "group_size": { @@ -16732,7 +16732,7 @@ ], "model.layers.8.mlp": [ { - "accuracy": 0.9114434626933775, + "accuracy": 0.9099160409287402, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -16784,7 +16784,7 @@ } }, { - "accuracy": 0.9140108864950507, + "accuracy": 0.9126251845767623, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -16836,7 +16836,7 @@ } }, { - "accuracy": 0.9280736605195623, + "accuracy": 0.9267295008819354, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -16885,7 +16885,7 @@ } }, { - "accuracy": 0.9320498279442913, + "accuracy": 0.9307615366813383, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -16934,7 +16934,7 @@ } }, { - "accuracy": 0.9552673920008697, + "accuracy": 0.9545008730339377, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -16986,7 +16986,7 @@ } }, { - "accuracy": 0.9588710026521432, + "accuracy": 0.9581509520740885, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -17038,7 +17038,7 @@ } }, { - "accuracy": 0.9646268920286706, + "accuracy": 0.9639370361048925, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -17087,7 +17087,7 @@ } }, { - "accuracy": 0.9768101034784004, + "accuracy": 0.9763504872588735, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -17130,7 +17130,7 @@ } }, { - "accuracy": 0.9787262930583797, + "accuracy": 0.9782979533468422, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -17173,7 +17173,7 @@ } }, { - "accuracy": 0.977124530086784, + "accuracy": 0.9767491038104421, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -17225,7 +17225,7 @@ } }, { - "accuracy": 0.9799566481654581, + "accuracy": 0.9796127283357476, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -17277,7 +17277,7 @@ } }, { - "accuracy": 0.9883173551214369, + "accuracy": 0.988122488126943, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -17329,7 +17329,7 @@ } }, { - "accuracy": 0.989986608736217, + "accuracy": 0.9898179635699642, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -17381,7 +17381,7 @@ } }, { - "accuracy": 0.9936494619683608, + "accuracy": 0.9935262526973689, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -17424,7 +17424,7 @@ } }, { - "accuracy": 0.99403378286546, + "accuracy": 0.9939380896914947, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -17473,7 +17473,7 @@ } }, { - "accuracy": 0.9952835758388239, + "accuracy": 0.9951961418295181, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -17519,7 +17519,7 @@ } }, { - "accuracy": 0.9983155575985285, + "accuracy": 0.9982824129248528, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -17561,7 +17561,7 @@ ], "model.layers.9.self_attn": [ { - "accuracy": 0.9178362818140733, + "accuracy": 0.9147989181311507, "total_bits": 89665536, "q_proj": { "group_size": { @@ -17625,7 +17625,7 @@ } }, { - "accuracy": 0.919641686505393, + "accuracy": 0.9145158490068034, "total_bits": 92221440, "q_proj": { "group_size": { @@ -17689,7 +17689,7 @@ } }, { - "accuracy": 0.9359353306262117, + "accuracy": 0.9319906530803755, "total_bits": 95758848, "q_proj": { "group_size": { @@ -17753,7 +17753,7 @@ } }, { - "accuracy": 0.9464520512050704, + "accuracy": 0.9434510640015727, "total_bits": 112272384, "q_proj": { "group_size": { @@ -17817,7 +17817,7 @@ } }, { - "accuracy": 0.9592442696816043, + "accuracy": 0.9567102452642039, "total_bits": 132913152, "q_proj": { "group_size": { @@ -17881,7 +17881,7 @@ } }, { - "accuracy": 0.9588079564273357, + "accuracy": 0.9567822727717852, "total_bits": 132980224, "q_proj": { "group_size": { @@ -17945,7 +17945,7 @@ } }, { - "accuracy": 0.9777955757944208, + "accuracy": 0.975358749102605, "total_bits": 169613312, "q_proj": { "group_size": { @@ -17997,7 +17997,7 @@ } }, { - "accuracy": 0.9782332308394345, + "accuracy": 0.9764222180176723, "total_bits": 169745920, "q_proj": { "group_size": { @@ -18049,7 +18049,7 @@ } }, { - "accuracy": 0.9808911404719478, + "accuracy": 0.9788806583536299, "total_bits": 171195392, "q_proj": { "group_size": { @@ -18101,7 +18101,7 @@ } }, { - "accuracy": 0.981912729036259, + "accuracy": 0.9800338829426389, "total_bits": 173563904, "q_proj": { "group_size": { @@ -18153,7 +18153,7 @@ } }, { - "accuracy": 0.9796171469711944, + "accuracy": 0.9781023707044753, "total_bits": 174923264, "q_proj": { "group_size": { @@ -18217,7 +18217,7 @@ } }, { - "accuracy": 0.9808088033214996, + "accuracy": 0.9794677708690104, "total_bits": 175750144, "q_proj": { "group_size": { @@ -18281,7 +18281,7 @@ } }, { - "accuracy": 0.9844405289347234, + "accuracy": 0.9828459836640641, "total_bits": 179253248, "q_proj": { "group_size": { @@ -18342,7 +18342,7 @@ } }, { - "accuracy": 0.9860807846937525, + "accuracy": 0.9851044471326628, "total_bits": 181592064, "q_proj": { "group_size": { @@ -18403,7 +18403,7 @@ } }, { - "accuracy": 0.9915062421197561, + "accuracy": 0.9908749437890947, "total_bits": 220469248, "q_proj": { "group_size": { @@ -18464,7 +18464,7 @@ } }, { - "accuracy": 0.9929123533840635, + "accuracy": 0.9924298478290439, "total_bits": 223535104, "q_proj": { "group_size": { @@ -18525,7 +18525,7 @@ } }, { - "accuracy": 0.9939596872090509, + "accuracy": 0.9936294125540084, "total_bits": 253499392, "q_proj": { "group_size": { @@ -18577,7 +18577,7 @@ } }, { - "accuracy": 0.9965334626551914, + "accuracy": 0.9963382684846261, "total_bits": 265838592, "q_proj": { "group_size": { @@ -18629,7 +18629,7 @@ } }, { - "accuracy": 0.9984507534567169, + "accuracy": 0.9983228891659038, "total_bits": 337385472, "q_proj": { "group_size": { @@ -18683,7 +18683,7 @@ ], "model.layers.9.mlp": [ { - "accuracy": 0.9091744471929575, + "accuracy": 0.90854089158146, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -18735,7 +18735,7 @@ } }, { - "accuracy": 0.9118311681637639, + "accuracy": 0.9112645805274185, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -18787,7 +18787,7 @@ } }, { - "accuracy": 0.9259752558642312, + "accuracy": 0.9254555192432905, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -18836,7 +18836,7 @@ } }, { - "accuracy": 0.9299621440862355, + "accuracy": 0.9295475853509024, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -18885,7 +18885,7 @@ } }, { - "accuracy": 0.9541753985379872, + "accuracy": 0.9538222521935639, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -18937,7 +18937,7 @@ } }, { - "accuracy": 0.9578626438191062, + "accuracy": 0.9575373954874904, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -18989,7 +18989,7 @@ } }, { - "accuracy": 0.9636124653839752, + "accuracy": 0.9633479091878, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -19038,7 +19038,7 @@ } }, { - "accuracy": 0.9762214837889922, + "accuracy": 0.9759563458593268, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -19081,7 +19081,7 @@ } }, { - "accuracy": 0.978161746734067, + "accuracy": 0.9779436599071089, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -19124,7 +19124,7 @@ } }, { - "accuracy": 0.9765838207186837, + "accuracy": 0.9763963685223931, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -19176,7 +19176,7 @@ } }, { - "accuracy": 0.9794569486556085, + "accuracy": 0.9793033470938864, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -19228,7 +19228,7 @@ } }, { - "accuracy": 0.9880468420880405, + "accuracy": 0.9879485725082064, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -19280,7 +19280,7 @@ } }, { - "accuracy": 0.9897436211620899, + "accuracy": 0.989668093327629, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -19332,7 +19332,7 @@ } }, { - "accuracy": 0.9934926767049259, + "accuracy": 0.9934219423142311, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -19375,7 +19375,7 @@ } }, { - "accuracy": 0.9938939328452474, + "accuracy": 0.9938559937290847, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -19424,7 +19424,7 @@ } }, { - "accuracy": 0.9951528880720664, + "accuracy": 0.9951272335663242, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -19470,7 +19470,7 @@ } }, { - "accuracy": 0.9982778039871176, + "accuracy": 0.9982532308142829, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -19512,7 +19512,7 @@ ], "model.layers.10.self_attn": [ { - "accuracy": 0.9272860884666443, + "accuracy": 0.9260168099089673, "total_bits": 89665536, "q_proj": { "group_size": { @@ -19576,7 +19576,7 @@ } }, { - "accuracy": 0.9302180107486875, + "accuracy": 0.9273232072591782, "total_bits": 92221440, "q_proj": { "group_size": { @@ -19640,7 +19640,7 @@ } }, { - "accuracy": 0.9413315718503374, + "accuracy": 0.9386902937763616, "total_bits": 95758848, "q_proj": { "group_size": { @@ -19704,7 +19704,7 @@ } }, { - "accuracy": 0.9540640745115907, + "accuracy": 0.9519001576853425, "total_bits": 112272384, "q_proj": { "group_size": { @@ -19768,7 +19768,7 @@ } }, { - "accuracy": 0.9637178431608175, + "accuracy": 0.9622136529927191, "total_bits": 132913152, "q_proj": { "group_size": { @@ -19832,7 +19832,7 @@ } }, { - "accuracy": 0.9640948317552868, + "accuracy": 0.9627230168369255, "total_bits": 132980224, "q_proj": { "group_size": { @@ -19896,7 +19896,7 @@ } }, { - "accuracy": 0.9796087876158325, + "accuracy": 0.9785611537334166, "total_bits": 169613312, "q_proj": { "group_size": { @@ -19948,7 +19948,7 @@ } }, { - "accuracy": 0.9797961802564954, + "accuracy": 0.9788986903272177, "total_bits": 169745920, "q_proj": { "group_size": { @@ -20000,7 +20000,7 @@ } }, { - "accuracy": 0.9816929908273252, + "accuracy": 0.9808335604734326, "total_bits": 171195392, "q_proj": { "group_size": { @@ -20052,7 +20052,7 @@ } }, { - "accuracy": 0.9826860945965898, + "accuracy": 0.9817547850114735, "total_bits": 173563904, "q_proj": { "group_size": { @@ -20104,7 +20104,7 @@ } }, { - "accuracy": 0.9821418084596333, + "accuracy": 0.9809134763322378, "total_bits": 174923264, "q_proj": { "group_size": { @@ -20168,7 +20168,7 @@ } }, { - "accuracy": 0.9828495038183112, + "accuracy": 0.9821061907630217, "total_bits": 175750144, "q_proj": { "group_size": { @@ -20232,7 +20232,7 @@ } }, { - "accuracy": 0.9852504982662044, + "accuracy": 0.9847800757147764, "total_bits": 179253248, "q_proj": { "group_size": { @@ -20293,7 +20293,7 @@ } }, { - "accuracy": 0.9865616434008667, + "accuracy": 0.9858180463412091, "total_bits": 181592064, "q_proj": { "group_size": { @@ -20354,7 +20354,7 @@ } }, { - "accuracy": 0.9920558771363607, + "accuracy": 0.9916184154878321, "total_bits": 220469248, "q_proj": { "group_size": { @@ -20415,7 +20415,7 @@ } }, { - "accuracy": 0.9932412711266232, + "accuracy": 0.9929327660142199, "total_bits": 223535104, "q_proj": { "group_size": { @@ -20476,7 +20476,7 @@ } }, { - "accuracy": 0.9947530593183872, + "accuracy": 0.9944713705611464, "total_bits": 253499392, "q_proj": { "group_size": { @@ -20528,7 +20528,7 @@ } }, { - "accuracy": 0.9964173585544095, + "accuracy": 0.9962457851261685, "total_bits": 265838592, "q_proj": { "group_size": { @@ -20580,7 +20580,7 @@ } }, { - "accuracy": 0.9985927642678449, + "accuracy": 0.9984889174382644, "total_bits": 337385472, "q_proj": { "group_size": { @@ -20634,7 +20634,7 @@ ], "model.layers.10.mlp": [ { - "accuracy": 0.9082281465985274, + "accuracy": 0.9075323623654089, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -20686,7 +20686,7 @@ } }, { - "accuracy": 0.9109148557641005, + "accuracy": 0.9102706266076941, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -20738,7 +20738,7 @@ } }, { - "accuracy": 0.9250412800986516, + "accuracy": 0.924500753220759, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -20787,7 +20787,7 @@ } }, { - "accuracy": 0.9290863532376916, + "accuracy": 0.9285951978281924, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -20836,7 +20836,7 @@ } }, { - "accuracy": 0.9537028785991042, + "accuracy": 0.9533497738210779, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -20888,7 +20888,7 @@ } }, { - "accuracy": 0.9573582681386095, + "accuracy": 0.9570253470814541, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -20940,7 +20940,7 @@ } }, { - "accuracy": 0.9632230326533318, + "accuracy": 0.9629240397756037, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -20989,7 +20989,7 @@ } }, { - "accuracy": 0.9760550118394589, + "accuracy": 0.9758446858705658, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -21032,7 +21032,7 @@ } }, { - "accuracy": 0.9779636478051543, + "accuracy": 0.9777678654186035, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -21075,7 +21075,7 @@ } }, { - "accuracy": 0.9763819092492524, + "accuracy": 0.9761960578984336, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -21127,7 +21127,7 @@ } }, { - "accuracy": 0.979239768838804, + "accuracy": 0.9790827447156373, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -21179,7 +21179,7 @@ } }, { - "accuracy": 0.987954590077463, + "accuracy": 0.9878604657653915, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -21231,7 +21231,7 @@ } }, { - "accuracy": 0.9896407628088797, + "accuracy": 0.9895663006035121, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -21283,7 +21283,7 @@ } }, { - "accuracy": 0.9934673812730532, + "accuracy": 0.9934073392988035, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -21326,7 +21326,7 @@ } }, { - "accuracy": 0.993850626909223, + "accuracy": 0.9938080159604157, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -21375,7 +21375,7 @@ } }, { - "accuracy": 0.995097728495143, + "accuracy": 0.9950642152444312, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -21421,7 +21421,7 @@ } }, { - "accuracy": 0.9982704734490988, + "accuracy": 0.9982526966701507, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -21463,7 +21463,7 @@ ], "model.layers.11.self_attn": [ { - "accuracy": 0.9282438594259714, + "accuracy": 0.9234915920778325, "total_bits": 89665536, "q_proj": { "group_size": { @@ -21527,7 +21527,7 @@ } }, { - "accuracy": 0.9283739987172579, + "accuracy": 0.924774644994422, "total_bits": 92221440, "q_proj": { "group_size": { @@ -21591,7 +21591,7 @@ } }, { - "accuracy": 0.93796777137016, + "accuracy": 0.9365185058038485, "total_bits": 95758848, "q_proj": { "group_size": { @@ -21655,7 +21655,7 @@ } }, { - "accuracy": 0.9491332240010563, + "accuracy": 0.9479661776047004, "total_bits": 112272384, "q_proj": { "group_size": { @@ -21719,7 +21719,7 @@ } }, { - "accuracy": 0.9637114225249541, + "accuracy": 0.9613859844639113, "total_bits": 132913152, "q_proj": { "group_size": { @@ -21783,7 +21783,7 @@ } }, { - "accuracy": 0.9634973481297493, + "accuracy": 0.9623094382450769, "total_bits": 132980224, "q_proj": { "group_size": { @@ -21847,7 +21847,7 @@ } }, { - "accuracy": 0.9796298789840779, + "accuracy": 0.9789326298785838, "total_bits": 169613312, "q_proj": { "group_size": { @@ -21899,7 +21899,7 @@ } }, { - "accuracy": 0.9801208466585529, + "accuracy": 0.9794921794612157, "total_bits": 169745920, "q_proj": { "group_size": { @@ -21951,7 +21951,7 @@ } }, { - "accuracy": 0.9818359940361819, + "accuracy": 0.980963638689565, "total_bits": 171195392, "q_proj": { "group_size": { @@ -22003,7 +22003,7 @@ } }, { - "accuracy": 0.9827395484439636, + "accuracy": 0.9822284273901268, "total_bits": 173563904, "q_proj": { "group_size": { @@ -22055,7 +22055,7 @@ } }, { - "accuracy": 0.9812627562664842, + "accuracy": 0.9811755887379772, "total_bits": 174923264, "q_proj": { "group_size": { @@ -22119,7 +22119,7 @@ } }, { - "accuracy": 0.9829997485013384, + "accuracy": 0.9822439918000447, "total_bits": 175750144, "q_proj": { "group_size": { @@ -22183,7 +22183,7 @@ } }, { - "accuracy": 0.9851943114772439, + "accuracy": 0.984695501478487, "total_bits": 179253248, "q_proj": { "group_size": { @@ -22244,7 +22244,7 @@ } }, { - "accuracy": 0.9863403668431076, + "accuracy": 0.9859467323771433, "total_bits": 181592064, "q_proj": { "group_size": { @@ -22305,7 +22305,7 @@ } }, { - "accuracy": 0.9919811441612086, + "accuracy": 0.9918877920135856, "total_bits": 220469248, "q_proj": { "group_size": { @@ -22366,7 +22366,7 @@ } }, { - "accuracy": 0.9932269475324765, + "accuracy": 0.9929040547117198, "total_bits": 223535104, "q_proj": { "group_size": { @@ -22427,7 +22427,7 @@ } }, { - "accuracy": 0.9948224880561036, + "accuracy": 0.994516446132605, "total_bits": 253499392, "q_proj": { "group_size": { @@ -22479,7 +22479,7 @@ } }, { - "accuracy": 0.9965398360386883, + "accuracy": 0.9963599712048706, "total_bits": 265838592, "q_proj": { "group_size": { @@ -22531,7 +22531,7 @@ } }, { - "accuracy": 0.9985943438093129, + "accuracy": 0.9985572345628354, "total_bits": 337385472, "q_proj": { "group_size": { @@ -22585,7 +22585,7 @@ ], "model.layers.11.mlp": [ { - "accuracy": 0.9057635198298254, + "accuracy": 0.9053019261673877, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -22637,7 +22637,7 @@ } }, { - "accuracy": 0.9085585947491621, + "accuracy": 0.9081228714632361, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -22689,7 +22689,7 @@ } }, { - "accuracy": 0.9231375395075271, + "accuracy": 0.9227863093347926, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -22738,7 +22738,7 @@ } }, { - "accuracy": 0.9273199850791379, + "accuracy": 0.9270123076674185, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -22787,7 +22787,7 @@ } }, { - "accuracy": 0.9522600981749987, + "accuracy": 0.9520112499594688, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -22839,7 +22839,7 @@ } }, { - "accuracy": 0.9561043822843778, + "accuracy": 0.9559071977671824, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -22891,7 +22891,7 @@ } }, { - "accuracy": 0.9621116436625782, + "accuracy": 0.9619493219805391, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -22940,7 +22940,7 @@ } }, { - "accuracy": 0.9751554638343422, + "accuracy": 0.9749932609694568, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -22983,7 +22983,7 @@ } }, { - "accuracy": 0.9771501181255046, + "accuracy": 0.9770038736690032, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -23026,7 +23026,7 @@ } }, { - "accuracy": 0.9755503599973101, + "accuracy": 0.9754386555991674, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -23078,7 +23078,7 @@ } }, { - "accuracy": 0.9785394592602786, + "accuracy": 0.9784368238852996, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -23130,7 +23130,7 @@ } }, { - "accuracy": 0.9874916356056929, + "accuracy": 0.9874446595479783, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -23182,7 +23182,7 @@ } }, { - "accuracy": 0.9892735714828106, + "accuracy": 0.9892231926910187, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -23234,7 +23234,7 @@ } }, { - "accuracy": 0.993180731139881, + "accuracy": 0.9931359945453311, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -23277,7 +23277,7 @@ } }, { - "accuracy": 0.9936142210897646, + "accuracy": 0.9935875339188466, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -23326,7 +23326,7 @@ } }, { - "accuracy": 0.9949295579480302, + "accuracy": 0.994917523900145, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -23372,7 +23372,7 @@ } }, { - "accuracy": 0.9982013077671198, + "accuracy": 0.9981861404866275, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -23414,7 +23414,7 @@ ], "model.layers.12.self_attn": [ { - "accuracy": 0.92346174328735, + "accuracy": 0.9177081755509502, "total_bits": 89665536, "q_proj": { "group_size": { @@ -23478,7 +23478,7 @@ } }, { - "accuracy": 0.9266516950569654, + "accuracy": 0.9210440653719401, "total_bits": 92221440, "q_proj": { "group_size": { @@ -23542,7 +23542,7 @@ } }, { - "accuracy": 0.9388597101757401, + "accuracy": 0.9341432379656717, "total_bits": 95758848, "q_proj": { "group_size": { @@ -23606,7 +23606,7 @@ } }, { - "accuracy": 0.9534609174649966, + "accuracy": 0.9493519644203939, "total_bits": 112272384, "q_proj": { "group_size": { @@ -23670,7 +23670,7 @@ } }, { - "accuracy": 0.9616208381362652, + "accuracy": 0.9592909201195365, "total_bits": 132913152, "q_proj": { "group_size": { @@ -23734,7 +23734,7 @@ } }, { - "accuracy": 0.9621965485183817, + "accuracy": 0.9602762185233205, "total_bits": 132980224, "q_proj": { "group_size": { @@ -23798,7 +23798,7 @@ } }, { - "accuracy": 0.9785458741611556, + "accuracy": 0.9776099850668719, "total_bits": 169613312, "q_proj": { "group_size": { @@ -23850,7 +23850,7 @@ } }, { - "accuracy": 0.979201380408516, + "accuracy": 0.9779021551734522, "total_bits": 169745920, "q_proj": { "group_size": { @@ -23902,7 +23902,7 @@ } }, { - "accuracy": 0.9808099021350867, + "accuracy": 0.9793077972472498, "total_bits": 171195392, "q_proj": { "group_size": { @@ -23954,7 +23954,7 @@ } }, { - "accuracy": 0.9815549087759695, + "accuracy": 0.9802125572275958, "total_bits": 173563904, "q_proj": { "group_size": { @@ -24006,7 +24006,7 @@ } }, { - "accuracy": 0.9811999694395223, + "accuracy": 0.9796748763244403, "total_bits": 174923264, "q_proj": { "group_size": { @@ -24070,7 +24070,7 @@ } }, { - "accuracy": 0.9823770262300968, + "accuracy": 0.9809421344023002, "total_bits": 175750144, "q_proj": { "group_size": { @@ -24134,7 +24134,7 @@ } }, { - "accuracy": 0.9850662669264957, + "accuracy": 0.9838554892983091, "total_bits": 179253248, "q_proj": { "group_size": { @@ -24195,7 +24195,7 @@ } }, { - "accuracy": 0.9861097527471813, + "accuracy": 0.9850622667489868, "total_bits": 181592064, "q_proj": { "group_size": { @@ -24256,7 +24256,7 @@ } }, { - "accuracy": 0.9917866191581676, + "accuracy": 0.9911956275372129, "total_bits": 220469248, "q_proj": { "group_size": { @@ -24317,7 +24317,7 @@ } }, { - "accuracy": 0.9930157423950732, + "accuracy": 0.9924398446945768, "total_bits": 223535104, "q_proj": { "group_size": { @@ -24378,7 +24378,7 @@ } }, { - "accuracy": 0.9944038968043107, + "accuracy": 0.9940825063539179, "total_bits": 253499392, "q_proj": { "group_size": { @@ -24430,7 +24430,7 @@ } }, { - "accuracy": 0.9963409042010378, + "accuracy": 0.9960676462781665, "total_bits": 265838592, "q_proj": { "group_size": { @@ -24482,7 +24482,7 @@ } }, { - "accuracy": 0.9985070177047563, + "accuracy": 0.9983926095975268, "total_bits": 337385472, "q_proj": { "group_size": { @@ -24536,7 +24536,7 @@ ], "model.layers.12.mlp": [ { - "accuracy": 0.9036301703829515, + "accuracy": 0.9029942770537577, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -24588,7 +24588,7 @@ } }, { - "accuracy": 0.9065264049721391, + "accuracy": 0.9059699728692833, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -24640,7 +24640,7 @@ } }, { - "accuracy": 0.9215670565241262, + "accuracy": 0.9210211334652022, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -24689,7 +24689,7 @@ } }, { - "accuracy": 0.9259577689594344, + "accuracy": 0.9254641823078457, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -24738,7 +24738,7 @@ } }, { - "accuracy": 0.9510227147685855, + "accuracy": 0.9507614978049931, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -24790,7 +24790,7 @@ } }, { - "accuracy": 0.9551253197224516, + "accuracy": 0.9548749017872309, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -24842,7 +24842,7 @@ } }, { - "accuracy": 0.9613188112056569, + "accuracy": 0.9610721025811999, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -24891,7 +24891,7 @@ } }, { - "accuracy": 0.9742740799525851, + "accuracy": 0.9740628272687134, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -24934,7 +24934,7 @@ } }, { - "accuracy": 0.9764540864056662, + "accuracy": 0.9762556588179186, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -24977,7 +24977,7 @@ } }, { - "accuracy": 0.9748966069401879, + "accuracy": 0.9747795189093602, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -25029,7 +25029,7 @@ } }, { - "accuracy": 0.9780550748599988, + "accuracy": 0.9779397047271854, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -25081,7 +25081,7 @@ } }, { - "accuracy": 0.9871470147351685, + "accuracy": 0.9870867412047166, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -25133,7 +25133,7 @@ } }, { - "accuracy": 0.989016763473812, + "accuracy": 0.9889602209441364, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -25185,7 +25185,7 @@ } }, { - "accuracy": 0.9929028342379943, + "accuracy": 0.9928382109409493, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -25228,7 +25228,7 @@ } }, { - "accuracy": 0.9934521347627436, + "accuracy": 0.9934198788955415, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -25277,7 +25277,7 @@ } }, { - "accuracy": 0.994853079208712, + "accuracy": 0.9948250617660386, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -25323,7 +25323,7 @@ } }, { - "accuracy": 0.9981136623537168, + "accuracy": 0.9980883319849932, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -25365,7 +25365,7 @@ ], "model.layers.13.self_attn": [ { - "accuracy": 0.9152934751228282, + "accuracy": 0.9131190674869638, "total_bits": 89665536, "q_proj": { "group_size": { @@ -25429,7 +25429,7 @@ } }, { - "accuracy": 0.916959138881219, + "accuracy": 0.9158147491122547, "total_bits": 92221440, "q_proj": { "group_size": { @@ -25493,7 +25493,7 @@ } }, { - "accuracy": 0.9288980923593044, + "accuracy": 0.9272799966366667, "total_bits": 95758848, "q_proj": { "group_size": { @@ -25557,7 +25557,7 @@ } }, { - "accuracy": 0.9432535473453372, + "accuracy": 0.941761592893224, "total_bits": 112272384, "q_proj": { "group_size": { @@ -25621,7 +25621,7 @@ } }, { - "accuracy": 0.9564987228889215, + "accuracy": 0.9562998312084299, "total_bits": 132913152, "q_proj": { "group_size": { @@ -25685,7 +25685,7 @@ } }, { - "accuracy": 0.9574877163885456, + "accuracy": 0.956985551373739, "total_bits": 132980224, "q_proj": { "group_size": { @@ -25749,7 +25749,7 @@ } }, { - "accuracy": 0.9766972854145264, + "accuracy": 0.9759827924794272, "total_bits": 169613312, "q_proj": { "group_size": { @@ -25801,7 +25801,7 @@ } }, { - "accuracy": 0.977453015891737, + "accuracy": 0.9767849347309062, "total_bits": 169745920, "q_proj": { "group_size": { @@ -25853,7 +25853,7 @@ } }, { - "accuracy": 0.9789451199436658, + "accuracy": 0.9784457761500227, "total_bits": 171195392, "q_proj": { "group_size": { @@ -25905,7 +25905,7 @@ } }, { - "accuracy": 0.9802414507262016, + "accuracy": 0.9794315538418136, "total_bits": 173563904, "q_proj": { "group_size": { @@ -25957,7 +25957,7 @@ } }, { - "accuracy": 0.9789471958126676, + "accuracy": 0.9786563825450445, "total_bits": 174923264, "q_proj": { "group_size": { @@ -26021,7 +26021,7 @@ } }, { - "accuracy": 0.9804479740069885, + "accuracy": 0.9798056222498417, "total_bits": 175750144, "q_proj": { "group_size": { @@ -26085,7 +26085,7 @@ } }, { - "accuracy": 0.983116311364268, + "accuracy": 0.9828121969966512, "total_bits": 179253248, "q_proj": { "group_size": { @@ -26146,7 +26146,7 @@ } }, { - "accuracy": 0.9843086968911322, + "accuracy": 0.9840821132652069, "total_bits": 181592064, "q_proj": { "group_size": { @@ -26207,7 +26207,7 @@ } }, { - "accuracy": 0.9907392179593444, + "accuracy": 0.9908058126457036, "total_bits": 220469248, "q_proj": { "group_size": { @@ -26268,7 +26268,7 @@ } }, { - "accuracy": 0.9921443703045186, + "accuracy": 0.9919813703500518, "total_bits": 223535104, "q_proj": { "group_size": { @@ -26329,7 +26329,7 @@ } }, { - "accuracy": 0.9940082805084163, + "accuracy": 0.9939188195245439, "total_bits": 253499392, "q_proj": { "group_size": { @@ -26381,7 +26381,7 @@ } }, { - "accuracy": 0.9959271975155723, + "accuracy": 0.9958502633595153, "total_bits": 265838592, "q_proj": { "group_size": { @@ -26433,7 +26433,7 @@ } }, { - "accuracy": 0.998376496209714, + "accuracy": 0.9983784957041376, "total_bits": 337385472, "q_proj": { "group_size": { @@ -26487,7 +26487,7 @@ ], "model.layers.13.mlp": [ { - "accuracy": 0.9006116872555331, + "accuracy": 0.8993301932748995, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -26539,7 +26539,7 @@ } }, { - "accuracy": 0.9036720120593121, + "accuracy": 0.9024810822386491, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -26591,7 +26591,7 @@ } }, { - "accuracy": 0.919114638119936, + "accuracy": 0.9180228772916292, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -26640,7 +26640,7 @@ } }, { - "accuracy": 0.9236063427830997, + "accuracy": 0.9225989678188374, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -26689,7 +26689,7 @@ } }, { - "accuracy": 0.949788094743302, + "accuracy": 0.949177583189387, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -26741,7 +26741,7 @@ } }, { - "accuracy": 0.9538923608825395, + "accuracy": 0.9533256627619267, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -26793,7 +26793,7 @@ } }, { - "accuracy": 0.9602242367048013, + "accuracy": 0.9596941836766506, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -26842,7 +26842,7 @@ } }, { - "accuracy": 0.9737078471991577, + "accuracy": 0.973284112191514, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -26885,7 +26885,7 @@ } }, { - "accuracy": 0.97588300381444, + "accuracy": 0.9754906800624571, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -26928,7 +26928,7 @@ } }, { - "accuracy": 0.9743558776221777, + "accuracy": 0.9740401219184461, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -26980,7 +26980,7 @@ } }, { - "accuracy": 0.9775336726421588, + "accuracy": 0.9772566586830899, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -27032,7 +27032,7 @@ } }, { - "accuracy": 0.9869005446273246, + "accuracy": 0.9867376312123317, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -27084,7 +27084,7 @@ } }, { - "accuracy": 0.9887787032578337, + "accuracy": 0.9886381407758515, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -27136,7 +27136,7 @@ } }, { - "accuracy": 0.9927801914807213, + "accuracy": 0.992657635753092, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -27179,7 +27179,7 @@ } }, { - "accuracy": 0.9933302890215265, + "accuracy": 0.9932638647671985, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -27228,7 +27228,7 @@ } }, { - "accuracy": 0.9946927819033399, + "accuracy": 0.9946364454042754, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -27274,7 +27274,7 @@ } }, { - "accuracy": 0.9980731896480153, + "accuracy": 0.9980299310072472, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -27316,7 +27316,7 @@ ], "model.layers.14.self_attn": [ { - "accuracy": 0.9205027222633362, + "accuracy": 0.9131143759740026, "total_bits": 89665536, "q_proj": { "group_size": { @@ -27380,7 +27380,7 @@ } }, { - "accuracy": 0.9227886633261254, + "accuracy": 0.9154409154465324, "total_bits": 92221440, "q_proj": { "group_size": { @@ -27444,7 +27444,7 @@ } }, { - "accuracy": 0.9318458961420938, + "accuracy": 0.9273906307000863, "total_bits": 95758848, "q_proj": { "group_size": { @@ -27508,7 +27508,7 @@ } }, { - "accuracy": 0.9456742019637635, + "accuracy": 0.9422794735353244, "total_bits": 112272384, "q_proj": { "group_size": { @@ -27572,7 +27572,7 @@ } }, { - "accuracy": 0.9591158910801536, + "accuracy": 0.9565369080948203, "total_bits": 132913152, "q_proj": { "group_size": { @@ -27636,7 +27636,7 @@ } }, { - "accuracy": 0.959651744189231, + "accuracy": 0.9575513220931354, "total_bits": 132980224, "q_proj": { "group_size": { @@ -27700,7 +27700,7 @@ } }, { - "accuracy": 0.9764563710869927, + "accuracy": 0.9749602542111748, "total_bits": 169613312, "q_proj": { "group_size": { @@ -27752,7 +27752,7 @@ } }, { - "accuracy": 0.9770543643910634, + "accuracy": 0.9756693387109983, "total_bits": 169745920, "q_proj": { "group_size": { @@ -27804,7 +27804,7 @@ } }, { - "accuracy": 0.9788302108645439, + "accuracy": 0.9771783634235984, "total_bits": 171195392, "q_proj": { "group_size": { @@ -27856,7 +27856,7 @@ } }, { - "accuracy": 0.9800073148584679, + "accuracy": 0.9784984001399655, "total_bits": 173563904, "q_proj": { "group_size": { @@ -27908,7 +27908,7 @@ } }, { - "accuracy": 0.9795524974990832, + "accuracy": 0.9781653034059625, "total_bits": 174923264, "q_proj": { "group_size": { @@ -27972,7 +27972,7 @@ } }, { - "accuracy": 0.9810624413290306, + "accuracy": 0.97952327230259, "total_bits": 175750144, "q_proj": { "group_size": { @@ -28036,7 +28036,7 @@ } }, { - "accuracy": 0.9833355853334069, + "accuracy": 0.9820284449838494, "total_bits": 179253248, "q_proj": { "group_size": { @@ -28097,7 +28097,7 @@ } }, { - "accuracy": 0.9845118442746369, + "accuracy": 0.9836551540188099, "total_bits": 181592064, "q_proj": { "group_size": { @@ -28158,7 +28158,7 @@ } }, { - "accuracy": 0.990971889395855, + "accuracy": 0.9903581722051298, "total_bits": 220469248, "q_proj": { "group_size": { @@ -28219,7 +28219,7 @@ } }, { - "accuracy": 0.9923853569075858, + "accuracy": 0.9917885243990704, "total_bits": 223535104, "q_proj": { "group_size": { @@ -28280,7 +28280,7 @@ } }, { - "accuracy": 0.9939501654405735, + "accuracy": 0.9932864235567027, "total_bits": 253499392, "q_proj": { "group_size": { @@ -28332,7 +28332,7 @@ } }, { - "accuracy": 0.9958047512305999, + "accuracy": 0.9955214504887792, "total_bits": 265838592, "q_proj": { "group_size": { @@ -28384,7 +28384,7 @@ } }, { - "accuracy": 0.9984015154492992, + "accuracy": 0.9982598438601646, "total_bits": 337385472, "q_proj": { "group_size": { @@ -28438,7 +28438,7 @@ ], "model.layers.14.mlp": [ { - "accuracy": 0.8969062178542739, + "accuracy": 0.8952913723493877, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -28490,7 +28490,7 @@ } }, { - "accuracy": 0.9002050722115919, + "accuracy": 0.8986984126661953, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -28542,7 +28542,7 @@ } }, { - "accuracy": 0.9160937617876028, + "accuracy": 0.9147512208866446, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -28591,7 +28591,7 @@ } }, { - "accuracy": 0.9210172295570374, + "accuracy": 0.9197725935986167, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -28640,7 +28640,7 @@ } }, { - "accuracy": 0.9478068847797418, + "accuracy": 0.9470671182008166, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -28692,7 +28692,7 @@ } }, { - "accuracy": 0.9520839676260948, + "accuracy": 0.9513948881312421, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -28744,7 +28744,7 @@ } }, { - "accuracy": 0.9587062713935187, + "accuracy": 0.9580837692085066, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -28793,7 +28793,7 @@ } }, { - "accuracy": 0.9724062008685187, + "accuracy": 0.9719526274619918, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -28836,7 +28836,7 @@ } }, { - "accuracy": 0.9746922722184345, + "accuracy": 0.974264508211299, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -28879,7 +28879,7 @@ } }, { - "accuracy": 0.9733288030287153, + "accuracy": 0.9729546288910665, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -28931,7 +28931,7 @@ } }, { - "accuracy": 0.9766540848895123, + "accuracy": 0.9763253167467681, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -28983,7 +28983,7 @@ } }, { - "accuracy": 0.9863802348018477, + "accuracy": 0.9861926331527924, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -29035,7 +29035,7 @@ } }, { - "accuracy": 0.9883242514670679, + "accuracy": 0.9881630971243507, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -29087,7 +29087,7 @@ } }, { - "accuracy": 0.9924002342465285, + "accuracy": 0.9922697508805677, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -29130,7 +29130,7 @@ } }, { - "accuracy": 0.9930846782058085, + "accuracy": 0.9929906870483568, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -29179,7 +29179,7 @@ } }, { - "accuracy": 0.9945309839186895, + "accuracy": 0.9944456925885262, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -29225,7 +29225,7 @@ } }, { - "accuracy": 0.9979677209569338, + "accuracy": 0.997922707152994, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -29267,7 +29267,7 @@ ], "model.layers.15.self_attn": [ { - "accuracy": 0.9128122847331197, + "accuracy": 0.9089588879754669, "total_bits": 89665536, "q_proj": { "group_size": { @@ -29331,7 +29331,7 @@ } }, { - "accuracy": 0.9150226155394002, + "accuracy": 0.9102917842959103, "total_bits": 92221440, "q_proj": { "group_size": { @@ -29395,7 +29395,7 @@ } }, { - "accuracy": 0.9258082771771833, + "accuracy": 0.9253257667939914, "total_bits": 95758848, "q_proj": { "group_size": { @@ -29459,7 +29459,7 @@ } }, { - "accuracy": 0.9410199999417129, + "accuracy": 0.941281175927112, "total_bits": 112272384, "q_proj": { "group_size": { @@ -29523,7 +29523,7 @@ } }, { - "accuracy": 0.9544542884748233, + "accuracy": 0.953925563708732, "total_bits": 132913152, "q_proj": { "group_size": { @@ -29587,7 +29587,7 @@ } }, { - "accuracy": 0.9551517465396931, + "accuracy": 0.954911494529561, "total_bits": 132980224, "q_proj": { "group_size": { @@ -29651,7 +29651,7 @@ } }, { - "accuracy": 0.9747305720260269, + "accuracy": 0.9738605508678838, "total_bits": 169613312, "q_proj": { "group_size": { @@ -29703,7 +29703,7 @@ } }, { - "accuracy": 0.975976746039171, + "accuracy": 0.9751915901311135, "total_bits": 169745920, "q_proj": { "group_size": { @@ -29755,7 +29755,7 @@ } }, { - "accuracy": 0.9779046514120541, + "accuracy": 0.9774157483326761, "total_bits": 171195392, "q_proj": { "group_size": { @@ -29807,7 +29807,7 @@ } }, { - "accuracy": 0.9786451167770123, + "accuracy": 0.9785601658452499, "total_bits": 173563904, "q_proj": { "group_size": { @@ -29859,7 +29859,7 @@ } }, { - "accuracy": 0.9782757571849384, + "accuracy": 0.9770640863203689, "total_bits": 174923264, "q_proj": { "group_size": { @@ -29923,7 +29923,7 @@ } }, { - "accuracy": 0.9793739006119339, + "accuracy": 0.9789585914756906, "total_bits": 175750144, "q_proj": { "group_size": { @@ -29987,7 +29987,7 @@ } }, { - "accuracy": 0.9822194188539135, + "accuracy": 0.9818499448071969, "total_bits": 179253248, "q_proj": { "group_size": { @@ -30048,7 +30048,7 @@ } }, { - "accuracy": 0.983648861562343, + "accuracy": 0.9832866513905557, "total_bits": 181592064, "q_proj": { "group_size": { @@ -30109,7 +30109,7 @@ } }, { - "accuracy": 0.990093398569642, + "accuracy": 0.9898972917887333, "total_bits": 220469248, "q_proj": { "group_size": { @@ -30170,7 +30170,7 @@ } }, { - "accuracy": 0.9918086134681576, + "accuracy": 0.9916349354837286, "total_bits": 223535104, "q_proj": { "group_size": { @@ -30231,7 +30231,7 @@ } }, { - "accuracy": 0.9934967576869225, + "accuracy": 0.9932825523183534, "total_bits": 253499392, "q_proj": { "group_size": { @@ -30283,7 +30283,7 @@ } }, { - "accuracy": 0.9958440971707827, + "accuracy": 0.9957623771073199, "total_bits": 265838592, "q_proj": { "group_size": { @@ -30335,7 +30335,7 @@ } }, { - "accuracy": 0.9982820799280154, + "accuracy": 0.9982198519926322, "total_bits": 337385472, "q_proj": { "group_size": { @@ -30389,7 +30389,7 @@ ], "model.layers.15.mlp": [ { - "accuracy": 0.8914005728928667, + "accuracy": 0.8900455122715548, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -30441,7 +30441,7 @@ } }, { - "accuracy": 0.8949090897252685, + "accuracy": 0.8936422384883228, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -30493,7 +30493,7 @@ } }, { - "accuracy": 0.9120906560044539, + "accuracy": 0.9109154825932101, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -30542,7 +30542,7 @@ } }, { - "accuracy": 0.9172241074082098, + "accuracy": 0.9161352685799724, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -30591,7 +30591,7 @@ } }, { - "accuracy": 0.945448553875873, + "accuracy": 0.9447537437081337, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -30643,7 +30643,7 @@ } }, { - "accuracy": 0.949826220344556, + "accuracy": 0.9492049317218756, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -30695,7 +30695,7 @@ } }, { - "accuracy": 0.9568474733907926, + "accuracy": 0.956260095987665, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -30744,7 +30744,7 @@ } }, { - "accuracy": 0.971343044093565, + "accuracy": 0.9709044217475151, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -30787,7 +30787,7 @@ } }, { - "accuracy": 0.9736610201040381, + "accuracy": 0.9732388975588899, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -30830,7 +30830,7 @@ } }, { - "accuracy": 0.9721537014763606, + "accuracy": 0.9718087699852491, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -30882,7 +30882,7 @@ } }, { - "accuracy": 0.9755813801955235, + "accuracy": 0.9752611500260077, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -30934,7 +30934,7 @@ } }, { - "accuracy": 0.9857970079112994, + "accuracy": 0.9856160360535509, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -30986,7 +30986,7 @@ } }, { - "accuracy": 0.9878109168065222, + "accuracy": 0.987651148124745, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -31038,7 +31038,7 @@ } }, { - "accuracy": 0.9921418049274698, + "accuracy": 0.9920113448200649, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -31081,7 +31081,7 @@ } }, { - "accuracy": 0.9927716975492474, + "accuracy": 0.9926830940928898, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -31130,7 +31130,7 @@ } }, { - "accuracy": 0.9942791132795575, + "accuracy": 0.9941935016234454, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -31176,7 +31176,7 @@ } }, { - "accuracy": 0.9978831031629326, + "accuracy": 0.9978376184590161, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -31218,7 +31218,7 @@ ], "model.layers.16.self_attn": [ { - "accuracy": 0.9276164619154051, + "accuracy": 0.9224674572285853, "total_bits": 89665536, "q_proj": { "group_size": { @@ -31282,7 +31282,7 @@ } }, { - "accuracy": 0.9302929130039717, + "accuracy": 0.9254111239784643, "total_bits": 92221440, "q_proj": { "group_size": { @@ -31346,7 +31346,7 @@ } }, { - "accuracy": 0.9388603354363065, + "accuracy": 0.9378393435556638, "total_bits": 95758848, "q_proj": { "group_size": { @@ -31410,7 +31410,7 @@ } }, { - "accuracy": 0.9521176928752347, + "accuracy": 0.9503926211281827, "total_bits": 112272384, "q_proj": { "group_size": { @@ -31474,7 +31474,7 @@ } }, { - "accuracy": 0.9626472450204586, + "accuracy": 0.960383852943778, "total_bits": 132913152, "q_proj": { "group_size": { @@ -31538,7 +31538,7 @@ } }, { - "accuracy": 0.9633555515228134, + "accuracy": 0.9616616172225851, "total_bits": 132980224, "q_proj": { "group_size": { @@ -31602,7 +31602,7 @@ } }, { - "accuracy": 0.9769954787273156, + "accuracy": 0.975998291647748, "total_bits": 169613312, "q_proj": { "group_size": { @@ -31654,7 +31654,7 @@ } }, { - "accuracy": 0.9783493744111375, + "accuracy": 0.9773986268004304, "total_bits": 169745920, "q_proj": { "group_size": { @@ -31706,7 +31706,7 @@ } }, { - "accuracy": 0.980003807399618, + "accuracy": 0.9791314468572014, "total_bits": 171195392, "q_proj": { "group_size": { @@ -31758,7 +31758,7 @@ } }, { - "accuracy": 0.9812607052490899, + "accuracy": 0.980054777997889, "total_bits": 173563904, "q_proj": { "group_size": { @@ -31810,7 +31810,7 @@ } }, { - "accuracy": 0.9813340871447795, + "accuracy": 0.9804569534761342, "total_bits": 174923264, "q_proj": { "group_size": { @@ -31874,7 +31874,7 @@ } }, { - "accuracy": 0.982675175966793, + "accuracy": 0.9816380170124926, "total_bits": 175750144, "q_proj": { "group_size": { @@ -31938,7 +31938,7 @@ } }, { - "accuracy": 0.9844471363252715, + "accuracy": 0.9843807564558167, "total_bits": 179253248, "q_proj": { "group_size": { @@ -31999,7 +31999,7 @@ } }, { - "accuracy": 0.9860259525379852, + "accuracy": 0.9856414337593474, "total_bits": 181592064, "q_proj": { "group_size": { @@ -32060,7 +32060,7 @@ } }, { - "accuracy": 0.9916171746720609, + "accuracy": 0.9914116855759761, "total_bits": 220469248, "q_proj": { "group_size": { @@ -32121,7 +32121,7 @@ } }, { - "accuracy": 0.9929631713924831, + "accuracy": 0.9927732744254172, "total_bits": 223535104, "q_proj": { "group_size": { @@ -32182,7 +32182,7 @@ } }, { - "accuracy": 0.9940083497939142, + "accuracy": 0.9937797100773376, "total_bits": 253499392, "q_proj": { "group_size": { @@ -32234,7 +32234,7 @@ } }, { - "accuracy": 0.9962043645546624, + "accuracy": 0.9960941228231317, "total_bits": 265838592, "q_proj": { "group_size": { @@ -32286,7 +32286,7 @@ } }, { - "accuracy": 0.9983653944708701, + "accuracy": 0.9983332439105174, "total_bits": 337385472, "q_proj": { "group_size": { @@ -32340,7 +32340,7 @@ ], "model.layers.16.mlp": [ { - "accuracy": 0.8932184153481534, + "accuracy": 0.891506900912837, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -32392,7 +32392,7 @@ } }, { - "accuracy": 0.896572481644781, + "accuracy": 0.894897130367003, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -32444,7 +32444,7 @@ } }, { - "accuracy": 0.9132255500084475, + "accuracy": 0.9118173428271946, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -32493,7 +32493,7 @@ } }, { - "accuracy": 0.9183859829055636, + "accuracy": 0.9171442428701803, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -32542,7 +32542,7 @@ } }, { - "accuracy": 0.9461143326602484, + "accuracy": 0.9451728220048704, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -32594,7 +32594,7 @@ } }, { - "accuracy": 0.9504349337596643, + "accuracy": 0.9495925532751962, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -32646,7 +32646,7 @@ } }, { - "accuracy": 0.9574292596233518, + "accuracy": 0.9567234086755075, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -32695,7 +32695,7 @@ } }, { - "accuracy": 0.9716716574406937, + "accuracy": 0.9711121674627066, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -32738,7 +32738,7 @@ } }, { - "accuracy": 0.9740218467226154, + "accuracy": 0.9735319796753558, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -32781,7 +32781,7 @@ } }, { - "accuracy": 0.972479686435116, + "accuracy": 0.9720074568728083, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -32833,7 +32833,7 @@ } }, { - "accuracy": 0.9758817764293206, + "accuracy": 0.9754816048631543, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -32885,7 +32885,7 @@ } }, { - "accuracy": 0.9859518863652882, + "accuracy": 0.9857210747309422, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -32937,7 +32937,7 @@ } }, { - "accuracy": 0.9879571411170458, + "accuracy": 0.9877544392978674, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -32989,7 +32989,7 @@ } }, { - "accuracy": 0.9922260953799674, + "accuracy": 0.992076809101395, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -33032,7 +33032,7 @@ } }, { - "accuracy": 0.9928559448422962, + "accuracy": 0.9927341479955143, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -33081,7 +33081,7 @@ } }, { - "accuracy": 0.9943434854626263, + "accuracy": 0.9942599462198192, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -33127,7 +33127,7 @@ } }, { - "accuracy": 0.9979085323131202, + "accuracy": 0.9978663274944809, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -33169,7 +33169,7 @@ ], "model.layers.17.self_attn": [ { - "accuracy": 0.9337116668098852, + "accuracy": 0.9327367538292157, "total_bits": 89665536, "q_proj": { "group_size": { @@ -33233,7 +33233,7 @@ } }, { - "accuracy": 0.9363457407606275, + "accuracy": 0.9359054702677225, "total_bits": 92221440, "q_proj": { "group_size": { @@ -33297,7 +33297,7 @@ } }, { - "accuracy": 0.9446112905677996, + "accuracy": 0.9450910644311654, "total_bits": 95758848, "q_proj": { "group_size": { @@ -33361,7 +33361,7 @@ } }, { - "accuracy": 0.9555443115532398, + "accuracy": 0.9560589472714224, "total_bits": 112272384, "q_proj": { "group_size": { @@ -33425,7 +33425,7 @@ } }, { - "accuracy": 0.9661162508357513, + "accuracy": 0.9657368129609447, "total_bits": 132913152, "q_proj": { "group_size": { @@ -33489,7 +33489,7 @@ } }, { - "accuracy": 0.9664030280944548, + "accuracy": 0.9655536907283884, "total_bits": 132980224, "q_proj": { "group_size": { @@ -33553,7 +33553,7 @@ } }, { - "accuracy": 0.9798138077910009, + "accuracy": 0.9795156425159228, "total_bits": 169613312, "q_proj": { "group_size": { @@ -33605,7 +33605,7 @@ } }, { - "accuracy": 0.9805734202657875, + "accuracy": 0.9800936651759242, "total_bits": 169745920, "q_proj": { "group_size": { @@ -33657,7 +33657,7 @@ } }, { - "accuracy": 0.9818189546563908, + "accuracy": 0.9815763250777596, "total_bits": 171195392, "q_proj": { "group_size": { @@ -33709,7 +33709,7 @@ } }, { - "accuracy": 0.9827360209861868, + "accuracy": 0.9823656393901298, "total_bits": 173563904, "q_proj": { "group_size": { @@ -33761,7 +33761,7 @@ } }, { - "accuracy": 0.982644286104723, + "accuracy": 0.9822438932269028, "total_bits": 174923264, "q_proj": { "group_size": { @@ -33825,7 +33825,7 @@ } }, { - "accuracy": 0.9836074570193887, + "accuracy": 0.9832804790747008, "total_bits": 175750144, "q_proj": { "group_size": { @@ -33889,7 +33889,7 @@ } }, { - "accuracy": 0.9860271717862863, + "accuracy": 0.9858677278419858, "total_bits": 179253248, "q_proj": { "group_size": { @@ -33950,7 +33950,7 @@ } }, { - "accuracy": 0.9873345177130479, + "accuracy": 0.9869831095596677, "total_bits": 181592064, "q_proj": { "group_size": { @@ -34011,7 +34011,7 @@ } }, { - "accuracy": 0.9924936025942627, + "accuracy": 0.9922622250344016, "total_bits": 220469248, "q_proj": { "group_size": { @@ -34072,7 +34072,7 @@ } }, { - "accuracy": 0.9936388629047495, + "accuracy": 0.9935795820416197, "total_bits": 223535104, "q_proj": { "group_size": { @@ -34133,7 +34133,7 @@ } }, { - "accuracy": 0.9946833217614576, + "accuracy": 0.9944344076671099, "total_bits": 253499392, "q_proj": { "group_size": { @@ -34185,7 +34185,7 @@ } }, { - "accuracy": 0.9968069684691727, + "accuracy": 0.9967062117066234, "total_bits": 265838592, "q_proj": { "group_size": { @@ -34237,7 +34237,7 @@ } }, { - "accuracy": 0.9985670397352231, + "accuracy": 0.9985337449164179, "total_bits": 337385472, "q_proj": { "group_size": { @@ -34291,7 +34291,7 @@ ], "model.layers.17.mlp": [ { - "accuracy": 0.8935036631791216, + "accuracy": 0.8908158191724828, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -34343,7 +34343,7 @@ } }, { - "accuracy": 0.8967085649308405, + "accuracy": 0.8940835101039786, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -34395,7 +34395,7 @@ } }, { - "accuracy": 0.9139467171932522, + "accuracy": 0.9116833347238993, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -34444,7 +34444,7 @@ } }, { - "accuracy": 0.9191947361748469, + "accuracy": 0.9171461439446399, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -34493,7 +34493,7 @@ } }, { - "accuracy": 0.9463203159209929, + "accuracy": 0.9448635415419152, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -34545,7 +34545,7 @@ } }, { - "accuracy": 0.9506043060437629, + "accuracy": 0.9492780825025157, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -34597,7 +34597,7 @@ } }, { - "accuracy": 0.9578127012048897, + "accuracy": 0.9566842045046782, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -34646,7 +34646,7 @@ } }, { - "accuracy": 0.9717582982817763, + "accuracy": 0.970905398557845, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -34689,7 +34689,7 @@ } }, { - "accuracy": 0.9741341132474574, + "accuracy": 0.9733821355590695, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -34732,7 +34732,7 @@ } }, { - "accuracy": 0.9726044535636902, + "accuracy": 0.9718781099899819, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -34784,7 +34784,7 @@ } }, { - "accuracy": 0.9759731725054351, + "accuracy": 0.975329595666967, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -34836,7 +34836,7 @@ } }, { - "accuracy": 0.9860195313629351, + "accuracy": 0.9856448168131081, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -34888,7 +34888,7 @@ } }, { - "accuracy": 0.9880003504160988, + "accuracy": 0.9876782780905303, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -34940,7 +34940,7 @@ } }, { - "accuracy": 0.9922685824628723, + "accuracy": 0.9920309527385, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -34983,7 +34983,7 @@ } }, { - "accuracy": 0.9928931627716673, + "accuracy": 0.992713971382105, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -35032,7 +35032,7 @@ } }, { - "accuracy": 0.9944244618037421, + "accuracy": 0.9942904448038653, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -35078,7 +35078,7 @@ } }, { - "accuracy": 0.9979018089238947, + "accuracy": 0.9978316737963867, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -35120,7 +35120,7 @@ ], "model.layers.18.self_attn": [ { - "accuracy": 0.944679098890016, + "accuracy": 0.943310114309976, "total_bits": 89665536, "q_proj": { "group_size": { @@ -35184,7 +35184,7 @@ } }, { - "accuracy": 0.9459297825631342, + "accuracy": 0.9448977424518058, "total_bits": 92221440, "q_proj": { "group_size": { @@ -35248,7 +35248,7 @@ } }, { - "accuracy": 0.9520549672214609, + "accuracy": 0.9515413716435432, "total_bits": 95758848, "q_proj": { "group_size": { @@ -35312,7 +35312,7 @@ } }, { - "accuracy": 0.9608107989555911, + "accuracy": 0.9606600841997486, "total_bits": 112272384, "q_proj": { "group_size": { @@ -35376,7 +35376,7 @@ } }, { - "accuracy": 0.9708268567919731, + "accuracy": 0.970376394983185, "total_bits": 132913152, "q_proj": { "group_size": { @@ -35440,7 +35440,7 @@ } }, { - "accuracy": 0.9717176989897301, + "accuracy": 0.9711237408612904, "total_bits": 132980224, "q_proj": { "group_size": { @@ -35504,7 +35504,7 @@ } }, { - "accuracy": 0.98101465982434, + "accuracy": 0.9810096360743046, "total_bits": 169613312, "q_proj": { "group_size": { @@ -35556,7 +35556,7 @@ } }, { - "accuracy": 0.9829624108970165, + "accuracy": 0.9826737414359262, "total_bits": 169745920, "q_proj": { "group_size": { @@ -35608,7 +35608,7 @@ } }, { - "accuracy": 0.9847109506004735, + "accuracy": 0.9843824844023115, "total_bits": 171195392, "q_proj": { "group_size": { @@ -35660,7 +35660,7 @@ } }, { - "accuracy": 0.9855133054385844, + "accuracy": 0.9850903986708114, "total_bits": 173563904, "q_proj": { "group_size": { @@ -35712,7 +35712,7 @@ } }, { - "accuracy": 0.985513468223967, + "accuracy": 0.9849474538901919, "total_bits": 174923264, "q_proj": { "group_size": { @@ -35776,7 +35776,7 @@ } }, { - "accuracy": 0.9865912228430572, + "accuracy": 0.9863323522241492, "total_bits": 175750144, "q_proj": { "group_size": { @@ -35840,7 +35840,7 @@ } }, { - "accuracy": 0.9881378567140353, + "accuracy": 0.9877792841411734, "total_bits": 179253248, "q_proj": { "group_size": { @@ -35901,7 +35901,7 @@ } }, { - "accuracy": 0.9892407095942058, + "accuracy": 0.9889967420481538, "total_bits": 181592064, "q_proj": { "group_size": { @@ -35962,7 +35962,7 @@ } }, { - "accuracy": 0.9931937235064412, + "accuracy": 0.9931674913356179, "total_bits": 220469248, "q_proj": { "group_size": { @@ -36023,7 +36023,7 @@ } }, { - "accuracy": 0.9946184422526705, + "accuracy": 0.9944592472901078, "total_bits": 223535104, "q_proj": { "group_size": { @@ -36084,7 +36084,7 @@ } }, { - "accuracy": 0.9949640307918584, + "accuracy": 0.9949289723054359, "total_bits": 253499392, "q_proj": { "group_size": { @@ -36136,7 +36136,7 @@ } }, { - "accuracy": 0.997180601128524, + "accuracy": 0.9971254911384007, "total_bits": 265838592, "q_proj": { "group_size": { @@ -36188,7 +36188,7 @@ } }, { - "accuracy": 0.998671550475257, + "accuracy": 0.9986348188371936, "total_bits": 337385472, "q_proj": { "group_size": { @@ -36242,7 +36242,7 @@ ], "model.layers.18.mlp": [ { - "accuracy": 0.8970098526854264, + "accuracy": 0.894507784200342, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -36294,7 +36294,7 @@ } }, { - "accuracy": 0.8999123836034223, + "accuracy": 0.8975494543188497, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -36346,7 +36346,7 @@ } }, { - "accuracy": 0.9161689344205355, + "accuracy": 0.9141937208018804, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -36395,7 +36395,7 @@ } }, { - "accuracy": 0.92110415469659, + "accuracy": 0.9192859716713428, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -36444,7 +36444,7 @@ } }, { - "accuracy": 0.9479836574510524, + "accuracy": 0.946719850952688, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -36496,7 +36496,7 @@ } }, { - "accuracy": 0.9520162071444487, + "accuracy": 0.9508802304534536, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -36548,7 +36548,7 @@ } }, { - "accuracy": 0.9589175909365478, + "accuracy": 0.957965798479946, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -36597,7 +36597,7 @@ } }, { - "accuracy": 0.9727460684156731, + "accuracy": 0.9721023386442348, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -36640,7 +36640,7 @@ } }, { - "accuracy": 0.975048723973726, + "accuracy": 0.9744422504384267, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -36683,7 +36683,7 @@ } }, { - "accuracy": 0.9734402780274027, + "accuracy": 0.972826591349746, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -36735,7 +36735,7 @@ } }, { - "accuracy": 0.9766593272552678, + "accuracy": 0.9761150616564249, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -36787,7 +36787,7 @@ } }, { - "accuracy": 0.9864444859129818, + "accuracy": 0.9861342734412143, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -36839,7 +36839,7 @@ } }, { - "accuracy": 0.9883504523160426, + "accuracy": 0.9880751027774654, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -36891,7 +36891,7 @@ } }, { - "accuracy": 0.9925792593214857, + "accuracy": 0.9924034999291363, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -36934,7 +36934,7 @@ } }, { - "accuracy": 0.993109734459339, + "accuracy": 0.9929501866725715, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -36983,7 +36983,7 @@ } }, { - "accuracy": 0.9945747746693853, + "accuracy": 0.9944524330479142, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -37029,7 +37029,7 @@ } }, { - "accuracy": 0.9980140442310489, + "accuracy": 0.997967757872845, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -37071,7 +37071,7 @@ ], "model.layers.19.self_attn": [ { - "accuracy": 0.9364683416328932, + "accuracy": 0.9375736338919715, "total_bits": 89665536, "q_proj": { "group_size": { @@ -37135,7 +37135,7 @@ } }, { - "accuracy": 0.937541129361642, + "accuracy": 0.9414192912609953, "total_bits": 92221440, "q_proj": { "group_size": { @@ -37199,7 +37199,7 @@ } }, { - "accuracy": 0.952069035682239, + "accuracy": 0.9517732123403173, "total_bits": 95758848, "q_proj": { "group_size": { @@ -37263,7 +37263,7 @@ } }, { - "accuracy": 0.9595744211814905, + "accuracy": 0.9592566405864138, "total_bits": 112272384, "q_proj": { "group_size": { @@ -37327,7 +37327,7 @@ } }, { - "accuracy": 0.9687561481995018, + "accuracy": 0.9690645596894779, "total_bits": 132913152, "q_proj": { "group_size": { @@ -37391,7 +37391,7 @@ } }, { - "accuracy": 0.9686989930311316, + "accuracy": 0.9705432502454833, "total_bits": 132980224, "q_proj": { "group_size": { @@ -37455,7 +37455,7 @@ } }, { - "accuracy": 0.9803080115663377, + "accuracy": 0.9805190916124144, "total_bits": 169613312, "q_proj": { "group_size": { @@ -37507,7 +37507,7 @@ } }, { - "accuracy": 0.9812779256975964, + "accuracy": 0.982061336797319, "total_bits": 169745920, "q_proj": { "group_size": { @@ -37559,7 +37559,7 @@ } }, { - "accuracy": 0.9832362165968669, + "accuracy": 0.9830760724450412, "total_bits": 171195392, "q_proj": { "group_size": { @@ -37611,7 +37611,7 @@ } }, { - "accuracy": 0.9838342070579529, + "accuracy": 0.9835898218382346, "total_bits": 173563904, "q_proj": { "group_size": { @@ -37663,7 +37663,7 @@ } }, { - "accuracy": 0.9850963244312688, + "accuracy": 0.9841921619678798, "total_bits": 174923264, "q_proj": { "group_size": { @@ -37727,7 +37727,7 @@ } }, { - "accuracy": 0.9861754535354281, + "accuracy": 0.985681646846627, "total_bits": 175750144, "q_proj": { "group_size": { @@ -37791,7 +37791,7 @@ } }, { - "accuracy": 0.9877318652640832, + "accuracy": 0.9878430095942397, "total_bits": 179253248, "q_proj": { "group_size": { @@ -37852,7 +37852,7 @@ } }, { - "accuracy": 0.9891782319663387, + "accuracy": 0.9889410907206567, "total_bits": 181592064, "q_proj": { "group_size": { @@ -37913,7 +37913,7 @@ } }, { - "accuracy": 0.9932431398253692, + "accuracy": 0.9932514944260842, "total_bits": 220469248, "q_proj": { "group_size": { @@ -37974,7 +37974,7 @@ } }, { - "accuracy": 0.9945197904139365, + "accuracy": 0.9944913612531596, "total_bits": 223535104, "q_proj": { "group_size": { @@ -38035,7 +38035,7 @@ } }, { - "accuracy": 0.9947800697072556, + "accuracy": 0.9948054097690865, "total_bits": 253499392, "q_proj": { "group_size": { @@ -38087,7 +38087,7 @@ } }, { - "accuracy": 0.9973581694434152, + "accuracy": 0.9972530012509149, "total_bits": 265838592, "q_proj": { "group_size": { @@ -38139,7 +38139,7 @@ } }, { - "accuracy": 0.9985358212388268, + "accuracy": 0.9986483938992023, "total_bits": 337385472, "q_proj": { "group_size": { @@ -38193,7 +38193,7 @@ ], "model.layers.19.mlp": [ { - "accuracy": 0.8980615833087972, + "accuracy": 0.8960867171224794, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -38245,7 +38245,7 @@ } }, { - "accuracy": 0.9009356992809396, + "accuracy": 0.8990460477377239, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -38297,7 +38297,7 @@ } }, { - "accuracy": 0.9165768239058947, + "accuracy": 0.9149506241083145, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -38346,7 +38346,7 @@ } }, { - "accuracy": 0.921308162181001, + "accuracy": 0.9197891656505435, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -38395,7 +38395,7 @@ } }, { - "accuracy": 0.9484429731965065, + "accuracy": 0.9474612980296737, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -38447,7 +38447,7 @@ } }, { - "accuracy": 0.9524440102671322, + "accuracy": 0.951546344317888, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -38499,7 +38499,7 @@ } }, { - "accuracy": 0.9591568880959561, + "accuracy": 0.9583676826012761, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -38548,7 +38548,7 @@ } }, { - "accuracy": 0.9730544243203966, + "accuracy": 0.9725158324367121, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -38591,7 +38591,7 @@ } }, { - "accuracy": 0.9753118498544944, + "accuracy": 0.9748119428557785, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -38634,7 +38634,7 @@ } }, { - "accuracy": 0.9737463932680456, + "accuracy": 0.9732538532269629, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -38686,7 +38686,7 @@ } }, { - "accuracy": 0.9769195020198822, + "accuracy": 0.9764791208466417, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -38738,7 +38738,7 @@ } }, { - "accuracy": 0.9866309956598439, + "accuracy": 0.986385085570969, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -38790,7 +38790,7 @@ } }, { - "accuracy": 0.988479770867056, + "accuracy": 0.9882593198532337, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -38842,7 +38842,7 @@ } }, { - "accuracy": 0.9926495073657287, + "accuracy": 0.9925084857907343, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -38885,7 +38885,7 @@ } }, { - "accuracy": 0.9932103572462342, + "accuracy": 0.9930890148848688, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -38934,7 +38934,7 @@ } }, { - "accuracy": 0.9945620700569922, + "accuracy": 0.9944711444458287, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -38980,7 +38980,7 @@ } }, { - "accuracy": 0.9980197638812426, + "accuracy": 0.9979916896585277, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -39022,7 +39022,7 @@ ], "model.layers.20.self_attn": [ { - "accuracy": 0.9456599739037062, + "accuracy": 0.9435877400009256, "total_bits": 89665536, "q_proj": { "group_size": { @@ -39086,7 +39086,7 @@ } }, { - "accuracy": 0.9499139334810407, + "accuracy": 0.9485910232914121, "total_bits": 92221440, "q_proj": { "group_size": { @@ -39150,7 +39150,7 @@ } }, { - "accuracy": 0.9577709381517611, + "accuracy": 0.956550940283035, "total_bits": 95758848, "q_proj": { "group_size": { @@ -39214,7 +39214,7 @@ } }, { - "accuracy": 0.9656849503517151, + "accuracy": 0.9642738518550208, "total_bits": 112272384, "q_proj": { "group_size": { @@ -39278,7 +39278,7 @@ } }, { - "accuracy": 0.9727934887142557, + "accuracy": 0.9709541991745171, "total_bits": 132913152, "q_proj": { "group_size": { @@ -39342,7 +39342,7 @@ } }, { - "accuracy": 0.9741284222783226, + "accuracy": 0.9702305055566525, "total_bits": 132980224, "q_proj": { "group_size": { @@ -39406,7 +39406,7 @@ } }, { - "accuracy": 0.9827874374919032, + "accuracy": 0.9824008194631652, "total_bits": 169613312, "q_proj": { "group_size": { @@ -39458,7 +39458,7 @@ } }, { - "accuracy": 0.9835851979687026, + "accuracy": 0.9836366925094473, "total_bits": 169745920, "q_proj": { "group_size": { @@ -39510,7 +39510,7 @@ } }, { - "accuracy": 0.9848906841423166, + "accuracy": 0.9847757934935784, "total_bits": 171195392, "q_proj": { "group_size": { @@ -39562,7 +39562,7 @@ } }, { - "accuracy": 0.9854848172123495, + "accuracy": 0.9854541409662679, "total_bits": 173563904, "q_proj": { "group_size": { @@ -39614,7 +39614,7 @@ } }, { - "accuracy": 0.9863186550669765, + "accuracy": 0.9856162233964393, "total_bits": 174923264, "q_proj": { "group_size": { @@ -39678,7 +39678,7 @@ } }, { - "accuracy": 0.9871017961811862, + "accuracy": 0.9865585688109461, "total_bits": 175750144, "q_proj": { "group_size": { @@ -39742,7 +39742,7 @@ } }, { - "accuracy": 0.9887673406322536, + "accuracy": 0.9889720883220434, "total_bits": 179253248, "q_proj": { "group_size": { @@ -39803,7 +39803,7 @@ } }, { - "accuracy": 0.989858863581168, + "accuracy": 0.9896417369477843, "total_bits": 181592064, "q_proj": { "group_size": { @@ -39864,7 +39864,7 @@ } }, { - "accuracy": 0.9939803180382832, + "accuracy": 0.9939340469182322, "total_bits": 220469248, "q_proj": { "group_size": { @@ -39925,7 +39925,7 @@ } }, { - "accuracy": 0.994980818395944, + "accuracy": 0.9949456907710746, "total_bits": 223535104, "q_proj": { "group_size": { @@ -39986,7 +39986,7 @@ } }, { - "accuracy": 0.9954565378445152, + "accuracy": 0.9953771252185106, "total_bits": 253499392, "q_proj": { "group_size": { @@ -40038,7 +40038,7 @@ } }, { - "accuracy": 0.9974236983781386, + "accuracy": 0.9974170139083933, "total_bits": 265838592, "q_proj": { "group_size": { @@ -40090,7 +40090,7 @@ } }, { - "accuracy": 0.9987701006772879, + "accuracy": 0.9987709914934576, "total_bits": 337385472, "q_proj": { "group_size": { @@ -40144,7 +40144,7 @@ ], "model.layers.20.mlp": [ { - "accuracy": 0.8978180238290837, + "accuracy": 0.895766867226676, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -40196,7 +40196,7 @@ } }, { - "accuracy": 0.900672363607507, + "accuracy": 0.8986942889659029, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -40248,7 +40248,7 @@ } }, { - "accuracy": 0.9160739728494695, + "accuracy": 0.9144114428444913, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -40297,7 +40297,7 @@ } }, { - "accuracy": 0.9207519234011048, + "accuracy": 0.9191970311497387, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -40346,7 +40346,7 @@ } }, { - "accuracy": 0.9482300381519293, + "accuracy": 0.9472399067721868, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -40398,7 +40398,7 @@ } }, { - "accuracy": 0.9522090291506365, + "accuracy": 0.9512919036573485, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -40450,7 +40450,7 @@ } }, { - "accuracy": 0.95883785384266, + "accuracy": 0.9580320135543221, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -40499,7 +40499,7 @@ } }, { - "accuracy": 0.9729592668774881, + "accuracy": 0.9724049227018106, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -40542,7 +40542,7 @@ } }, { - "accuracy": 0.9752475502655694, + "accuracy": 0.9747301859683112, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -40585,7 +40585,7 @@ } }, { - "accuracy": 0.9736431969427749, + "accuracy": 0.9731197307180417, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -40637,7 +40637,7 @@ } }, { - "accuracy": 0.9768064513214325, + "accuracy": 0.9763581153789633, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -40689,7 +40689,7 @@ } }, { - "accuracy": 0.9865877127372905, + "accuracy": 0.9863181849451441, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -40741,7 +40741,7 @@ } }, { - "accuracy": 0.9884394063173156, + "accuracy": 0.988217502195192, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -40793,7 +40793,7 @@ } }, { - "accuracy": 0.9926875439031344, + "accuracy": 0.992531660821681, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -40836,7 +40836,7 @@ } }, { - "accuracy": 0.9931928325248393, + "accuracy": 0.9930589289992655, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -40885,7 +40885,7 @@ } }, { - "accuracy": 0.9945414953031823, + "accuracy": 0.9944312759724102, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -40931,7 +40931,7 @@ } }, { - "accuracy": 0.9980519142822901, + "accuracy": 0.998009445985142, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -40973,7 +40973,7 @@ ], "model.layers.21.self_attn": [ { - "accuracy": 0.943290374977024, + "accuracy": 0.9420277384158812, "total_bits": 89665536, "q_proj": { "group_size": { @@ -41037,7 +41037,7 @@ } }, { - "accuracy": 0.9442870756121058, + "accuracy": 0.9456555888448891, "total_bits": 92221440, "q_proj": { "group_size": { @@ -41101,7 +41101,7 @@ } }, { - "accuracy": 0.9540135823190212, + "accuracy": 0.9538629990267127, "total_bits": 95758848, "q_proj": { "group_size": { @@ -41165,7 +41165,7 @@ } }, { - "accuracy": 0.961515402911525, + "accuracy": 0.961220733919426, "total_bits": 112272384, "q_proj": { "group_size": { @@ -41229,7 +41229,7 @@ } }, { - "accuracy": 0.9716752127401138, + "accuracy": 0.9696297934769016, "total_bits": 132913152, "q_proj": { "group_size": { @@ -41293,7 +41293,7 @@ } }, { - "accuracy": 0.9726082062054622, + "accuracy": 0.9719750868450654, "total_bits": 132980224, "q_proj": { "group_size": { @@ -41357,7 +41357,7 @@ } }, { - "accuracy": 0.9816643315318384, + "accuracy": 0.9807460449243847, "total_bits": 169613312, "q_proj": { "group_size": { @@ -41409,7 +41409,7 @@ } }, { - "accuracy": 0.9828882980111399, + "accuracy": 0.9828114246851519, "total_bits": 169745920, "q_proj": { "group_size": { @@ -41461,7 +41461,7 @@ } }, { - "accuracy": 0.9843922909349203, + "accuracy": 0.9842102797701955, "total_bits": 171195392, "q_proj": { "group_size": { @@ -41513,7 +41513,7 @@ } }, { - "accuracy": 0.9853111440806013, + "accuracy": 0.9849744904296178, "total_bits": 173563904, "q_proj": { "group_size": { @@ -41565,7 +41565,7 @@ } }, { - "accuracy": 0.9859785958634395, + "accuracy": 0.9858172050628223, "total_bits": 174923264, "q_proj": { "group_size": { @@ -41629,7 +41629,7 @@ } }, { - "accuracy": 0.9874009760096669, + "accuracy": 0.9864245926667201, "total_bits": 175750144, "q_proj": { "group_size": { @@ -41693,7 +41693,7 @@ } }, { - "accuracy": 0.9888895048122657, + "accuracy": 0.9885201539942309, "total_bits": 179253248, "q_proj": { "group_size": { @@ -41754,7 +41754,7 @@ } }, { - "accuracy": 0.9897628650069237, + "accuracy": 0.9895346878390563, "total_bits": 181592064, "q_proj": { "group_size": { @@ -41815,7 +41815,7 @@ } }, { - "accuracy": 0.9937504156933803, + "accuracy": 0.9936270043498984, "total_bits": 220469248, "q_proj": { "group_size": { @@ -41876,7 +41876,7 @@ } }, { - "accuracy": 0.9948289826218235, + "accuracy": 0.9947388439904898, "total_bits": 223535104, "q_proj": { "group_size": { @@ -41937,7 +41937,7 @@ } }, { - "accuracy": 0.9952522633156102, + "accuracy": 0.9950738154155644, "total_bits": 253499392, "q_proj": { "group_size": { @@ -41989,7 +41989,7 @@ } }, { - "accuracy": 0.9973617855361417, + "accuracy": 0.9972621887971304, "total_bits": 265838592, "q_proj": { "group_size": { @@ -42041,7 +42041,7 @@ } }, { - "accuracy": 0.9987096890353745, + "accuracy": 0.998694771447366, "total_bits": 337385472, "q_proj": { "group_size": { @@ -42095,7 +42095,7 @@ ], "model.layers.21.mlp": [ { - "accuracy": 0.900033059873079, + "accuracy": 0.8990929977674234, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -42147,7 +42147,7 @@ } }, { - "accuracy": 0.9028220313944315, + "accuracy": 0.9019180465685694, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -42199,7 +42199,7 @@ } }, { - "accuracy": 0.9174610219503704, + "accuracy": 0.916651896348125, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -42248,7 +42248,7 @@ } }, { - "accuracy": 0.921907190429537, + "accuracy": 0.9211636173881983, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -42297,7 +42297,7 @@ } }, { - "accuracy": 0.9492629525300703, + "accuracy": 0.9488103523066169, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -42349,7 +42349,7 @@ } }, { - "accuracy": 0.9532178275679287, + "accuracy": 0.952797536395098, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -42401,7 +42401,7 @@ } }, { - "accuracy": 0.9595388550507395, + "accuracy": 0.9591599926352501, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -42450,7 +42450,7 @@ } }, { - "accuracy": 0.9734023863351658, + "accuracy": 0.9731287360191345, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -42493,7 +42493,7 @@ } }, { - "accuracy": 0.9756884238633671, + "accuracy": 0.9754459900095275, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -42536,7 +42536,7 @@ } }, { - "accuracy": 0.9741525029469478, + "accuracy": 0.9739109943375776, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -42588,7 +42588,7 @@ } }, { - "accuracy": 0.9772716391047365, + "accuracy": 0.9770683767764192, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -42640,7 +42640,7 @@ } }, { - "accuracy": 0.9868358307469048, + "accuracy": 0.9867116271175052, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -42692,7 +42692,7 @@ } }, { - "accuracy": 0.988659804735921, + "accuracy": 0.9885575552225897, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -42744,7 +42744,7 @@ } }, { - "accuracy": 0.9927609564099265, + "accuracy": 0.9926810887838272, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -42787,7 +42787,7 @@ } }, { - "accuracy": 0.9933187552041521, + "accuracy": 0.993269080957888, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -42836,7 +42836,7 @@ } }, { - "accuracy": 0.9945921363112958, + "accuracy": 0.9945573769264707, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -42882,7 +42882,7 @@ } }, { - "accuracy": 0.9980380719858467, + "accuracy": 0.9980157566269076, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -42924,7 +42924,7 @@ ], "model.layers.22.self_attn": [ { - "accuracy": 0.9482472782072268, + "accuracy": 0.9483878267438788, "total_bits": 89665536, "q_proj": { "group_size": { @@ -42988,7 +42988,7 @@ } }, { - "accuracy": 0.950189836911465, + "accuracy": 0.950051539038357, "total_bits": 92221440, "q_proj": { "group_size": { @@ -43052,7 +43052,7 @@ } }, { - "accuracy": 0.9575777963588112, + "accuracy": 0.9589273040427974, "total_bits": 95758848, "q_proj": { "group_size": { @@ -43116,7 +43116,7 @@ } }, { - "accuracy": 0.9652416374730437, + "accuracy": 0.9665476064148703, "total_bits": 112272384, "q_proj": { "group_size": { @@ -43180,7 +43180,7 @@ } }, { - "accuracy": 0.9735469243636257, + "accuracy": 0.9736002350324079, "total_bits": 132913152, "q_proj": { "group_size": { @@ -43244,7 +43244,7 @@ } }, { - "accuracy": 0.9749776401409977, + "accuracy": 0.9743315569664303, "total_bits": 132980224, "q_proj": { "group_size": { @@ -43308,7 +43308,7 @@ } }, { - "accuracy": 0.9826735066446034, + "accuracy": 0.9826373034892114, "total_bits": 169613312, "q_proj": { "group_size": { @@ -43360,7 +43360,7 @@ } }, { - "accuracy": 0.9843419476559288, + "accuracy": 0.9836759566280403, "total_bits": 169745920, "q_proj": { "group_size": { @@ -43412,7 +43412,7 @@ } }, { - "accuracy": 0.9853213757864738, + "accuracy": 0.9850599610883939, "total_bits": 171195392, "q_proj": { "group_size": { @@ -43464,7 +43464,7 @@ } }, { - "accuracy": 0.9860507576775394, + "accuracy": 0.9856724616532263, "total_bits": 173563904, "q_proj": { "group_size": { @@ -43516,7 +43516,7 @@ } }, { - "accuracy": 0.9872009936524065, + "accuracy": 0.9872184336969727, "total_bits": 174923264, "q_proj": { "group_size": { @@ -43580,7 +43580,7 @@ } }, { - "accuracy": 0.9880094823770618, + "accuracy": 0.9880351385493812, "total_bits": 175750144, "q_proj": { "group_size": { @@ -43644,7 +43644,7 @@ } }, { - "accuracy": 0.9894334337625065, + "accuracy": 0.9895875001767356, "total_bits": 179253248, "q_proj": { "group_size": { @@ -43705,7 +43705,7 @@ } }, { - "accuracy": 0.9903135126652686, + "accuracy": 0.9902975041615335, "total_bits": 181592064, "q_proj": { "group_size": { @@ -43766,7 +43766,7 @@ } }, { - "accuracy": 0.9940307795462248, + "accuracy": 0.993927537292046, "total_bits": 220469248, "q_proj": { "group_size": { @@ -43827,7 +43827,7 @@ } }, { - "accuracy": 0.995157766082373, + "accuracy": 0.9952111643077316, "total_bits": 223535104, "q_proj": { "group_size": { @@ -43888,7 +43888,7 @@ } }, { - "accuracy": 0.9954051792278493, + "accuracy": 0.9952434224909857, "total_bits": 253499392, "q_proj": { "group_size": { @@ -43940,7 +43940,7 @@ } }, { - "accuracy": 0.9974537637256282, + "accuracy": 0.9975120271494808, "total_bits": 265838592, "q_proj": { "group_size": { @@ -43992,7 +43992,7 @@ } }, { - "accuracy": 0.9987865218733388, + "accuracy": 0.9987522705985037, "total_bits": 337385472, "q_proj": { "group_size": { @@ -44046,7 +44046,7 @@ ], "model.layers.22.mlp": [ { - "accuracy": 0.9032199096522833, + "accuracy": 0.9028125315120346, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -44098,7 +44098,7 @@ } }, { - "accuracy": 0.9058257737442067, + "accuracy": 0.9054452753380725, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -44150,7 +44150,7 @@ } }, { - "accuracy": 0.9196835348480626, + "accuracy": 0.919369173873412, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -44199,7 +44199,7 @@ } }, { - "accuracy": 0.9238896854221821, + "accuracy": 0.9235992423797909, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -44248,7 +44248,7 @@ } }, { - "accuracy": 0.9508502669632435, + "accuracy": 0.9507327850319838, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -44300,7 +44300,7 @@ } }, { - "accuracy": 0.9546151335694288, + "accuracy": 0.9544903551669497, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -44352,7 +44352,7 @@ } }, { - "accuracy": 0.96060287305399, + "accuracy": 0.9604763614111825, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -44401,7 +44401,7 @@ } }, { - "accuracy": 0.9744124748793087, + "accuracy": 0.9743305625099885, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -44444,7 +44444,7 @@ } }, { - "accuracy": 0.9765731334490212, + "accuracy": 0.9764831513166428, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -44487,7 +44487,7 @@ } }, { - "accuracy": 0.9750015945418885, + "accuracy": 0.9749472121659079, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -44539,7 +44539,7 @@ } }, { - "accuracy": 0.9779893053989661, + "accuracy": 0.9779386792920137, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -44591,7 +44591,7 @@ } }, { - "accuracy": 0.9872960305135501, + "accuracy": 0.9872766987567669, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -44643,7 +44643,7 @@ } }, { - "accuracy": 0.9890378019527385, + "accuracy": 0.9890139062251699, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -44695,7 +44695,7 @@ } }, { - "accuracy": 0.9931023369151118, + "accuracy": 0.9930777715666121, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -44738,7 +44738,7 @@ } }, { - "accuracy": 0.993546063276498, + "accuracy": 0.9935381057623186, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -44787,7 +44787,7 @@ } }, { - "accuracy": 0.994731132039114, + "accuracy": 0.9947241955485783, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -44833,7 +44833,7 @@ } }, { - "accuracy": 0.9981478130763495, + "accuracy": 0.9981337333845562, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -44875,7 +44875,7 @@ ], "model.layers.23.self_attn": [ { - "accuracy": 0.9510137515240594, + "accuracy": 0.9502481190781844, "total_bits": 89665536, "q_proj": { "group_size": { @@ -44939,7 +44939,7 @@ } }, { - "accuracy": 0.9526072450374302, + "accuracy": 0.9530709889766417, "total_bits": 92221440, "q_proj": { "group_size": { @@ -45003,7 +45003,7 @@ } }, { - "accuracy": 0.962001116064034, + "accuracy": 0.9612796043879107, "total_bits": 95758848, "q_proj": { "group_size": { @@ -45067,7 +45067,7 @@ } }, { - "accuracy": 0.9682537217281366, + "accuracy": 0.9672535549065, "total_bits": 112272384, "q_proj": { "group_size": { @@ -45131,7 +45131,7 @@ } }, { - "accuracy": 0.975260864747198, + "accuracy": 0.9746645238054427, "total_bits": 132913152, "q_proj": { "group_size": { @@ -45195,7 +45195,7 @@ } }, { - "accuracy": 0.9763250603879753, + "accuracy": 0.9754390449900376, "total_bits": 132980224, "q_proj": { "group_size": { @@ -45259,7 +45259,7 @@ } }, { - "accuracy": 0.9837328454871711, + "accuracy": 0.9838630994291682, "total_bits": 169613312, "q_proj": { "group_size": { @@ -45311,7 +45311,7 @@ } }, { - "accuracy": 0.9847811820769781, + "accuracy": 0.9843490204136622, "total_bits": 169745920, "q_proj": { "group_size": { @@ -45363,7 +45363,7 @@ } }, { - "accuracy": 0.9861498307436705, + "accuracy": 0.9865377572806258, "total_bits": 171195392, "q_proj": { "group_size": { @@ -45415,7 +45415,7 @@ } }, { - "accuracy": 0.9866779337784177, + "accuracy": 0.9868896327618706, "total_bits": 173563904, "q_proj": { "group_size": { @@ -45467,7 +45467,7 @@ } }, { - "accuracy": 0.9873121254832337, + "accuracy": 0.987329784094503, "total_bits": 174923264, "q_proj": { "group_size": { @@ -45531,7 +45531,7 @@ } }, { - "accuracy": 0.9884528629971963, + "accuracy": 0.9882270813870587, "total_bits": 175750144, "q_proj": { "group_size": { @@ -45595,7 +45595,7 @@ } }, { - "accuracy": 0.9903055085359436, + "accuracy": 0.9903721029282009, "total_bits": 179253248, "q_proj": { "group_size": { @@ -45656,7 +45656,7 @@ } }, { - "accuracy": 0.9911426249156264, + "accuracy": 0.9912103865001547, "total_bits": 181592064, "q_proj": { "group_size": { @@ -45717,7 +45717,7 @@ } }, { - "accuracy": 0.9945278980181014, + "accuracy": 0.9946270031168273, "total_bits": 220469248, "q_proj": { "group_size": { @@ -45778,7 +45778,7 @@ } }, { - "accuracy": 0.9955299621521446, + "accuracy": 0.995528266152465, "total_bits": 223535104, "q_proj": { "group_size": { @@ -45839,7 +45839,7 @@ } }, { - "accuracy": 0.995648593862394, + "accuracy": 0.9956167150215295, "total_bits": 253499392, "q_proj": { "group_size": { @@ -45891,7 +45891,7 @@ } }, { - "accuracy": 0.9977277301153854, + "accuracy": 0.9978099523884195, "total_bits": 265838592, "q_proj": { "group_size": { @@ -45943,7 +45943,7 @@ } }, { - "accuracy": 0.9988459613186454, + "accuracy": 0.998819023677099, "total_bits": 337385472, "q_proj": { "group_size": { @@ -45997,7 +45997,7 @@ ], "model.layers.23.mlp": [ { - "accuracy": 0.9051217401498243, + "accuracy": 0.9056100531628257, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -46049,7 +46049,7 @@ } }, { - "accuracy": 0.9076284581893369, + "accuracy": 0.9081501286280782, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -46101,7 +46101,7 @@ } }, { - "accuracy": 0.920641915970727, + "accuracy": 0.9210308960785991, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -46150,7 +46150,7 @@ } }, { - "accuracy": 0.9245966819948271, + "accuracy": 0.9249813648823061, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -46199,7 +46199,7 @@ } }, { - "accuracy": 0.9517227221084268, + "accuracy": 0.952037826376526, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -46251,7 +46251,7 @@ } }, { - "accuracy": 0.9554342553019524, + "accuracy": 0.9556936813812507, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -46303,7 +46303,7 @@ } }, { - "accuracy": 0.9610833873678195, + "accuracy": 0.9612869417392894, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -46352,7 +46352,7 @@ } }, { - "accuracy": 0.9748941076625335, + "accuracy": 0.9750148592222678, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -46395,7 +46395,7 @@ } }, { - "accuracy": 0.9770096644367042, + "accuracy": 0.9771057201647445, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -46438,7 +46438,7 @@ } }, { - "accuracy": 0.9754382005255473, + "accuracy": 0.9756095285870527, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -46490,7 +46490,7 @@ } }, { - "accuracy": 0.9783839506930426, + "accuracy": 0.9785108163364624, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -46542,7 +46542,7 @@ } }, { - "accuracy": 0.9875168682223088, + "accuracy": 0.9876114163351687, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -46594,7 +46594,7 @@ } }, { - "accuracy": 0.9892356215338958, + "accuracy": 0.9893002010587799, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -46646,7 +46646,7 @@ } }, { - "accuracy": 0.9932197156166168, + "accuracy": 0.993260216237487, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -46689,7 +46689,7 @@ } }, { - "accuracy": 0.993658114959927, + "accuracy": 0.9937104818068052, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -46738,7 +46738,7 @@ } }, { - "accuracy": 0.9947657026105413, + "accuracy": 0.9948111176245699, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -46784,7 +46784,7 @@ } }, { - "accuracy": 0.998167707266188, + "accuracy": 0.9981725445924032, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -46826,7 +46826,7 @@ ], "model.layers.24.self_attn": [ { - "accuracy": 0.9498151215283495, + "accuracy": 0.9487879560574105, "total_bits": 89665536, "q_proj": { "group_size": { @@ -46890,7 +46890,7 @@ } }, { - "accuracy": 0.9512326399746694, + "accuracy": 0.9516484009984293, "total_bits": 92221440, "q_proj": { "group_size": { @@ -46954,7 +46954,7 @@ } }, { - "accuracy": 0.959779762908032, + "accuracy": 0.9600290020829753, "total_bits": 95758848, "q_proj": { "group_size": { @@ -47018,7 +47018,7 @@ } }, { - "accuracy": 0.9666704037471822, + "accuracy": 0.9665687635148826, "total_bits": 112272384, "q_proj": { "group_size": { @@ -47082,7 +47082,7 @@ } }, { - "accuracy": 0.9743388493202234, + "accuracy": 0.9737422511373696, "total_bits": 132913152, "q_proj": { "group_size": { @@ -47146,7 +47146,7 @@ } }, { - "accuracy": 0.974842529449808, + "accuracy": 0.9744793577609878, "total_bits": 132980224, "q_proj": { "group_size": { @@ -47210,7 +47210,7 @@ } }, { - "accuracy": 0.9832458566188028, + "accuracy": 0.9829583209204046, "total_bits": 169613312, "q_proj": { "group_size": { @@ -47262,7 +47262,7 @@ } }, { - "accuracy": 0.9839273462758252, + "accuracy": 0.9839565247591389, "total_bits": 169745920, "q_proj": { "group_size": { @@ -47314,7 +47314,7 @@ } }, { - "accuracy": 0.9853346122330741, + "accuracy": 0.9854759321499028, "total_bits": 171195392, "q_proj": { "group_size": { @@ -47366,7 +47366,7 @@ } }, { - "accuracy": 0.9860211665693083, + "accuracy": 0.9861636403948069, "total_bits": 173563904, "q_proj": { "group_size": { @@ -47418,7 +47418,7 @@ } }, { - "accuracy": 0.986713446921816, + "accuracy": 0.986473196823346, "total_bits": 174923264, "q_proj": { "group_size": { @@ -47482,7 +47482,7 @@ } }, { - "accuracy": 0.9875483970696989, + "accuracy": 0.987540786644738, "total_bits": 175750144, "q_proj": { "group_size": { @@ -47546,7 +47546,7 @@ } }, { - "accuracy": 0.9896109450706526, + "accuracy": 0.9897486916498134, "total_bits": 179253248, "q_proj": { "group_size": { @@ -47607,7 +47607,7 @@ } }, { - "accuracy": 0.9903714658790513, + "accuracy": 0.9906450642615949, "total_bits": 181592064, "q_proj": { "group_size": { @@ -47668,7 +47668,7 @@ } }, { - "accuracy": 0.9941248118779377, + "accuracy": 0.9941419730649182, "total_bits": 220469248, "q_proj": { "group_size": { @@ -47729,7 +47729,7 @@ } }, { - "accuracy": 0.9951638817591103, + "accuracy": 0.9952516833344769, "total_bits": 223535104, "q_proj": { "group_size": { @@ -47790,7 +47790,7 @@ } }, { - "accuracy": 0.9953079977023759, + "accuracy": 0.9952554055734685, "total_bits": 253499392, "q_proj": { "group_size": { @@ -47842,7 +47842,7 @@ } }, { - "accuracy": 0.9974803455222986, + "accuracy": 0.9976206048894184, "total_bits": 265838592, "q_proj": { "group_size": { @@ -47894,7 +47894,7 @@ } }, { - "accuracy": 0.9987719079455066, + "accuracy": 0.9987729074690785, "total_bits": 337385472, "q_proj": { "group_size": { @@ -47948,7 +47948,7 @@ ], "model.layers.24.mlp": [ { - "accuracy": 0.9065527861055575, + "accuracy": 0.9074203732766604, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -48000,7 +48000,7 @@ } }, { - "accuracy": 0.9090194172765079, + "accuracy": 0.9099162860136283, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -48052,7 +48052,7 @@ } }, { - "accuracy": 0.921401963226105, + "accuracy": 0.9221326544096595, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -48101,7 +48101,7 @@ } }, { - "accuracy": 0.9252098663464973, + "accuracy": 0.9259051535474627, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -48150,7 +48150,7 @@ } }, { - "accuracy": 0.9523959267688424, + "accuracy": 0.9529018374650102, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -48202,7 +48202,7 @@ } }, { - "accuracy": 0.9560554023636014, + "accuracy": 0.9564938207990245, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -48254,7 +48254,7 @@ } }, { - "accuracy": 0.9614702226888192, + "accuracy": 0.9618294633140689, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -48303,7 +48303,7 @@ } }, { - "accuracy": 0.9752316442563346, + "accuracy": 0.975474656412476, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -48346,7 +48346,7 @@ } }, { - "accuracy": 0.977322325992741, + "accuracy": 0.9775249346306449, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -48389,7 +48389,7 @@ } }, { - "accuracy": 0.9757761364116481, + "accuracy": 0.9760482674954754, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -48441,7 +48441,7 @@ } }, { - "accuracy": 0.9786714775193679, + "accuracy": 0.9789021798458538, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -48493,7 +48493,7 @@ } }, { - "accuracy": 0.9876941558169691, + "accuracy": 0.9878299575985262, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -48545,7 +48545,7 @@ } }, { - "accuracy": 0.9893774361790795, + "accuracy": 0.9894889078446125, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -48597,7 +48597,7 @@ } }, { - "accuracy": 0.9933127998374403, + "accuracy": 0.9933787360787392, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -48640,7 +48640,7 @@ } }, { - "accuracy": 0.9937457350621882, + "accuracy": 0.993808017577976, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -48689,7 +48689,7 @@ } }, { - "accuracy": 0.994800708464984, + "accuracy": 0.9948495488221708, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -48735,7 +48735,7 @@ } }, { - "accuracy": 0.9981878133625478, + "accuracy": 0.9981965286546925, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -48777,7 +48777,7 @@ ], "model.layers.25.self_attn": [ { - "accuracy": 0.9488158669126661, + "accuracy": 0.9458470319054628, "total_bits": 89665536, "q_proj": { "group_size": { @@ -48841,7 +48841,7 @@ } }, { - "accuracy": 0.9511049050641687, + "accuracy": 0.9474324309512189, "total_bits": 92221440, "q_proj": { "group_size": { @@ -48905,7 +48905,7 @@ } }, { - "accuracy": 0.9583402054482385, + "accuracy": 0.9589221412806135, "total_bits": 95758848, "q_proj": { "group_size": { @@ -48969,7 +48969,7 @@ } }, { - "accuracy": 0.9648275051854158, + "accuracy": 0.9649457796231696, "total_bits": 112272384, "q_proj": { "group_size": { @@ -49033,7 +49033,7 @@ } }, { - "accuracy": 0.9729314623890739, + "accuracy": 0.971886742565977, "total_bits": 132913152, "q_proj": { "group_size": { @@ -49097,7 +49097,7 @@ } }, { - "accuracy": 0.9736364970081731, + "accuracy": 0.9724908905397904, "total_bits": 132980224, "q_proj": { "group_size": { @@ -49161,7 +49161,7 @@ } }, { - "accuracy": 0.9821601294373211, + "accuracy": 0.9820638985226029, "total_bits": 169613312, "q_proj": { "group_size": { @@ -49213,7 +49213,7 @@ } }, { - "accuracy": 0.9830479631690603, + "accuracy": 0.983313759445752, "total_bits": 169745920, "q_proj": { "group_size": { @@ -49265,7 +49265,7 @@ } }, { - "accuracy": 0.9850593051922164, + "accuracy": 0.9850981331577426, "total_bits": 171195392, "q_proj": { "group_size": { @@ -49317,7 +49317,7 @@ } }, { - "accuracy": 0.9856737586424539, + "accuracy": 0.9856968799998101, "total_bits": 173563904, "q_proj": { "group_size": { @@ -49369,7 +49369,7 @@ } }, { - "accuracy": 0.9865651306157049, + "accuracy": 0.9862744168525464, "total_bits": 174923264, "q_proj": { "group_size": { @@ -49433,7 +49433,7 @@ } }, { - "accuracy": 0.9874835402557725, + "accuracy": 0.9871476240652172, "total_bits": 175750144, "q_proj": { "group_size": { @@ -49497,7 +49497,7 @@ } }, { - "accuracy": 0.9894345217923585, + "accuracy": 0.9896134171929014, "total_bits": 179253248, "q_proj": { "group_size": { @@ -49558,7 +49558,7 @@ } }, { - "accuracy": 0.9903469423420335, + "accuracy": 0.9905227793282584, "total_bits": 181592064, "q_proj": { "group_size": { @@ -49619,7 +49619,7 @@ } }, { - "accuracy": 0.9940386692699241, + "accuracy": 0.9941945887955004, "total_bits": 220469248, "q_proj": { "group_size": { @@ -49680,7 +49680,7 @@ } }, { - "accuracy": 0.9952443013163773, + "accuracy": 0.995297767540538, "total_bits": 223535104, "q_proj": { "group_size": { @@ -49741,7 +49741,7 @@ } }, { - "accuracy": 0.9952908678127355, + "accuracy": 0.9952866520340505, "total_bits": 253499392, "q_proj": { "group_size": { @@ -49793,7 +49793,7 @@ } }, { - "accuracy": 0.9974354728811273, + "accuracy": 0.9974391659060003, "total_bits": 265838592, "q_proj": { "group_size": { @@ -49845,7 +49845,7 @@ } }, { - "accuracy": 0.9987432912090107, + "accuracy": 0.9987426578728972, "total_bits": 337385472, "q_proj": { "group_size": { @@ -49899,7 +49899,7 @@ ], "model.layers.25.mlp": [ { - "accuracy": 0.9067067841165944, + "accuracy": 0.9088886450780065, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -49951,7 +49951,7 @@ } }, { - "accuracy": 0.9092354362732485, + "accuracy": 0.9113666548540718, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -50003,7 +50003,7 @@ } }, { - "accuracy": 0.9212227599009087, + "accuracy": 0.923032491811012, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -50052,7 +50052,7 @@ } }, { - "accuracy": 0.9249252104445508, + "accuracy": 0.9266559271828124, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -50101,7 +50101,7 @@ } }, { - "accuracy": 0.952399526967814, + "accuracy": 0.9536091583339792, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -50153,7 +50153,7 @@ } }, { - "accuracy": 0.9560997166523808, + "accuracy": 0.957175229332949, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -50205,7 +50205,7 @@ } }, { - "accuracy": 0.9613283950051195, + "accuracy": 0.9622613882743999, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -50254,7 +50254,7 @@ } }, { - "accuracy": 0.9752293303608894, + "accuracy": 0.9758168908914453, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -50297,7 +50297,7 @@ } }, { - "accuracy": 0.9773161167180852, + "accuracy": 0.9778374946235042, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -50340,7 +50340,7 @@ } }, { - "accuracy": 0.9757754738001447, + "accuracy": 0.9764133103583988, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -50392,7 +50392,7 @@ } }, { - "accuracy": 0.9786968226299474, + "accuracy": 0.9792184036617216, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -50444,7 +50444,7 @@ } }, { - "accuracy": 0.9876833510045943, + "accuracy": 0.988023854939169, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -50496,7 +50496,7 @@ } }, { - "accuracy": 0.9893827981462604, + "accuracy": 0.9896477213815639, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -50548,7 +50548,7 @@ } }, { - "accuracy": 0.9933003317564726, + "accuracy": 0.9934675191823197, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -50591,7 +50591,7 @@ } }, { - "accuracy": 0.9937434998635006, + "accuracy": 0.9939135614243385, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -50640,7 +50640,7 @@ } }, { - "accuracy": 0.9947581622185871, + "accuracy": 0.9949056060960222, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -50686,7 +50686,7 @@ } }, { - "accuracy": 0.9981913148780892, + "accuracy": 0.9982286457670853, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -50728,7 +50728,7 @@ ], "model.layers.26.self_attn": [ { - "accuracy": 0.9479121577582861, + "accuracy": 0.9487627187841817, "total_bits": 89665536, "q_proj": { "group_size": { @@ -50792,7 +50792,7 @@ } }, { - "accuracy": 0.9503459575537004, + "accuracy": 0.9507187300998914, "total_bits": 92221440, "q_proj": { "group_size": { @@ -50856,7 +50856,7 @@ } }, { - "accuracy": 0.9576964443059344, + "accuracy": 0.9587722908901541, "total_bits": 95758848, "q_proj": { "group_size": { @@ -50920,7 +50920,7 @@ } }, { - "accuracy": 0.9653835506423524, + "accuracy": 0.9660183190319099, "total_bits": 112272384, "q_proj": { "group_size": { @@ -50984,7 +50984,7 @@ } }, { - "accuracy": 0.9729656623186249, + "accuracy": 0.9729224882627788, "total_bits": 132913152, "q_proj": { "group_size": { @@ -51048,7 +51048,7 @@ } }, { - "accuracy": 0.9739223553946144, + "accuracy": 0.9747599382933817, "total_bits": 132980224, "q_proj": { "group_size": { @@ -51112,7 +51112,7 @@ } }, { - "accuracy": 0.9823017737485076, + "accuracy": 0.9831985739108763, "total_bits": 169613312, "q_proj": { "group_size": { @@ -51164,7 +51164,7 @@ } }, { - "accuracy": 0.9837876818583984, + "accuracy": 0.9844246666486326, "total_bits": 169745920, "q_proj": { "group_size": { @@ -51216,7 +51216,7 @@ } }, { - "accuracy": 0.9848850857662527, + "accuracy": 0.9858212914611948, "total_bits": 171195392, "q_proj": { "group_size": { @@ -51268,7 +51268,7 @@ } }, { - "accuracy": 0.9855629657640269, + "accuracy": 0.9862934676440138, "total_bits": 173563904, "q_proj": { "group_size": { @@ -51320,7 +51320,7 @@ } }, { - "accuracy": 0.9861785050873694, + "accuracy": 0.9864065552522477, "total_bits": 174923264, "q_proj": { "group_size": { @@ -51384,7 +51384,7 @@ } }, { - "accuracy": 0.986946036647025, + "accuracy": 0.9874741717878925, "total_bits": 175750144, "q_proj": { "group_size": { @@ -51448,7 +51448,7 @@ } }, { - "accuracy": 0.9891065998787159, + "accuracy": 0.9893429364616934, "total_bits": 179253248, "q_proj": { "group_size": { @@ -51509,7 +51509,7 @@ } }, { - "accuracy": 0.9901095925781288, + "accuracy": 0.9904637321780779, "total_bits": 181592064, "q_proj": { "group_size": { @@ -51570,7 +51570,7 @@ } }, { - "accuracy": 0.9939403485898909, + "accuracy": 0.9941711807868591, "total_bits": 220469248, "q_proj": { "group_size": { @@ -51631,7 +51631,7 @@ } }, { - "accuracy": 0.9949914177046403, + "accuracy": 0.9952622074633837, "total_bits": 223535104, "q_proj": { "group_size": { @@ -51692,7 +51692,7 @@ } }, { - "accuracy": 0.995356286140649, + "accuracy": 0.9955319977046824, "total_bits": 253499392, "q_proj": { "group_size": { @@ -51744,7 +51744,7 @@ } }, { - "accuracy": 0.9973190626815746, + "accuracy": 0.9974245381431261, "total_bits": 265838592, "q_proj": { "group_size": { @@ -51796,7 +51796,7 @@ } }, { - "accuracy": 0.9987346040281025, + "accuracy": 0.9987907473696396, "total_bits": 337385472, "q_proj": { "group_size": { @@ -51850,7 +51850,7 @@ ], "model.layers.26.mlp": [ { - "accuracy": 0.9059437348654396, + "accuracy": 0.9081306786913621, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -51902,7 +51902,7 @@ } }, { - "accuracy": 0.908503245366247, + "accuracy": 0.910644632028906, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -51954,7 +51954,7 @@ } }, { - "accuracy": 0.9204196345649267, + "accuracy": 0.9223323164409712, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -52003,7 +52003,7 @@ } }, { - "accuracy": 0.9241533495093647, + "accuracy": 0.9260027436049361, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -52052,7 +52052,7 @@ } }, { - "accuracy": 0.9520501937521131, + "accuracy": 0.9532161692255422, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -52104,7 +52104,7 @@ } }, { - "accuracy": 0.9557382823213151, + "accuracy": 0.9568005992393744, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -52156,7 +52156,7 @@ } }, { - "accuracy": 0.9609578424378445, + "accuracy": 0.961900201577105, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -52205,7 +52205,7 @@ } }, { - "accuracy": 0.9749748898964179, + "accuracy": 0.9755692395724749, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -52248,7 +52248,7 @@ } }, { - "accuracy": 0.9770808203243896, + "accuracy": 0.9776126162001961, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -52291,7 +52291,7 @@ } }, { - "accuracy": 0.9756017253783188, + "accuracy": 0.9761945107265523, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -52343,7 +52343,7 @@ } }, { - "accuracy": 0.9785121577350717, + "accuracy": 0.9790279881930665, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -52395,7 +52395,7 @@ } }, { - "accuracy": 0.9875998964631244, + "accuracy": 0.9879067885738454, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -52447,7 +52447,7 @@ } }, { - "accuracy": 0.9892914449109843, + "accuracy": 0.9895513587582269, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -52499,7 +52499,7 @@ } }, { - "accuracy": 0.9932366719371394, + "accuracy": 0.9933951359830404, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -52542,7 +52542,7 @@ } }, { - "accuracy": 0.9937064550130775, + "accuracy": 0.9938535921177581, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -52591,7 +52591,7 @@ } }, { - "accuracy": 0.9947310440168765, + "accuracy": 0.9948541356593763, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -52637,7 +52637,7 @@ } }, { - "accuracy": 0.9981712053627952, + "accuracy": 0.9982059716161242, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -52679,7 +52679,7 @@ ], "model.layers.27.self_attn": [ { - "accuracy": 0.9424951021608553, + "accuracy": 0.9434478780940959, "total_bits": 89665536, "q_proj": { "group_size": { @@ -52743,7 +52743,7 @@ } }, { - "accuracy": 0.9456411717753661, + "accuracy": 0.9451379950501417, "total_bits": 92221440, "q_proj": { "group_size": { @@ -52807,7 +52807,7 @@ } }, { - "accuracy": 0.9542936845437476, + "accuracy": 0.9540607099862475, "total_bits": 95758848, "q_proj": { "group_size": { @@ -52871,7 +52871,7 @@ } }, { - "accuracy": 0.9621277694639406, + "accuracy": 0.9617430735379457, "total_bits": 112272384, "q_proj": { "group_size": { @@ -52935,7 +52935,7 @@ } }, { - "accuracy": 0.9710372051126078, + "accuracy": 0.9702666551855049, "total_bits": 132913152, "q_proj": { "group_size": { @@ -52999,7 +52999,7 @@ } }, { - "accuracy": 0.9719590329025921, + "accuracy": 0.9714633463636825, "total_bits": 132980224, "q_proj": { "group_size": { @@ -53063,7 +53063,7 @@ } }, { - "accuracy": 0.9803541639917775, + "accuracy": 0.9802681577244872, "total_bits": 169613312, "q_proj": { "group_size": { @@ -53115,7 +53115,7 @@ } }, { - "accuracy": 0.9816839122948678, + "accuracy": 0.9819463537025609, "total_bits": 169745920, "q_proj": { "group_size": { @@ -53167,7 +53167,7 @@ } }, { - "accuracy": 0.9833788683049773, + "accuracy": 0.9833932330733851, "total_bits": 171195392, "q_proj": { "group_size": { @@ -53219,7 +53219,7 @@ } }, { - "accuracy": 0.9840522178105617, + "accuracy": 0.9843222897401765, "total_bits": 173563904, "q_proj": { "group_size": { @@ -53271,7 +53271,7 @@ } }, { - "accuracy": 0.9858122274377629, + "accuracy": 0.985410600949667, "total_bits": 174923264, "q_proj": { "group_size": { @@ -53335,7 +53335,7 @@ } }, { - "accuracy": 0.9863537154405525, + "accuracy": 0.9862800933616725, "total_bits": 175750144, "q_proj": { "group_size": { @@ -53399,7 +53399,7 @@ } }, { - "accuracy": 0.9881419031635711, + "accuracy": 0.9883456508580007, "total_bits": 179253248, "q_proj": { "group_size": { @@ -53460,7 +53460,7 @@ } }, { - "accuracy": 0.989256463797861, + "accuracy": 0.9895112045893544, "total_bits": 181592064, "q_proj": { "group_size": { @@ -53521,7 +53521,7 @@ } }, { - "accuracy": 0.9934491572264386, + "accuracy": 0.9935121850698794, "total_bits": 220469248, "q_proj": { "group_size": { @@ -53582,7 +53582,7 @@ } }, { - "accuracy": 0.9945267753577546, + "accuracy": 0.9947013332949657, "total_bits": 223535104, "q_proj": { "group_size": { @@ -53643,7 +53643,7 @@ } }, { - "accuracy": 0.9948108980530187, + "accuracy": 0.9949374200874254, "total_bits": 253499392, "q_proj": { "group_size": { @@ -53695,7 +53695,7 @@ } }, { - "accuracy": 0.997045311574383, + "accuracy": 0.997136262282239, "total_bits": 265838592, "q_proj": { "group_size": { @@ -53747,7 +53747,7 @@ } }, { - "accuracy": 0.9986081643422183, + "accuracy": 0.998628963612167, "total_bits": 337385472, "q_proj": { "group_size": { @@ -53801,7 +53801,7 @@ ], "model.layers.27.mlp": [ { - "accuracy": 0.9039016087588511, + "accuracy": 0.9069889779937894, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -53853,7 +53853,7 @@ } }, { - "accuracy": 0.9065776090872915, + "accuracy": 0.9095301228134256, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -53905,7 +53905,7 @@ } }, { - "accuracy": 0.9185606754924122, + "accuracy": 0.9211613112374356, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -53954,7 +53954,7 @@ } }, { - "accuracy": 0.9224375651070946, + "accuracy": 0.9249300880259589, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -54003,7 +54003,7 @@ } }, { - "accuracy": 0.9508984879051384, + "accuracy": 0.9525143035540455, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -54055,7 +54055,7 @@ } }, { - "accuracy": 0.9546990133821964, + "accuracy": 0.9562023393809795, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -54107,7 +54107,7 @@ } }, { - "accuracy": 0.960005313746239, + "accuracy": 0.9613319134437724, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -54156,7 +54156,7 @@ } }, { - "accuracy": 0.9742310946121028, + "accuracy": 0.975074468670707, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -54199,7 +54199,7 @@ } }, { - "accuracy": 0.9764304797312147, + "accuracy": 0.9772006085044459, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -54242,7 +54242,7 @@ } }, { - "accuracy": 0.9749809888828742, + "accuracy": 0.9758249246760419, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -54294,7 +54294,7 @@ } }, { - "accuracy": 0.9779991365380978, + "accuracy": 0.9787212381825635, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -54346,7 +54346,7 @@ } }, { - "accuracy": 0.9872734655479067, + "accuracy": 0.9877128246191301, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -54398,7 +54398,7 @@ } }, { - "accuracy": 0.9890360964070025, + "accuracy": 0.9894014930254534, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -54450,7 +54450,7 @@ } }, { - "accuracy": 0.9930287209143372, + "accuracy": 0.9932610707259492, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -54493,7 +54493,7 @@ } }, { - "accuracy": 0.9935468171821221, + "accuracy": 0.9937691056953841, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -54542,7 +54542,7 @@ } }, { - "accuracy": 0.9945940370671451, + "accuracy": 0.9947843230451996, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -54588,7 +54588,7 @@ } }, { - "accuracy": 0.9981165734903985, + "accuracy": 0.998177430678257, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -54630,7 +54630,7 @@ ], "model.layers.28.self_attn": [ { - "accuracy": 0.9367124750033805, + "accuracy": 0.9362437364302183, "total_bits": 89665536, "q_proj": { "group_size": { @@ -54694,7 +54694,7 @@ } }, { - "accuracy": 0.9379993500678163, + "accuracy": 0.9372361837641189, "total_bits": 92221440, "q_proj": { "group_size": { @@ -54758,7 +54758,7 @@ } }, { - "accuracy": 0.9513284224820764, + "accuracy": 0.9513718076050282, "total_bits": 95758848, "q_proj": { "group_size": { @@ -54822,7 +54822,7 @@ } }, { - "accuracy": 0.9605587773809308, + "accuracy": 0.961191442353945, "total_bits": 112272384, "q_proj": { "group_size": { @@ -54886,7 +54886,7 @@ } }, { - "accuracy": 0.9687110350320214, + "accuracy": 0.9682433715972462, "total_bits": 132913152, "q_proj": { "group_size": { @@ -54950,7 +54950,7 @@ } }, { - "accuracy": 0.969934609277468, + "accuracy": 0.9691933717970785, "total_bits": 132980224, "q_proj": { "group_size": { @@ -55014,7 +55014,7 @@ } }, { - "accuracy": 0.9812605130045038, + "accuracy": 0.9812179332795111, "total_bits": 169613312, "q_proj": { "group_size": { @@ -55066,7 +55066,7 @@ } }, { - "accuracy": 0.98190788179636, + "accuracy": 0.9820223970730838, "total_bits": 169745920, "q_proj": { "group_size": { @@ -55118,7 +55118,7 @@ } }, { - "accuracy": 0.9830738246734989, + "accuracy": 0.9832787493635949, "total_bits": 171195392, "q_proj": { "group_size": { @@ -55170,7 +55170,7 @@ } }, { - "accuracy": 0.9841299387381265, + "accuracy": 0.9839331565522834, "total_bits": 173563904, "q_proj": { "group_size": { @@ -55222,7 +55222,7 @@ } }, { - "accuracy": 0.9845823859795928, + "accuracy": 0.9843095676287225, "total_bits": 174923264, "q_proj": { "group_size": { @@ -55286,7 +55286,7 @@ } }, { - "accuracy": 0.9855940481157679, + "accuracy": 0.9854277645384795, "total_bits": 175750144, "q_proj": { "group_size": { @@ -55350,7 +55350,7 @@ } }, { - "accuracy": 0.9879433417104577, + "accuracy": 0.9879202580961742, "total_bits": 179253248, "q_proj": { "group_size": { @@ -55411,7 +55411,7 @@ } }, { - "accuracy": 0.9888839909904882, + "accuracy": 0.9888220327465158, "total_bits": 181592064, "q_proj": { "group_size": { @@ -55472,7 +55472,7 @@ } }, { - "accuracy": 0.993159772411577, + "accuracy": 0.9931618823963952, "total_bits": 220469248, "q_proj": { "group_size": { @@ -55533,7 +55533,7 @@ } }, { - "accuracy": 0.9944646907970309, + "accuracy": 0.994235600810498, "total_bits": 223535104, "q_proj": { "group_size": { @@ -55594,7 +55594,7 @@ } }, { - "accuracy": 0.9948158818542173, + "accuracy": 0.9947797443080497, "total_bits": 253499392, "q_proj": { "group_size": { @@ -55646,7 +55646,7 @@ } }, { - "accuracy": 0.9972003068848464, + "accuracy": 0.9971368630833336, "total_bits": 265838592, "q_proj": { "group_size": { @@ -55698,7 +55698,7 @@ } }, { - "accuracy": 0.9986425778816307, + "accuracy": 0.9986384437284678, "total_bits": 337385472, "q_proj": { "group_size": { @@ -55752,7 +55752,7 @@ ], "model.layers.28.mlp": [ { - "accuracy": 0.9004592064179873, + "accuracy": 0.9025848786297598, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -55804,7 +55804,7 @@ } }, { - "accuracy": 0.9032249823212624, + "accuracy": 0.9053193828777263, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -55856,7 +55856,7 @@ } }, { - "accuracy": 0.9156045707824984, + "accuracy": 0.9174373391035356, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -55905,7 +55905,7 @@ } }, { - "accuracy": 0.91970757963626, + "accuracy": 0.9214657037273833, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -55954,7 +55954,7 @@ } }, { - "accuracy": 0.9491443745791912, + "accuracy": 0.9503187127411366, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -56006,7 +56006,7 @@ } }, { - "accuracy": 0.9530928317261369, + "accuracy": 0.9541476251263368, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -56058,7 +56058,7 @@ } }, { - "accuracy": 0.9585649053517141, + "accuracy": 0.9595084069786888, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -56107,7 +56107,7 @@ } }, { - "accuracy": 0.9731988448061442, + "accuracy": 0.9738058054721669, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -56150,7 +56150,7 @@ } }, { - "accuracy": 0.9755161676163736, + "accuracy": 0.9760429733677914, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -56193,7 +56193,7 @@ } }, { - "accuracy": 0.9741098433732986, + "accuracy": 0.974719419095077, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -56245,7 +56245,7 @@ } }, { - "accuracy": 0.977227778517102, + "accuracy": 0.9777300802402591, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -56297,7 +56297,7 @@ } }, { - "accuracy": 0.986842875712012, + "accuracy": 0.9871551218491635, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -56349,7 +56349,7 @@ } }, { - "accuracy": 0.9886463201163631, + "accuracy": 0.9889036752283573, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -56401,7 +56401,7 @@ } }, { - "accuracy": 0.9927499375894273, + "accuracy": 0.9929277300099401, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -56444,7 +56444,7 @@ } }, { - "accuracy": 0.9933270449063888, + "accuracy": 0.9934874623278646, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -56493,7 +56493,7 @@ } }, { - "accuracy": 0.9944204081487107, + "accuracy": 0.9945568965478359, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -56539,7 +56539,7 @@ } }, { - "accuracy": 0.9980353182733157, + "accuracy": 0.9980806403879174, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -56581,7 +56581,7 @@ ], "model.layers.29.self_attn": [ { - "accuracy": 0.9361793000839258, + "accuracy": 0.9287255459318036, "total_bits": 89665536, "q_proj": { "group_size": { @@ -56645,7 +56645,7 @@ } }, { - "accuracy": 0.9390310235321522, + "accuracy": 0.930326672368928, "total_bits": 92221440, "q_proj": { "group_size": { @@ -56709,7 +56709,7 @@ } }, { - "accuracy": 0.9516669858835245, + "accuracy": 0.9493203094523204, "total_bits": 95758848, "q_proj": { "group_size": { @@ -56773,7 +56773,7 @@ } }, { - "accuracy": 0.9590546421118473, + "accuracy": 0.9562089598100436, "total_bits": 112272384, "q_proj": { "group_size": { @@ -56837,7 +56837,7 @@ } }, { - "accuracy": 0.9679287136777451, + "accuracy": 0.9653359131985589, "total_bits": 132913152, "q_proj": { "group_size": { @@ -56901,7 +56901,7 @@ } }, { - "accuracy": 0.9685769256596503, + "accuracy": 0.9656498429218405, "total_bits": 132980224, "q_proj": { "group_size": { @@ -56965,7 +56965,7 @@ } }, { - "accuracy": 0.9809319616148346, + "accuracy": 0.9804368212721065, "total_bits": 169613312, "q_proj": { "group_size": { @@ -57017,7 +57017,7 @@ } }, { - "accuracy": 0.9817231295532302, + "accuracy": 0.9806328550177185, "total_bits": 169745920, "q_proj": { "group_size": { @@ -57069,7 +57069,7 @@ } }, { - "accuracy": 0.9836407655752019, + "accuracy": 0.9826134642782179, "total_bits": 171195392, "q_proj": { "group_size": { @@ -57121,7 +57121,7 @@ } }, { - "accuracy": 0.9842287297115514, + "accuracy": 0.9832148871041442, "total_bits": 173563904, "q_proj": { "group_size": { @@ -57173,7 +57173,7 @@ } }, { - "accuracy": 0.9841496059180874, + "accuracy": 0.9828789114559952, "total_bits": 174923264, "q_proj": { "group_size": { @@ -57237,7 +57237,7 @@ } }, { - "accuracy": 0.9850288834912997, + "accuracy": 0.9843405053803795, "total_bits": 175750144, "q_proj": { "group_size": { @@ -57301,7 +57301,7 @@ } }, { - "accuracy": 0.9879535030769674, + "accuracy": 0.9875970985250253, "total_bits": 179253248, "q_proj": { "group_size": { @@ -57362,7 +57362,7 @@ } }, { - "accuracy": 0.9888889568514729, + "accuracy": 0.9887215920086754, "total_bits": 181592064, "q_proj": { "group_size": { @@ -57423,7 +57423,7 @@ } }, { - "accuracy": 0.9934684268051857, + "accuracy": 0.9932251357914585, "total_bits": 220469248, "q_proj": { "group_size": { @@ -57484,7 +57484,7 @@ } }, { - "accuracy": 0.9944882137014678, + "accuracy": 0.9943580585286805, "total_bits": 223535104, "q_proj": { "group_size": { @@ -57545,7 +57545,7 @@ } }, { - "accuracy": 0.995095324910883, + "accuracy": 0.9946791924242127, "total_bits": 253499392, "q_proj": { "group_size": { @@ -57597,7 +57597,7 @@ } }, { - "accuracy": 0.9971579691566723, + "accuracy": 0.9971507764298861, "total_bits": 265838592, "q_proj": { "group_size": { @@ -57649,7 +57649,7 @@ } }, { - "accuracy": 0.9986602384351978, + "accuracy": 0.9985929969820733, "total_bits": 337385472, "q_proj": { "group_size": { @@ -57703,7 +57703,7 @@ ], "model.layers.29.mlp": [ { - "accuracy": 0.895974394914351, + "accuracy": 0.8982392761268114, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -57755,7 +57755,7 @@ } }, { - "accuracy": 0.8989685616995159, + "accuracy": 0.9012185052821511, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -57807,7 +57807,7 @@ } }, { - "accuracy": 0.9119811489393836, + "accuracy": 0.9138486201041623, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -57856,7 +57856,7 @@ } }, { - "accuracy": 0.9162935479299018, + "accuracy": 0.9180533860466982, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -57905,7 +57905,7 @@ } }, { - "accuracy": 0.9464578812843875, + "accuracy": 0.9476723086677099, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -57957,7 +57957,7 @@ } }, { - "accuracy": 0.9508937418852982, + "accuracy": 0.951990555579725, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -58009,7 +58009,7 @@ } }, { - "accuracy": 0.9567253673939329, + "accuracy": 0.9576529957550137, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -58058,7 +58058,7 @@ } }, { - "accuracy": 0.9716562753249156, + "accuracy": 0.9722733116267543, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -58101,7 +58101,7 @@ } }, { - "accuracy": 0.9741271344062529, + "accuracy": 0.9746550921546785, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -58144,7 +58144,7 @@ } }, { - "accuracy": 0.9725390801108197, + "accuracy": 0.9731504613239514, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -58196,7 +58196,7 @@ } }, { - "accuracy": 0.9760081061211071, + "accuracy": 0.976547883627446, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -58248,7 +58248,7 @@ } }, { - "accuracy": 0.9859512745843906, + "accuracy": 0.9862681904219484, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -58300,7 +58300,7 @@ } }, { - "accuracy": 0.9880149831603232, + "accuracy": 0.9882674325061472, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -58352,7 +58352,7 @@ } }, { - "accuracy": 0.9921242934161503, + "accuracy": 0.9922878680946795, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -58395,7 +58395,7 @@ } }, { - "accuracy": 0.9928749354654237, + "accuracy": 0.9930419144955905, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -58444,7 +58444,7 @@ } }, { - "accuracy": 0.9940255677670633, + "accuracy": 0.9941575458812478, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -58490,7 +58490,7 @@ } }, { - "accuracy": 0.9978683753809157, + "accuracy": 0.9979065027896707, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -58532,7 +58532,7 @@ ], "model.layers.30.self_attn": [ { - "accuracy": 0.9281110851780364, + "accuracy": 0.9294108654323378, "total_bits": 89665536, "q_proj": { "group_size": { @@ -58596,7 +58596,7 @@ } }, { - "accuracy": 0.9304367948911691, + "accuracy": 0.9335513042384073, "total_bits": 92221440, "q_proj": { "group_size": { @@ -58660,7 +58660,7 @@ } }, { - "accuracy": 0.9397618247098044, + "accuracy": 0.9454480490010035, "total_bits": 95758848, "q_proj": { "group_size": { @@ -58724,7 +58724,7 @@ } }, { - "accuracy": 0.9487706942385749, + "accuracy": 0.9537417996478708, "total_bits": 112272384, "q_proj": { "group_size": { @@ -58788,7 +58788,7 @@ } }, { - "accuracy": 0.9620860031756916, + "accuracy": 0.9637758616161973, "total_bits": 132913152, "q_proj": { "group_size": { @@ -58852,7 +58852,7 @@ } }, { - "accuracy": 0.9616938420620403, + "accuracy": 0.9647677897622711, "total_bits": 132980224, "q_proj": { "group_size": { @@ -58916,7 +58916,7 @@ } }, { - "accuracy": 0.977748556552749, + "accuracy": 0.9789000656455755, "total_bits": 169613312, "q_proj": { "group_size": { @@ -58968,7 +58968,7 @@ } }, { - "accuracy": 0.9791354767389988, + "accuracy": 0.9799976234177226, "total_bits": 169745920, "q_proj": { "group_size": { @@ -59020,7 +59020,7 @@ } }, { - "accuracy": 0.9811562163461196, + "accuracy": 0.9815308692325887, "total_bits": 171195392, "q_proj": { "group_size": { @@ -59072,7 +59072,7 @@ } }, { - "accuracy": 0.9823650051594565, + "accuracy": 0.9824057497378242, "total_bits": 173563904, "q_proj": { "group_size": { @@ -59124,7 +59124,7 @@ } }, { - "accuracy": 0.9821830422764546, + "accuracy": 0.98234146181494, "total_bits": 174923264, "q_proj": { "group_size": { @@ -59188,7 +59188,7 @@ } }, { - "accuracy": 0.9834651449008992, + "accuracy": 0.9834738772754607, "total_bits": 175750144, "q_proj": { "group_size": { @@ -59252,7 +59252,7 @@ } }, { - "accuracy": 0.9861626127538713, + "accuracy": 0.986764159151598, "total_bits": 179253248, "q_proj": { "group_size": { @@ -59313,7 +59313,7 @@ } }, { - "accuracy": 0.9874788266851714, + "accuracy": 0.9881406317612058, "total_bits": 181592064, "q_proj": { "group_size": { @@ -59374,7 +59374,7 @@ } }, { - "accuracy": 0.9925128852360343, + "accuracy": 0.9928716928943208, "total_bits": 220469248, "q_proj": { "group_size": { @@ -59435,7 +59435,7 @@ } }, { - "accuracy": 0.993710986044454, + "accuracy": 0.994032961978136, "total_bits": 223535104, "q_proj": { "group_size": { @@ -59496,7 +59496,7 @@ } }, { - "accuracy": 0.9944882836486948, + "accuracy": 0.9945411313031065, "total_bits": 253499392, "q_proj": { "group_size": { @@ -59548,7 +59548,7 @@ } }, { - "accuracy": 0.9966783542798734, + "accuracy": 0.9968617164750436, "total_bits": 265838592, "q_proj": { "group_size": { @@ -59600,7 +59600,7 @@ } }, { - "accuracy": 0.9985228671912888, + "accuracy": 0.9985311028032907, "total_bits": 337385472, "q_proj": { "group_size": { @@ -59654,7 +59654,7 @@ ], "model.layers.30.mlp": [ { - "accuracy": 0.8830651840881297, + "accuracy": 0.8849808260014183, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -59706,7 +59706,7 @@ } }, { - "accuracy": 0.8869845804415251, + "accuracy": 0.8888402400832427, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -59758,7 +59758,7 @@ } }, { - "accuracy": 0.900140098051021, + "accuracy": 0.9020102631888891, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -59807,7 +59807,7 @@ } }, { - "accuracy": 0.9044817152776217, + "accuracy": 0.9063003486708591, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -59856,7 +59856,7 @@ } }, { - "accuracy": 0.938663956954291, + "accuracy": 0.9395228649832701, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -59908,7 +59908,7 @@ } }, { - "accuracy": 0.9451034414140802, + "accuracy": 0.9460300789459756, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -59960,7 +59960,7 @@ } }, { - "accuracy": 0.9511445907777861, + "accuracy": 0.9519095142420969, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -60009,7 +60009,7 @@ } }, { - "accuracy": 0.9681059886750422, + "accuracy": 0.9686001149055204, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -60052,7 +60052,7 @@ } }, { - "accuracy": 0.9707965688093713, + "accuracy": 0.9711995015018865, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -60095,7 +60095,7 @@ } }, { - "accuracy": 0.9683944562352017, + "accuracy": 0.9688290752666561, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -60147,7 +60147,7 @@ } }, { - "accuracy": 0.9731286280837498, + "accuracy": 0.9735513782422793, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -60199,7 +60199,7 @@ } }, { - "accuracy": 0.9838335352802747, + "accuracy": 0.9840430837418688, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -60251,7 +60251,7 @@ } }, { - "accuracy": 0.9865542725218754, + "accuracy": 0.9867606090479776, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -60303,7 +60303,7 @@ } }, { - "accuracy": 0.9908618711082167, + "accuracy": 0.9909827291083179, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -60346,7 +60346,7 @@ } }, { - "accuracy": 0.9917276501165408, + "accuracy": 0.9918171535736244, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -60395,7 +60395,7 @@ } }, { - "accuracy": 0.9929199321930738, + "accuracy": 0.9929624785620131, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -60441,7 +60441,7 @@ } }, { - "accuracy": 0.997476822034897, + "accuracy": 0.9975187013134066, "total_bits": 1415520512, "gate_proj": { "group_size": { @@ -60483,7 +60483,7 @@ ], "model.layers.31.self_attn": [ { - "accuracy": 0.9336667274566073, + "accuracy": 0.9266550258586281, "total_bits": 89665536, "q_proj": { "group_size": { @@ -60547,7 +60547,7 @@ } }, { - "accuracy": 0.9362687062668174, + "accuracy": 0.9312431880910146, "total_bits": 92221440, "q_proj": { "group_size": { @@ -60611,7 +60611,7 @@ } }, { - "accuracy": 0.9482218321216733, + "accuracy": 0.9452139746985937, "total_bits": 95758848, "q_proj": { "group_size": { @@ -60675,7 +60675,7 @@ } }, { - "accuracy": 0.9598894887848904, + "accuracy": 0.9581292657867858, "total_bits": 112272384, "q_proj": { "group_size": { @@ -60739,7 +60739,7 @@ } }, { - "accuracy": 0.9661438174937901, + "accuracy": 0.9636060254354226, "total_bits": 132913152, "q_proj": { "group_size": { @@ -60803,7 +60803,7 @@ } }, { - "accuracy": 0.9670225406359685, + "accuracy": 0.9644337586666408, "total_bits": 132980224, "q_proj": { "group_size": { @@ -60867,7 +60867,7 @@ } }, { - "accuracy": 0.979833778876223, + "accuracy": 0.9774503753961701, "total_bits": 169613312, "q_proj": { "group_size": { @@ -60919,7 +60919,7 @@ } }, { - "accuracy": 0.980362587657414, + "accuracy": 0.9781386846382367, "total_bits": 169745920, "q_proj": { "group_size": { @@ -60971,7 +60971,7 @@ } }, { - "accuracy": 0.982035329222287, + "accuracy": 0.9803491334773993, "total_bits": 171195392, "q_proj": { "group_size": { @@ -61023,7 +61023,7 @@ } }, { - "accuracy": 0.9826493605383133, + "accuracy": 0.9812571843105712, "total_bits": 173563904, "q_proj": { "group_size": { @@ -61075,7 +61075,7 @@ } }, { - "accuracy": 0.9829646884708813, + "accuracy": 0.9814649584065926, "total_bits": 174923264, "q_proj": { "group_size": { @@ -61139,7 +61139,7 @@ } }, { - "accuracy": 0.9842083790878716, + "accuracy": 0.9828941818130644, "total_bits": 175750144, "q_proj": { "group_size": { @@ -61203,7 +61203,7 @@ } }, { - "accuracy": 0.9869368995392793, + "accuracy": 0.9860010932346708, "total_bits": 179253248, "q_proj": { "group_size": { @@ -61264,7 +61264,7 @@ } }, { - "accuracy": 0.9879527344417415, + "accuracy": 0.987090107739756, "total_bits": 181592064, "q_proj": { "group_size": { @@ -61325,7 +61325,7 @@ } }, { - "accuracy": 0.9928924746223187, + "accuracy": 0.9923636379014504, "total_bits": 220469248, "q_proj": { "group_size": { @@ -61386,7 +61386,7 @@ } }, { - "accuracy": 0.9940123450942338, + "accuracy": 0.9935069437579889, "total_bits": 223535104, "q_proj": { "group_size": { @@ -61447,7 +61447,7 @@ } }, { - "accuracy": 0.9947025165402967, + "accuracy": 0.9941199343210381, "total_bits": 253499392, "q_proj": { "group_size": { @@ -61499,7 +61499,7 @@ } }, { - "accuracy": 0.9968619158638543, + "accuracy": 0.9965414572016973, "total_bits": 265838592, "q_proj": { "group_size": { @@ -61551,7 +61551,7 @@ } }, { - "accuracy": 0.9985370182272929, + "accuracy": 0.9984177566795168, "total_bits": 337385472, "q_proj": { "group_size": { @@ -61605,7 +61605,7 @@ ], "model.layers.31.mlp": [ { - "accuracy": 0.8708056423224901, + "accuracy": 0.8628403830685114, "total_bits": 395461696, "gate_proj": { "group_size": { @@ -61657,7 +61657,7 @@ } }, { - "accuracy": 0.8754319470179708, + "accuracy": 0.867565969103261, "total_bits": 409224256, "gate_proj": { "group_size": { @@ -61709,7 +61709,7 @@ } }, { - "accuracy": 0.8867548923743398, + "accuracy": 0.8795218028520283, "total_bits": 457272320, "gate_proj": { "group_size": { @@ -61758,7 +61758,7 @@ } }, { - "accuracy": 0.8909720068699435, + "accuracy": 0.883901169033427, "total_bits": 512977920, "gate_proj": { "group_size": { @@ -61807,7 +61807,7 @@ } }, { - "accuracy": 0.9324234053492546, + "accuracy": 0.9283068440854549, "total_bits": 578397280, "gate_proj": { "group_size": { @@ -61859,7 +61859,7 @@ } }, { - "accuracy": 0.9402476735413074, + "accuracy": 0.9364610924140403, "total_bits": 592872448, "gate_proj": { "group_size": { @@ -61911,7 +61911,7 @@ } }, { - "accuracy": 0.945353377806513, + "accuracy": 0.941853898724443, "total_bits": 637454432, "gate_proj": { "group_size": { @@ -61960,7 +61960,7 @@ } }, { - "accuracy": 0.9647525185228962, + "accuracy": 0.9627053813126526, "total_bits": 728741472, "gate_proj": { "group_size": { @@ -62003,7 +62003,7 @@ } }, { - "accuracy": 0.9677408377787, + "accuracy": 0.965717359789108, "total_bits": 739476480, "gate_proj": { "group_size": { @@ -62046,7 +62046,7 @@ } }, { - "accuracy": 0.9651259544648623, + "accuracy": 0.9628826519964557, "total_bits": 751543392, "gate_proj": { "group_size": { @@ -62098,7 +62098,7 @@ } }, { - "accuracy": 0.9703355514885563, + "accuracy": 0.9684994862856049, "total_bits": 766018560, "gate_proj": { "group_size": { @@ -62150,7 +62150,7 @@ } }, { - "accuracy": 0.9819708428786773, + "accuracy": 0.9807827789826613, "total_bits": 924689504, "gate_proj": { "group_size": { @@ -62202,7 +62202,7 @@ } }, { - "accuracy": 0.9850258716921273, + "accuracy": 0.9840721279186638, "total_bits": 939164672, "gate_proj": { "group_size": { @@ -62254,7 +62254,7 @@ } }, { - "accuracy": 0.9897539450934059, + "accuracy": 0.9891346512901548, "total_bits": 1069524064, "gate_proj": { "group_size": { @@ -62297,7 +62297,7 @@ } }, { - "accuracy": 0.9906766237200875, + "accuracy": 0.9900673695986992, "total_bits": 1110384896, "gate_proj": { "group_size": { @@ -62346,7 +62346,7 @@ } }, { - "accuracy": 0.9917373532723439, + "accuracy": 0.9911810960130472, "total_bits": 1209999616, "gate_proj": { "group_size": { @@ -62392,7 +62392,7 @@ } }, { - "accuracy": 0.9969809681030088, + "accuracy": 0.9968050105962902, "total_bits": 1415520512, "gate_proj": { "group_size": {