model,minerva_math_acc,minerva_math_pass_acc,minerva_math_tokens,minerva_math_keywords,minerva_math_correct_tokens,minerva_math_wrong_tokens,minerva_math_clip_ratio,minerva_math_stop_tokens,minerva_math_stop_ratio,minerva_math_box_ratio,minerva_math_repeat_ratio,amc23_acc,amc23_pass_acc,amc23_tokens,amc23_keywords,amc23_correct_tokens,amc23_wrong_tokens,amc23_clip_ratio,amc23_stop_tokens,amc23_stop_ratio,amc23_box_ratio,amc23_repeat_ratio,mmlu_stem_acc,mmlu_stem_pass_acc,mmlu_stem_tokens,mmlu_stem_keywords,mmlu_stem_correct_tokens,mmlu_stem_wrong_tokens,mmlu_stem_clip_ratio,mmlu_stem_stop_tokens,mmlu_stem_stop_ratio,mmlu_stem_box_ratio,mmlu_stem_repeat_ratio,aime24_acc,aime24_pass_acc,aime24_tokens,aime24_keywords,aime24_correct_tokens,aime24_wrong_tokens,aime24_clip_ratio,aime24_stop_tokens,aime24_stop_ratio,aime24_box_ratio,aime24_repeat_ratio,aime25_acc,aime25_pass_acc,aime25_tokens,aime25_keywords,aime25_correct_tokens,aime25_wrong_tokens,aime25_clip_ratio,aime25_stop_tokens,aime25_stop_ratio,aime25_box_ratio,aime25_repeat_ratio,gsm8k_acc,gsm8k_pass_acc,gsm8k_tokens,gsm8k_keywords,gsm8k_correct_tokens,gsm8k_wrong_tokens,gsm8k_clip_ratio,gsm8k_stop_tokens,gsm8k_stop_ratio,gsm8k_box_ratio,gsm8k_repeat_ratio,math500_acc,math500_pass_acc,math500_tokens,math500_keywords,math500_correct_tokens,math500_wrong_tokens,math500_clip_ratio,math500_stop_tokens,math500_stop_ratio,math500_box_ratio,math500_repeat_ratio,olympiadbench_acc,olympiadbench_pass_acc,olympiadbench_tokens,olympiadbench_keywords,olympiadbench_correct_tokens,olympiadbench_wrong_tokens,olympiadbench_clip_ratio,olympiadbench_stop_tokens,olympiadbench_stop_ratio,olympiadbench_box_ratio,olympiadbench_repeat_ratio,avg_acc,avg_pass_acc,avg_tokens,avg_keywords,avg_correct_tokens,avg_wrong_tokens,avg_clip_ratio,avg_stop_tokens,avg_stop_ratio,avg_box_ratio,avg_repeat_ratio eval_results-global_step_0,26.1,26.1,724.5992647058823,0.11764705882352941,988.7887323943662,631.2786069651742,0.007352941176470588,608.4481481481481,0.9926470588235294,0.9375,0.3897058823529412,45.0,45.0,990.275,0.675,987.2222222222222,992.7727272727273,0.0,990.275,1.0,1.0,0.775,60.7,60.7,373.0622929092114,0.26673293571901924,319.14020731042007,456.47088607594935,0.004638833664678595,301.13848202396804,0.9953611663353215,0.9055666003976143,0.4592445328031809,6.7,6.7,2314.4333333333334,7.666666666666667,1565.5,2367.9285714285716,0.06666666666666667,1350.892857142857,0.9333333333333333,0.9333333333333333,0.9,13.3,13.3,1927.8333333333333,1.8,5070.0,1444.423076923077,0.03333333333333333,1442.655172413793,0.9666666666666667,0.9333333333333333,0.8,84.3,84.3,336.931766489765,0.04927975739196361,304.51079136690646,511.0966183574879,0.004548900682335102,266.7989337395278,0.9954510993176648,0.9575435936315391,0.17816527672479152,65.4,65.4,879.99,0.92,530.434250764526,1540.7109826589594,0.018,602.5336048879838,0.982,0.964,0.448,31.1,31.1,1166.722962962963,1.2696296296296297,866.952380952381,1302.1032258064515,0.011851851851851851,983.7991004497751,0.9881481481481481,0.9674074074074074,0.6266666666666667,41.575,41.575,1089.230994216811,1.5956195060288512,1329.068573126353,1155.8480869360496,0.018299065921917018,818.3176623507566,0.9817009340780829,0.9498355335129034,0.5720977948184475 eval_results-global_step_10,32.7,32.7,753.8308823529412,0.07352941176470588,513.1685393258427,870.8743169398907,0.007352941176470588,638.6592592592592,0.9926470588235294,0.9926470588235294,0.45955882352941174,52.5,52.5,1412.525,1.225,924.047619047619,1952.421052631579,0.025,1038.5897435897436,0.975,0.975,0.625,64.5,64.5,459.8711066931743,0.6196156394963552,407.25513347022587,555.6616822429907,0.0026507620941020544,418.36146179401993,0.9973492379058979,0.9758117958913187,0.558648111332008,16.7,16.7,3543.4666666666667,5.866666666666666,1584.2,3935.32,0.03333333333333333,3113.9655172413795,0.9666666666666667,0.9333333333333333,0.9,16.7,16.7,2644.3,8.2,1336.0,2905.96,0.03333333333333333,2183.7586206896553,0.9666666666666667,0.9333333333333333,0.7333333333333333,91.8,91.8,312.6459438968916,0.03335860500379075,292.8117258464079,535.0462962962963,0.000758150113722517,300.7443095599393,0.9992418498862775,0.9984836997725549,0.1599696739954511,79.2,79.2,966.608,0.984,678.979797979798,2061.8076923076924,0.006,875.8068410462777,0.994,0.988,0.514,43.6,43.6,1474.634074074074,1.288888888888889,1011.6360544217687,1831.9081364829397,0.016296296296296295,1233.936746987952,0.9837037037037037,0.9733333333333334,0.6696296296296296,49.7125,49.7125,1445.9852092104686,2.286382401477551,843.5123587614578,1831.1248971126734,0.015590602043407264,1225.4778125210285,0.9844093979565927,0.9712428193109254,0.5775174464774793 eval_results-global_step_20,36.8,36.8,749.3419117647059,0.2647058823529412,544.13,868.6511627906976,0.0,749.3419117647059,1.0,0.9963235294117647,0.45588235294117646,62.5,62.5,3341.225,11.925,2057.12,5481.4,0.025,3016.641025641026,0.975,0.925,0.85,72.1,72.1,622.5596421471173,0.936050364479788,561.6977491961414,780.1058263971463,0.0023194168323392977,586.8462304882099,0.9976805831676607,0.9804506295559974,0.6292246520874751,13.3,13.3,6496.2,11.333333333333334,1646.75,7242.2692307692305,0.2,4119.416666666667,0.8,0.7333333333333333,0.9666666666666667,23.3,23.3,4939.533333333334,30.4,3971.285714285714,5234.217391304348,0.03333333333333333,4558.068965517241,0.9666666666666667,0.8333333333333334,0.9333333333333333,93.5,93.5,381.9128127369219,0.0712661106899166,376.021897810219,466.3720930232558,0.0,381.9128127369219,1.0,0.9984836997725549,0.19787717968157695,81.4,81.4,1488.374,2.486,922.936117936118,3962.9247311827958,0.008,1370.9415322580646,0.992,0.98,0.586,48.3,48.3,2765.731851851852,6.060740740740741,1574.4110429447853,3878.541547277937,0.034074074074074076,2299.0153374233128,0.965925925925926,0.9525925925925925,0.8340740740740741,53.9,53.9,2598.109818979241,7.93463705394959,1456.7940652716222,3489.3102478431765,0.03784085302996834,2135.2730603120185,0.9621591469700317,0.924939639749947,0.681632282348038 eval_results-global_step_30,36.8,36.8,1043.0625,3.073529411764706,695.07,1245.3837209302326,0.007352941176470588,930.9962962962964,0.9926470588235294,0.9926470588235294,0.5661764705882353,70.0,70.0,3201.2,8.175,2237.4285714285716,5450.0,0.025,2873.25641025641,0.975,0.95,0.8,78.1,78.1,765.3389662027834,1.4532803180914513,657.6355536699194,1149.3888048411497,0.003644797879390325,709.4845360824743,0.9963552021206097,0.9804506295559974,0.6726308813783963,16.7,16.7,7676.766666666666,21.766666666666666,1997.4,8812.64,0.16666666666666666,6022.24,0.8333333333333334,0.7,0.9666666666666667,26.7,26.7,5636.333333333333,19.233333333333334,3237.25,6508.727272727273,0.06666666666666667,4902.642857142857,0.9333333333333333,0.8333333333333334,0.9666666666666667,91.7,91.7,464.3199393479909,0.18119787717968158,439.6575682382134,735.3818181818182,0.0,464.3199393479909,1.0,0.9969673995451099,0.26459438968915844,83.4,83.4,1690.934,2.582,1125.4604316546763,4531.9277108433735,0.01,1546.3030303030303,0.99,0.99,0.688,48.9,48.9,3462.4933333333333,10.435555555555556,1835.0363636363636,5019.191304347826,0.056296296296296296,2714.12715855573,0.9437037037037037,0.914074074074074,0.8622222222222222,56.537499999999994,56.537499999999994,2992.5560923605135,8.362570395323925,1528.117311078468,4181.580078983959,0.04195342108568632,2520.4212784980987,0.9580465789143137,0.9196840619165055,0.7233696621514182 eval_results-global_step_40,36.4,36.4,975.8639705882352,0.6286764705882353,745.4646464646464,1107.7109826589594,0.0,975.8639705882352,1.0,0.9963235294117647,0.5441176470588235,67.5,67.5,3282.125,8.0,1868.5555555555557,6218.0,0.025,2955.948717948718,0.975,0.95,0.8,79.5,79.5,786.0828363154407,1.2647448641484427,724.7739783152628,1023.2096774193549,0.0023194168323392977,750.388575224178,0.9976805831676607,0.9797879390324719,0.7024519549370444,23.3,23.3,7061.666666666667,25.966666666666665,2573.1428571428573,8427.739130434782,0.2,4827.333333333333,0.8,0.7333333333333333,1.0,20.0,20.0,6232.8,24.766666666666666,2844.5,7079.875,0.16666666666666666,4287.32,0.8333333333333334,0.8,0.9666666666666667,93.6,93.6,458.33965125094767,0.14935557240333586,449.0680713128039,592.9411764705883,0.0,458.33965125094767,1.0,0.9984836997725549,0.2918877937831691,84.6,84.6,1762.144,3.422,1090.9810874704492,5449.181818181818,0.012,1588.7105263157894,0.988,0.978,0.678,48.1,48.1,3415.6711111111113,8.457777777777778,1656.1076923076923,5049.551428571429,0.054814814814814816,2685.896551724138,0.9451851851851852,0.9214814814814815,0.8755555555555555,56.625,56.625,2996.83665449155,9.08198600228139,1494.0742360711586,4368.526151717117,0.0576001122892276,2316.2251657981674,0.9423998877107724,0.9196762478789507,0.7323349522501574 eval_results-global_step_50,36.8,36.8,1181.3419117647059,3.0955882352941178,845.37,1376.6744186046512,0.003676470588235294,1126.719557195572,0.9963235294117647,0.9816176470588235,0.5955882352941176,75.0,75.0,3588.575,9.35,1828.4333333333334,8869.0,0.0,3588.575,1.0,0.875,0.825,80.0,80.0,814.1610337972166,1.739562624254473,745.4556752278376,1088.7549668874171,0.0033134526176275677,763.7563164893617,0.9966865473823724,0.9774685222001326,0.7203445990722332,20.0,20.0,6118.866666666667,15.466666666666667,3677.6666666666665,6729.166666666667,0.13333333333333333,4597.615384615385,0.8666666666666667,0.8,0.9666666666666667,23.3,23.3,5266.633333333333,12.366666666666667,3300.0,5865.173913043478,0.03333333333333333,4897.0,0.9666666666666667,0.9,1.0,93.7,93.7,457.8339651250948,0.11827141774071266,448.87783171521033,591.2048192771084,0.0,457.8339651250948,1.0,0.9992418498862775,0.287338893100834,85.4,85.4,1685.964,3.682,1108.4496487119438,5064.027397260274,0.014,1482.6997971602434,0.986,0.974,0.666,51.0,51.0,3449.077037037037,8.59851851851852,1751.0029069767443,5213.842900302115,0.05333333333333334,2740.622848200313,0.9466666666666667,0.9318518518518518,0.8740740740740741,58.150000000000006,58.150000000000006,2820.3066184655063,6.802159266142645,1713.157007828967,4349.730635255213,0.03012374040073286,2456.8528585982463,0.969876259599267,0.9298974838746358,0.7418765585259908 eval_results-global_step_60,37.5,37.5,1045.2610294117646,0.6875,805.2352941176471,1189.2764705882353,0.0,1045.2610294117646,1.0,0.9963235294117647,0.6139705882352942,65.0,65.0,3065.25,5.85,1716.8076923076924,5569.5,0.025,2734.5128205128203,0.975,0.925,0.875,79.3,79.3,802.0414181577204,1.7978793903247183,720.0258980785296,1116.6971153846155,0.0023194168323392977,766.614413816008,0.9976805831676607,0.9797879390324719,0.7190192180251822,30.0,30.0,5753.466666666666,42.0,2277.4444444444443,7243.190476190476,0.1,4612.888888888889,0.9,0.8333333333333334,1.0,16.7,16.7,6363.6,29.966666666666665,1694.4,7297.44,0.1,5290.925925925926,0.9,0.8333333333333334,0.9,93.4,93.4,465.0614101592115,0.26914329037149354,437.96915584415586,848.7126436781609,0.000758150113722517,453.1449165402124,0.9992418498862775,0.9984836997725549,0.310841546626232,82.6,82.6,1628.972,2.358,1079.7772397094432,4236.068965517241,0.008,1513.1532258064517,0.992,0.984,0.68,50.2,50.2,3312.311111111111,9.139259259259259,1817.2625368731563,4820.708333333333,0.034074074074074076,2864.814417177914,0.965925925925926,0.9303703703703704,0.8711111111111111,56.8375,56.8375,2804.495454438309,11.508556075827768,1318.6152826718835,4040.199250586508,0.033768955127516986,2410.164454759998,0.966231044872483,0.9350790256567286,0.7462428079997275 eval_results-global_step_70,40.8,40.8,1070.0698529411766,0.6875,785.4504504504505,1266.2981366459628,0.0,1070.0698529411766,1.0,0.9926470588235294,0.5845588235294118,72.5,72.5,2952.05,6.55,1982.4137931034484,5508.363636363636,0.025,2617.6153846153848,0.975,0.975,0.85,78.2,78.2,819.4668654738238,1.6358515573227304,735.9610004239084,1118.3899848254932,0.003976143141153081,759.0133067198935,0.9960238568588469,0.9774685222001326,0.7077534791252486,20.0,20.0,5749.833333333333,19.566666666666666,1802.5,6736.666666666667,0.13333333333333333,4170.076923076923,0.8666666666666667,0.8,0.9666666666666667,20.0,20.0,6076.033333333334,26.633333333333333,2108.5,7067.916666666667,0.13333333333333333,4569.2692307692305,0.8666666666666667,0.7666666666666667,1.0,93.4,93.4,442.3563305534496,0.11448066717210008,435.9862012987013,532.5632183908046,0.0,442.3563305534496,1.0,0.9992418498862775,0.2699014404852161,84.6,84.6,1716.186,6.8,1041.2033096926714,5424.207792207792,0.018,1453.529531568228,0.982,0.974,0.662,50.1,50.1,3079.0755555555556,8.274074074074074,1694.792899408284,4467.46587537092,0.035555555555555556,2602.9001536098312,0.9644444444444444,0.9481481481481482,0.8696296296296296,57.45,57.45,2738.133908898834,8.782738287321113,1323.3509567971828,4015.233997142243,0.04364979567042192,2210.603839231765,0.9563502043295781,0.9291465307155944,0.7388137549295217 eval_results-global_step_80,36.4,36.4,1121.7132352941176,0.7757352941176471,831.2525252525253,1287.9306358381502,0.003676470588235294,1068.830258302583,0.9963235294117647,0.9963235294117647,0.5808823529411765,67.5,67.5,3409.775,6.65,2261.740740740741,5794.153846153846,0.0,3409.775,1.0,0.95,0.775,79.4,79.4,822.2004638833665,1.6693174287607688,724.3124739257405,1200.038647342995,0.003644797879390325,766.9015630196209,0.9963552021206097,0.9777998674618953,0.7239893969516236,30.0,30.0,6118.966666666666,16.4,2107.3333333333335,7838.238095238095,0.16666666666666666,4153.92,0.8333333333333334,0.8,1.0,20.0,20.0,6597.433333333333,38.6,4887.333333333333,7024.958333333333,0.1,5542.666666666667,0.9,0.7666666666666667,0.9333333333333333,92.6,92.6,475.15238817285825,0.16300227445034116,450.36497545008183,787.4226804123712,0.0,475.15238817285825,1.0,0.9984836997725549,0.2767247915087187,89.2,89.2,1553.866,2.588,1125.4035874439462,5092.648148148148,0.004,1495.8875502008032,0.996,0.984,0.684,50.8,50.8,3215.7614814814815,8.687407407407408,1759.9825072886297,4719.774096385542,0.037037037037037035,2723.2046153846154,0.9629629629629629,0.9392592592592592,0.8696296296296296,58.2375,58.2375,2914.3585711039777,9.44168280059202,1768.4654345960412,4218.14556035656,0.03937812152141617,2454.5422552183936,0.9606218784785839,0.9265666278215176,0.7304449380455603 eval_results-global_step_90,40.8,40.8,1174.1066176470588,1.411764705882353,899.7207207207207,1363.27950310559,0.0,1174.1066176470588,1.0,0.9852941176470589,0.6102941176470589,70.0,70.0,3502.025,9.4,1884.3214285714287,7276.666666666667,0.025,3180.3076923076924,0.975,0.925,0.875,79.1,79.1,839.7773359840954,1.7491716368455932,740.828655215752,1214.0887480190174,0.003644797879390325,784.0941137346192,0.9963552021206097,0.9777998674618953,0.7213386348575216,26.7,26.7,5584.533333333334,13.833333333333334,3066.0,6500.363636363636,0.03333333333333333,5225.3448275862065,0.9666666666666667,0.9333333333333333,0.9666666666666667,16.7,16.7,3947.766666666667,10.033333333333333,2029.2,4331.48,0.0,3947.766666666667,1.0,0.9333333333333333,0.9666666666666667,93.8,93.8,485.72934040940106,0.3388931008339651,461.7259498787389,847.829268292683,0.000758150113722517,473.48406676783003,0.9992418498862775,0.9984836997725549,0.3055344958301744,86.2,86.2,1557.568,2.224,1124.4037122969837,4263.275362318841,0.004,1499.694779116466,0.996,0.982,0.668,51.1,51.1,3165.311111111111,8.044444444444444,1808.431884057971,4583.866666666667,0.03851851851851852,2651.697996918336,0.9614814814814815,0.9466666666666667,0.8681481481481481,58.05,58.05,2532.102175643958,5.879367569334128,1501.8290438426995,3797.6062314291376,0.013156849980620588,2367.0620950931097,0.9868431500193795,0.9602388772768553,0.7477060912270295 eval_results-global_step_100,37.9,37.9,1185.8088235294117,2.9595588235294117,841.0970873786408,1395.8994082840236,0.007352941176470588,1076.9592592592592,0.9926470588235294,0.9852941176470589,0.5698529411764706,67.5,67.5,3563.375,14.575,1730.3703703703704,7370.384615384615,0.05,2908.5789473684213,0.95,0.925,0.925,77.6,77.6,821.2372432074221,1.5374420145791916,759.898804440649,1033.7440828402366,0.0023194168323392977,786.0315509797409,0.9976805831676607,0.9781312127236581,0.7256461232604374,13.3,13.3,6191.033333333334,12.3,1540.5,6906.5,0.1,5103.148148148148,0.9,0.8,1.0,26.7,26.7,5226.666666666667,14.4,2493.875,6220.409090909091,0.06666666666666667,4462.285714285715,0.9333333333333333,0.8666666666666667,0.9333333333333333,93.6,93.6,488.1925701288855,0.2850644427596664,463.0,853.9294117647058,0.0,488.1925701288855,1.0,0.9977255496588324,0.3062926459438969,86.0,86.0,1495.094,2.358,1095.7116279069767,3948.442857142857,0.002,1466.0901803607214,0.998,0.988,0.664,50.4,50.4,3217.1451851851853,8.002962962962963,1699.479411764706,4757.462686567164,0.03259259259259259,2785.924961715161,0.9674074074074074,0.9392592592592592,0.8770370370370371,56.625,56.625,2773.5691027563635,7.052253530478904,1327.9915377326677,4060.8465191115865,0.03261645215850864,2384.6514165307563,0.9673835478414913,0.9350096007444344,0.7501452600938968 eval_results-global_step_110,39.7,39.7,1113.4375,0.9852941176470589,888.6018518518518,1261.5,0.0,1113.4375,1.0,0.9963235294117647,0.5845588235294118,70.0,70.0,2832.05,4.7,1878.4642857142858,5057.083333333333,0.0,2832.05,1.0,1.0,0.9,78.4,78.4,822.2369118621604,1.6494367130550034,729.3629066328687,1159.921658986175,0.0023194168323392977,786.971438060445,0.9976805831676607,0.9777998674618953,0.7292909211398277,26.7,26.7,5703.466666666666,23.133333333333333,1825.75,7113.545454545455,0.06666666666666667,4974.607142857143,0.9333333333333333,0.9333333333333333,0.9666666666666667,20.0,20.0,4268.366666666667,16.766666666666666,2227.8333333333335,4778.5,0.03333333333333333,3860.0,0.9666666666666667,0.9,0.9333333333333333,93.6,93.6,487.8097043214556,0.23805913570887036,473.3962722852512,697.0588235294117,0.0,487.8097043214556,1.0,0.9984836997725549,0.3062926459438969,85.6,85.6,1564.606,2.298,1127.6004672897195,4162.361111111111,0.008,1448.1935483870968,0.992,0.986,0.668,52.0,52.0,2840.131851851852,6.022222222222222,1645.5982905982905,4134.20987654321,0.013333333333333334,2662.214714714715,0.9866666666666667,0.9688888888888889,0.8785185185185185,58.25,58.25,2454.0131626711004,6.9741265235791445,1349.5759259632,3545.5225322560873,0.015456593770709081,2270.660506042607,0.9845434062292909,0.9701036648585546,0.7458326136414569 eval_results-global_step_120,43.0,43.0,1296.889705882353,1.8235294117647058,864.6837606837607,1623.1354838709678,0.007352941176470588,1187.5777777777778,0.9926470588235294,0.9742647058823529,0.6286764705882353,67.5,67.5,2712.075,5.35,1855.888888888889,4490.307692307692,0.025,2371.128205128205,0.975,0.975,0.875,77.5,77.5,818.4774685222002,1.634857521537442,728.316509837468,1128.4720588235293,0.0026507620941020544,778.1395348837209,0.9973492379058979,0.9768058316766071,0.7226640159045725,20.0,20.0,5528.6,14.6,1503.1666666666667,6534.958333333333,0.1,4365.7037037037035,0.9,0.8333333333333334,1.0,13.3,13.3,4524.0,15.4,1559.25,4980.115384615385,0.0,4524.0,1.0,0.9333333333333333,0.9666666666666667,93.9,93.9,529.7763457164518,0.5375284306292646,489.9668820678514,1138.2222222222222,0.001516300227445034,506.18602885345484,0.9984836997725549,0.9977255496588324,0.3252463987869598,86.0,86.0,1580.476,2.846,1108.6953488372094,4478.557142857143,0.006,1493.486921529175,0.994,0.988,0.644,52.9,52.9,2823.6192592592593,5.832592592592593,1662.2941176470588,4127.37106918239,0.025185185185185185,2482.6854103343467,0.9748148148148148,0.96,0.8548148148148148,56.7625,56.7625,2476.7392224225327,6.003063494565501,1221.532771828613,3562.642423401583,0.02096314858540036,2213.613447776298,0.9790368514145996,0.9548078442355573,0.7521335458451561