[ { "epoch": 0.02, "learning_rate": 0.0002, "loss": 0.6769, "step": 1 }, { "epoch": 0.04, "learning_rate": 0.0002, "loss": 0.6892, "step": 2 }, { "epoch": 0.05, "learning_rate": 0.0002, "loss": 0.6882, "step": 3 }, { "epoch": 0.07, "learning_rate": 0.0002, "loss": 0.7043, "step": 4 }, { "epoch": 0.09, "learning_rate": 0.0002, "loss": 0.6683, "step": 5 }, { "epoch": 0.11, "learning_rate": 0.0002, "loss": 0.6584, "step": 6 }, { "epoch": 0.12, "learning_rate": 0.0002, "loss": 0.6654, "step": 7 }, { "epoch": 0.14, "learning_rate": 0.0002, "loss": 0.6539, "step": 8 }, { "epoch": 0.16, "learning_rate": 0.0002, "loss": 0.6895, "step": 9 }, { "epoch": 0.18, "learning_rate": 0.0002, "loss": 0.6756, "step": 10 }, { "epoch": 0.19, "learning_rate": 0.0002, "loss": 0.6878, "step": 11 }, { "epoch": 0.21, "learning_rate": 0.0002, "loss": 0.6774, "step": 12 }, { "epoch": 0.23, "learning_rate": 0.0002, "loss": 0.6806, "step": 13 }, { "epoch": 0.25, "learning_rate": 0.0002, "loss": 0.6656, "step": 14 }, { "epoch": 0.26, "learning_rate": 0.0002, "loss": 0.6541, "step": 15 }, { "epoch": 0.28, "learning_rate": 0.0002, "loss": 0.6613, "step": 16 }, { "epoch": 0.3, "learning_rate": 0.0002, "loss": 0.6425, "step": 17 }, { "epoch": 0.32, "learning_rate": 0.0002, "loss": 0.6313, "step": 18 }, { "epoch": 0.33, "learning_rate": 0.0002, "loss": 0.6138, "step": 19 }, { "epoch": 0.35, "learning_rate": 0.0002, "loss": 0.6077, "step": 20 }, { "epoch": 0.37, "learning_rate": 0.0002, "loss": 0.629, "step": 21 }, { "epoch": 0.39, "learning_rate": 0.0002, "loss": 0.5646, "step": 22 }, { "epoch": 0.4, "learning_rate": 0.0002, "loss": 0.5411, "step": 23 }, { "epoch": 0.42, "learning_rate": 0.0002, "loss": 0.5716, "step": 24 }, { "epoch": 0.44, "learning_rate": 0.0002, "loss": 0.5115, "step": 25 }, { "epoch": 0.44, "eval_math_accuracy": 0.8093333333333333, "eval_math_average_probability": 0.6316643953323364, "eval_math_brier_score": 0.16190247237682343, "eval_math_loss": 0.4996137022972107, "eval_math_probabilities": [ 0.6633706092834473, 0.6084541082382202, 0.6621570587158203, 0.5422595143318176, 0.5795955061912537, 0.5662304759025574, 0.7143477201461792, 0.7680655717849731, 0.8372054100036621, 0.8936382532119751, 0.5472975969314575, 0.7134534120559692, 0.5641617774963379, 0.3191520869731903, 0.5099648833274841, 0.5377236008644104, 0.5142484307289124, 0.5110278725624084, 0.5240746140480042, 0.5794618725776672, 0.6070640683174133, 0.5101079940795898, 0.4745468199253082, 0.5221819877624512, 0.3646273612976074, 0.8507652282714844, 0.7823563814163208, 0.5775850415229797, 0.5282427072525024, 0.7187538743019104, 0.4172961115837097, 0.40366026759147644, 0.3604571521282196, 0.5117679834365845, 0.6709480285644531, 0.5679401755332947, 0.7527113556861877, 0.8291309475898743, 0.8854144811630249, 0.4780143201351166, 0.4241604804992676, 0.414424866437912, 0.9701191782951355, 0.9443850517272949, 0.9474314451217651, 0.5658140778541565, 0.534233808517456, 0.4676360487937927, 0.8589262366294861, 0.8720059394836426, 0.7007182836532593, 0.5339250564575195, 0.43697527050971985, 0.5275648832321167, 0.5365013480186462, 0.5904162526130676, 0.6352012157440186, 0.7782678008079529, 0.6769214272499084, 0.8178733587265015, 0.6039867997169495, 0.48236700892448425, 0.49095991253852844, 0.8245977163314819, 0.8284160494804382, 0.8404079079627991, 0.2851916551589966, 0.6111747622489929, 0.676672101020813, 0.7454131245613098, 0.7277416586875916, 0.8040912747383118, 0.5549920201301575, 0.5806645750999451, 0.5479379892349243, 0.9659104943275452, 0.9027314186096191, 0.8584287762641907, 0.612223207950592, 0.5742789506912231, 0.5742713809013367, 0.491126149892807, 0.5456624031066895, 0.5265108346939087, 0.4589597284793854, 0.7241318225860596, 0.7066437602043152, 0.47177252173423767, 0.5283196568489075, 0.5310873985290527, 0.9575446248054504, 0.8689523339271545, 0.984750509262085, 0.32476434111595154, 0.4359622895717621, 0.3557249903678894, 0.638299822807312, 0.7222625613212585, 0.7197080850601196, 0.5431556105613708, 0.5483987331390381, 0.5052368640899658, 0.7071025371551514, 0.7415751218795776, 0.7538554668426514, 0.78269362449646, 0.6718623638153076, 0.8567298054695129, 0.7432538270950317, 0.7464526295661926, 0.6677084565162659, 0.5891859531402588, 0.521098256111145, 0.5279675126075745, 0.5480110049247742, 0.5089955925941467, 0.49596890807151794, 0.8053426146507263, 0.8310225009918213, 0.7393491268157959, 0.9657951593399048, 0.7804853916168213, 0.826735258102417, 0.8840931057929993, 0.8941786289215088, 0.939432680606842, 0.5693816542625427, 0.7250611186027527, 0.8192509412765503, 0.9043412804603577, 0.9025180339813232, 0.8790348768234253, 0.9226536154747009, 0.8933433294296265, 0.802139163017273, 0.6052137017250061, 0.45218783617019653, 0.5514125227928162, 0.7218031287193298, 0.6621291041374207, 0.8381228446960449, 0.38562554121017456, 0.5712605714797974, 0.5857917666435242, 0.6015986800193787, 0.6676840782165527, 0.6247783303260803, 0.7702241539955139, 0.7300885915756226, 0.81181800365448, 0.5603957772254944, 0.6586405634880066, 0.7729614973068237, 0.7636373043060303, 0.7508606314659119, 0.7786847949028015, 0.5471927523612976, 0.5218795537948608, 0.533657431602478, 0.5127111077308655, 0.49687081575393677, 0.5163062810897827, 0.24398064613342285, 0.1453399658203125, 0.7341935634613037, 0.9984416365623474, 0.5174273252487183, 0.7952530384063721, 0.5069570541381836, 0.22518883645534515, 0.5297511219978333, 0.5534253716468811, 0.5073737502098083, 0.529682993888855, 0.6464091539382935, 0.6554543375968933, 0.5762879252433777, 0.43460413813591003, 0.5502632260322571, 0.4922613203525543, 0.502454936504364, 0.4942191243171692, 0.528808057308197, 0.8252964019775391, 0.5230216979980469, 0.8004457354545593, 0.8501718044281006, 0.7722131013870239, 0.8783368468284607, 0.7852928638458252, 0.8217051029205322, 0.8546723127365112, 0.6047033071517944, 0.4482806921005249, 0.5512674450874329, 0.5168452262878418, 0.4414539635181427, 0.5040595531463623, 0.6588204503059387, 0.6542771458625793, 0.49029749631881714, 0.6382280588150024, 0.5566757917404175, 0.6693888902664185, 0.5557968616485596, 0.5821195244789124, 0.6247583627700806, 0.6291689872741699, 0.3955490291118622, 0.5351685285568237, 0.7561461925506592, 0.7327651977539062, 0.6058982610702515, 0.8234307765960693, 0.8684364557266235, 0.7713478207588196, 0.6613808274269104, 0.4938766658306122, 0.6822813153266907, 0.2828020453453064, 0.7189218997955322, 0.28969606757164, 0.5664335489273071, 0.5806348323822021, 0.46697744727134705, 0.766159176826477, 0.8114504218101501, 0.8593038320541382, 0.7944024801254272, 0.4472806453704834, 0.4464675188064575, 0.6453775763511658, 0.5014820694923401, 0.5300639271736145, 0.995434582233429, 0.995976984500885, 0.9921278953552246, 0.5221747756004333, 0.5329358577728271, 0.5543885231018066, 0.6461371779441833, 0.5970206260681152, 0.4741358160972595, 0.6899920105934143, 0.8103334307670593, 0.8387188911437988, 0.5683832168579102, 0.638966977596283, 0.5058586597442627, 0.610042929649353, 0.5112279653549194, 0.4437251091003418, 0.6581318974494934, 0.6405580043792725, 0.6548277735710144, 0.5708030462265015, 0.6149079203605652, 0.6979327201843262, 0.525466799736023, 0.7948253154754639, 0.45318952202796936, 0.6075907349586487, 0.6899601817131042, 0.6856037974357605, 0.5278491973876953, 0.5578742623329163, 0.6113816499710083, 0.5754520297050476, 0.6663941144943237, 0.6446453928947449, 0.6343801021575928, 0.452676922082901, 0.6900813579559326, 0.6203823685646057, 0.49684879183769226, 0.5552070140838623, 0.5284071564674377, 0.5662087202072144, 0.5621691942214966, 0.4604977071285248, 0.5431878566741943, 0.5537838935852051, 0.7452890872955322, 0.7336522936820984, 0.7229248881340027, 0.9484919309616089, 0.946052074432373, 0.9606884121894836, 0.6328964829444885, 0.592518150806427, 0.6761943697929382, 0.6664173603057861, 0.665858268737793, 0.6252132654190063, 0.7971418499946594, 0.7664545178413391, 0.6764003038406372, 0.546024739742279, 0.5096439123153687, 0.4163995087146759, 0.996208667755127, 0.722212553024292, 0.7535108923912048, 0.5323713421821594, 0.48590973019599915, 0.5106146335601807, 0.5493354797363281, 0.7133362293243408, 0.5568097233772278, 0.8456324338912964, 0.849081814289093, 0.6895979046821594, 0.48037657141685486, 0.5182946920394897, 0.43588948249816895, 0.3302757740020752, 0.2659425139427185, 0.3164568841457367, 0.6335851550102234, 0.6728842854499817, 0.5911792516708374, 0.6177258491516113, 0.6103651523590088, 0.6178369522094727, 0.5563710927963257, 0.7658647298812866, 0.532772421836853, 0.6550226807594299, 0.7330681085586548, 0.6204957962036133, 0.7628816962242126, 0.825613260269165, 0.7782942652702332, 0.8581648468971252, 0.9153120517730713, 0.8967598080635071, 0.9768906831741333, 0.9605985283851624, 0.6297731995582581, 0.4935714304447174, 0.4640754461288452, 0.538644552230835, 0.5147488117218018, 0.5108230710029602, 0.5612874627113342, 0.6789100170135498, 0.2105802744626999, 0.6954947113990784, 0.7572029232978821, 0.7281805872917175, 0.7502058148384094, 0.6394172310829163, 0.6887081265449524, 0.6412500739097595, 0.8335980176925659, 0.7932922840118408, 0.8053995370864868, 0.8746823668479919, 0.946009635925293, 0.9517281651496887, 0.4339127242565155, 0.247321218252182, 0.2145976573228836, 0.490614116191864, 0.5368684530258179, 0.2451506108045578, 0.7408210635185242, 0.7774543166160583, 0.7593271732330322, 0.8091133236885071, 0.7974509000778198, 0.6612302660942078, 0.568977415561676, 0.5250735878944397, 0.501058042049408, 0.5868458151817322, 0.4874229431152344, 0.5369607210159302, 0.9366500377655029, 0.8851487636566162, 0.9130953550338745, 0.9901278614997864, 0.9322760701179504, 0.9541032910346985, 0.7118127346038818, 0.7448193430900574, 0.38498297333717346, 0.5693628191947937, 0.5145847797393799, 0.5033568739891052, 0.4743233025074005, 0.5364457368850708, 0.5033722519874573, 0.6601943969726562, 0.5644096732139587, 0.6229737997055054, 0.5048108100891113, 0.5609506368637085, 0.6200689077377319, 0.45839062333106995, 0.36859121918678284, 0.30953899025917053, 0.5259954929351807, 0.5694190859794617, 0.47615528106689453, 0.5118966698646545, 0.6567121148109436, 0.6480826139450073, 0.630197286605835, 0.631337583065033, 0.6863037347793579, 0.612686276435852, 0.5603938102722168, 0.5180266499519348, 0.6630816459655762, 0.5433847308158875, 0.6935270428657532, 0.6154450178146362, 0.6265705227851868, 0.7286648750305176, 0.5883929133415222, 0.6429011821746826, 0.554049551486969, 0.48778167366981506, 0.5924201011657715, 0.48124057054519653, 0.674160897731781, 0.8663924932479858, 0.7650707960128784, 0.7101995348930359, 0.7014365792274475, 0.7146080136299133, 0.7302005290985107, 0.5496945381164551, 0.5789515972137451, 0.8068313002586365, 0.6710797548294067, 0.7141956686973572, 0.7880030274391174, 0.8896335363388062, 0.8554779291152954, 0.8726771473884583, 0.8157098889350891, 0.7947221398353577, 0.7519100904464722, 0.889167845249176, 0.7569870352745056, 0.6813006401062012, 0.598541796207428, 0.6031305193901062, 0.8224567174911499, 0.8584598898887634, 0.7914873361587524, 0.8087180852890015, 0.8671677708625793, 0.8095394372940063, 0.4693150818347931, 0.688112199306488, 0.6655168533325195, 0.4120429754257202, 0.7080686688423157, 0.4526786208152771, 0.871704638004303, 0.8860160708427429, 0.8748094439506531, 0.6092134118080139, 0.5118093490600586, 0.5536448955535889, 0.3988867700099945, 0.48200905323028564, 0.45835474133491516, 0.8484293818473816, 0.8654550909996033, 0.856299102306366, 0.11021721363067627, 0.12135862559080124, 0.1365855485200882, 0.4336954951286316, 0.3255397379398346, 0.43762141466140747, 0.5077228546142578, 0.492169052362442, 0.48603418469429016, 0.7614470720291138, 0.7657009363174438, 0.6895551085472107, 0.6581164002418518, 0.8547004461288452, 0.732698380947113, 0.5182932615280151, 0.5941303372383118, 0.6399956345558167, 0.5698806047439575, 0.6200894117355347, 0.6388326287269592, 0.8974776864051819, 0.8787057399749756, 0.9896037578582764, 0.4779830873012543, 0.4539029002189636, 0.497659295797348, 0.4199877977371216, 0.33673661947250366, 0.6004912257194519, 0.7042511105537415, 0.7038925290107727, 0.6664761900901794, 0.47931572794914246, 0.5875719785690308, 0.5820919275283813, 0.5624472498893738, 0.7421032786369324, 0.3863491714000702, 0.7999858260154724, 0.7563070058822632, 0.8077383041381836, 0.8360069990158081, 0.6688551902770996, 0.8388704657554626, 0.8339889645576477, 0.6518611311912537, 0.6413933634757996, 0.6234366297721863, 0.5850790739059448, 0.7071154117584229, 0.5823634266853333, 0.5551979541778564, 0.7558367848396301, 0.3279586136341095, 0.8189963698387146, 0.4095887839794159, 0.516676664352417, 0.5830307602882385, 0.493702232837677, 0.5616060495376587, 0.6221363544464111, 0.5668870210647583, 0.5192185640335083, 0.513372540473938, 0.5240103602409363, 0.5719670057296753, 0.6559074521064758, 0.5998367071151733, 0.8956224918365479, 0.8256760835647583, 0.8396532535552979, 0.6912676095962524, 0.7078823447227478, 0.6742523312568665, 0.44555383920669556, 0.4864961802959442, 0.5093259215354919, 0.420614093542099, 0.4558805823326111, 0.5098426938056946, 0.44671303033828735, 0.3890758156776428, 0.4822029769420624, 0.6569315195083618, 0.6540688276290894, 0.6102049350738525, 0.4973224997520447, 0.4408690333366394, 0.3441625237464905, 0.5234178304672241, 0.5053881406784058, 0.5077328085899353, 0.6272447109222412, 0.6202148795127869, 0.6250457763671875, 0.5505877137184143, 0.7488998174667358, 0.7229215502738953, 0.967279314994812, 0.8379192352294922, 0.8255277276039124, 0.7062957882881165, 0.7849461436271667, 0.7417415976524353, 0.20129697024822235, 0.659896731376648, 0.6498774886131287, 0.6354400515556335, 0.8480803370475769, 0.7202244400978088, 0.6372606158256531, 0.6529891490936279, 0.516423225402832, 0.6023105382919312, 0.6697197556495667, 0.6567447185516357, 0.5339287519454956, 0.46531304717063904, 0.4897252023220062, 0.6884264349937439, 0.7071057558059692, 0.8095695972442627, 0.4459150731563568, 0.3937334418296814, 0.40751639008522034, 0.5066817402839661, 0.5337297916412354, 0.5636802315711975, 0.833284318447113, 0.43843793869018555, 0.9899227023124695, 0.5373814105987549, 0.649697482585907, 0.511232316493988, 0.611300528049469, 0.5401736497879028, 0.548761785030365, 0.5708224177360535, 0.5487539768218994, 0.5448604226112366, 0.7356581091880798, 0.6940728425979614, 0.7854553461074829, 0.5545613765716553, 0.519231915473938, 0.5373342037200928, 0.49752581119537354, 0.520611584186554, 0.5338495969772339, 0.5593573451042175, 0.6815086007118225, 0.5781393647193909, 0.5679507851600647, 0.6038490533828735, 0.4746713638305664, 0.7259525060653687, 0.5200871825218201, 0.7806335687637329, 0.49713173508644104, 0.5273850560188293, 0.46150845289230347, 0.5906476974487305, 0.7053019404411316, 0.6652464866638184, 0.7277405858039856, 0.5937675833702087, 0.7591066956520081, 0.5191434621810913, 0.33489516377449036, 0.38055187463760376, 0.56748366355896, 0.6505720019340515, 0.4614139795303345, 0.8687284588813782, 0.7884291410446167, 0.8243569731712341, 0.5583450794219971, 0.5858427286148071, 0.7323949337005615, 0.668289303779602, 0.5550376176834106, 0.48988860845565796, 0.3248864710330963, 0.6118786334991455, 0.4166000783443451, 0.6086819767951965, 0.5723824501037598, 0.5568788647651672, 0.5895213484764099, 0.5719113945960999, 0.8764314651489258, 0.49615979194641113, 0.6165228486061096, 0.4922025203704834, 0.4707225263118744, 0.4362126290798187, 0.48726609349250793, 0.7922884821891785, 0.7094277739524841, 0.4740876853466034, 0.9792476892471313, 0.8020926117897034, 0.7029873728752136, 0.6756966710090637, 0.7588812708854675, 0.7846832871437073, 0.55971360206604, 0.5519441366195679, 0.5215198993682861, 0.751953125, 0.8236594200134277, 0.7258154153823853, 0.6511673331260681, 0.5037521719932556, 0.5392888784408569, 0.624679446220398, 0.7061256766319275, 0.6218675971031189, 0.34532469511032104, 0.8460456132888794, 0.6841530203819275, 0.7520891427993774, 0.6842833757400513, 0.6804845929145813, 0.6963101029396057, 0.7662405967712402, 0.7594859600067139, 0.8005949258804321, 0.5491482019424438, 0.6408277153968811, 0.43373754620552063, 0.3303249180316925, 0.41782644391059875, 0.6935751438140869, 0.6947365403175354, 0.7085362076759338, 0.9792237281799316, 0.4461096525192261, 0.5915313363075256, 0.49463775753974915, 0.69148188829422, 0.5705913305282593, 0.5716133117675781, 0.4339978098869324, 0.4441128969192505, 0.5309861302375793, 0.5180039405822754, 0.41510868072509766, 0.7265142202377319, 0.7004600167274475, 0.7797722816467285, 0.8555888533592224, 0.6555377840995789, 0.725948691368103, 0.5199047327041626, 0.5478607416152954, 0.49339625239372253, 0.8818256258964539, 0.9065577387809753, 0.886340856552124, 0.9988778233528137, 0.8997090458869934, 0.5748993158340454, 0.5227178335189819, 0.49822187423706055, 0.39820119738578796, 0.4866050183773041, 0.5304800271987915, 0.5495126247406006, 0.807094395160675, 0.8251957893371582, 0.8757453560829163, 0.4887425899505615, 0.4169941544532776, 0.42122045159339905 ], "eval_math_runtime": 201.2353, "eval_math_samples_per_second": 3.727, "eval_math_score": -0.16190247237682343, "eval_math_steps_per_second": 0.119, "step": 25 }, { "epoch": 0.46, "learning_rate": 0.0002, "loss": 0.4395, "step": 26 }, { "epoch": 0.47, "learning_rate": 0.0002, "loss": 0.5106, "step": 27 }, { "epoch": 0.49, "learning_rate": 0.0002, "loss": 0.3161, "step": 28 }, { "epoch": 0.51, "learning_rate": 0.0002, "loss": 0.3613, "step": 29 }, { "epoch": 0.53, "learning_rate": 0.0002, "loss": 0.3076, "step": 30 }, { "epoch": 0.54, "learning_rate": 0.0002, "loss": 0.4935, "step": 31 }, { "epoch": 0.56, "learning_rate": 0.0002, "loss": 0.3821, "step": 32 }, { "epoch": 0.58, "learning_rate": 0.0002, "loss": 0.3508, "step": 33 }, { "epoch": 0.6, "learning_rate": 0.0002, "loss": 0.3412, "step": 34 }, { "epoch": 0.61, "learning_rate": 0.0002, "loss": 0.3594, "step": 35 }, { "epoch": 0.63, "learning_rate": 0.0002, "loss": 0.2907, "step": 36 }, { "epoch": 0.65, "learning_rate": 0.0002, "loss": 0.3608, "step": 37 }, { "epoch": 0.67, "learning_rate": 0.0002, "loss": 0.2533, "step": 38 }, { "epoch": 0.68, "learning_rate": 0.0002, "loss": 0.6468, "step": 39 }, { "epoch": 0.7, "learning_rate": 0.0002, "loss": 0.4454, "step": 40 }, { "epoch": 0.72, "learning_rate": 0.0002, "loss": 0.3902, "step": 41 }, { "epoch": 0.74, "learning_rate": 0.0002, "loss": 0.2721, "step": 42 }, { "epoch": 0.75, "learning_rate": 0.0002, "loss": 0.2142, "step": 43 }, { "epoch": 0.77, "learning_rate": 0.0002, "loss": 0.2937, "step": 44 }, { "epoch": 0.79, "learning_rate": 0.0002, "loss": 0.2849, "step": 45 }, { "epoch": 0.81, "learning_rate": 0.0002, "loss": 0.411, "step": 46 }, { "epoch": 0.82, "learning_rate": 0.0002, "loss": 0.2435, "step": 47 }, { "epoch": 0.84, "learning_rate": 0.0002, "loss": 0.4361, "step": 48 }, { "epoch": 0.86, "learning_rate": 0.0002, "loss": 0.3052, "step": 49 }, { "epoch": 0.88, "learning_rate": 0.0002, "loss": 0.4491, "step": 50 }, { "epoch": 0.88, "eval_math_accuracy": 0.8226666666666667, "eval_math_average_probability": 0.7686926126480103, "eval_math_brier_score": 0.12212485074996948, "eval_math_loss": 0.4135887026786804, "eval_math_probabilities": [ 0.9898386001586914, 0.989701509475708, 0.9890323877334595, 0.7907657027244568, 0.8535579442977905, 0.8342218399047852, 0.9967971444129944, 0.9915836453437805, 0.9907526969909668, 0.9095348119735718, 0.685765266418457, 0.7450512647628784, 0.8427234888076782, 0.07416536659002304, 0.849005937576294, 0.4998757243156433, 0.6111614108085632, 0.5562968254089355, 0.759619951248169, 0.3430194556713104, 0.4106164574623108, 0.5945573449134827, 0.42925503849983215, 0.5331234335899353, 0.15886452794075012, 0.9111754298210144, 0.7929478287696838, 0.8131201863288879, 0.492657333612442, 0.40756136178970337, 0.13238157331943512, 0.10109685361385345, 0.08083260804414749, 0.933353066444397, 0.996414303779602, 0.9881616234779358, 0.9957822561264038, 0.9940518736839294, 0.9911954402923584, 0.2327170968055725, 0.01113490667194128, 0.018342692404985428, 0.9984914064407349, 0.9973036050796509, 0.9729018807411194, 0.6485802531242371, 0.3493095636367798, 0.21032515168190002, 0.9995682835578918, 0.9996974468231201, 0.917833685874939, 0.760581910610199, 0.6432754397392273, 0.8091898560523987, 0.7844832539558411, 0.91327965259552, 0.9575035572052002, 0.9994388222694397, 0.9982775449752808, 0.9997504353523254, 0.7062922716140747, 0.5163776874542236, 0.37822097539901733, 0.6208543181419373, 0.6176100969314575, 0.8507413864135742, 0.014980330131947994, 0.8677336573600769, 0.9352487325668335, 0.7987423539161682, 0.8629010319709778, 0.9119073152542114, 0.7031856775283813, 0.7270292639732361, 0.8326331973075867, 0.9997046589851379, 0.9990344047546387, 0.9939823746681213, 0.9230589866638184, 0.8899773359298706, 0.8522449731826782, 0.7666754722595215, 0.925064206123352, 0.9242060780525208, 0.7928504943847656, 0.9327524304389954, 0.9656206369400024, 0.6054933667182922, 0.5640263557434082, 0.6491990685462952, 0.9995273351669312, 0.9980650544166565, 0.9995204210281372, 0.3472268581390381, 0.900184154510498, 0.4053606390953064, 0.6472825407981873, 0.8974281549453735, 0.9143079519271851, 0.8297086954116821, 0.8830797076225281, 0.7588180899620056, 0.9726789593696594, 0.9956698417663574, 0.9944221377372742, 0.9992859959602356, 0.9955989122390747, 0.9990593791007996, 0.9950889945030212, 0.9618326425552368, 0.9871684312820435, 0.6200104355812073, 0.34859955310821533, 0.3735411465167999, 0.5748960375785828, 0.4479866027832031, 0.37354394793510437, 0.9721567034721375, 0.9860655069351196, 0.943369448184967, 0.9999667406082153, 0.9997943043708801, 0.9998214840888977, 0.2377970963716507, 0.24083161354064941, 0.28463059663772583, 0.6217735409736633, 0.45513853430747986, 0.8604767322540283, 0.9780745506286621, 0.965714693069458, 0.9147642850875854, 0.9973574280738831, 0.994486391544342, 0.9889662861824036, 0.3105144798755646, 0.5582692623138428, 0.8071754574775696, 0.9759202003479004, 0.9769974946975708, 0.9922428727149963, 0.010290156118571758, 0.7487633228302002, 0.6738214492797852, 0.9265402555465698, 0.9943633079528809, 0.9860871434211731, 0.9998179078102112, 0.9991245865821838, 0.9998130202293396, 0.10651354491710663, 0.4311460256576538, 0.42624321579933167, 0.9993637204170227, 0.999885082244873, 0.9999722242355347, 0.4203025996685028, 0.7777973413467407, 0.5109290480613708, 0.6236875057220459, 0.652536153793335, 0.6703343391418457, 0.8993702530860901, 0.2166506052017212, 0.6708146929740906, 0.9999450445175171, 0.9875665903091431, 0.983705997467041, 0.6890847682952881, 0.0033774017356336117, 0.71236252784729, 0.42585477232933044, 0.5142151117324829, 0.5489001870155334, 0.9508610963821411, 0.95615553855896, 0.9065225720405579, 0.5782293677330017, 0.7067509293556213, 0.6561964750289917, 0.6433640718460083, 0.5444236993789673, 0.6337283849716187, 0.6197820901870728, 0.6850131154060364, 0.9942216277122498, 0.9998719692230225, 0.9998711347579956, 0.9998020529747009, 0.9969862103462219, 0.9975737929344177, 0.9990050196647644, 0.9077370762825012, 0.3920532464981079, 0.7660297751426697, 0.49212735891342163, 0.30620077252388, 0.7274808883666992, 0.9477325081825256, 0.9549977779388428, 0.5160512328147888, 0.992021918296814, 0.9007187485694885, 0.9917388558387756, 0.5693521499633789, 0.559917151927948, 0.6452479958534241, 0.9803745150566101, 0.48104679584503174, 0.5412415862083435, 0.8115394115447998, 0.9632490873336792, 0.7633785605430603, 0.8565756678581238, 0.9831998348236084, 0.9901072978973389, 0.9840487241744995, 0.31269630789756775, 0.9845069050788879, 0.42847204208374023, 0.7282599806785583, 0.36419183015823364, 0.5837609767913818, 0.8755786418914795, 0.039886802434921265, 0.9991896748542786, 0.9998026490211487, 0.9999561309814453, 0.9875608086585999, 0.6893495321273804, 0.5455873012542725, 0.8017504215240479, 0.4041386842727661, 0.8203705549240112, 0.9999384880065918, 0.9999490976333618, 0.9994640946388245, 0.5638045072555542, 0.7802672386169434, 0.7020519375801086, 0.8610048890113831, 0.7877287864685059, 0.5791395902633667, 0.9052756428718567, 0.9866493344306946, 0.990517795085907, 0.7134201526641846, 0.8382417559623718, 0.4695950150489807, 0.7814311385154724, 0.8124359250068665, 0.6940707564353943, 0.9722387194633484, 0.9818227291107178, 0.9952824711799622, 0.6443295478820801, 0.7161229848861694, 0.9299699664115906, 0.5648988485336304, 0.7591490149497986, 0.1656244844198227, 0.8433585166931152, 0.9723582863807678, 0.9616088271141052, 0.6606411933898926, 0.7480043172836304, 0.900150716304779, 0.9240853190422058, 0.9606131315231323, 0.9568279385566711, 0.808892011642456, 0.3982371687889099, 0.8589038252830505, 0.6602863073348999, 0.29606351256370544, 0.5925323963165283, 0.5400646924972534, 0.7057110667228699, 0.682681679725647, 0.8740394115447998, 0.9755914211273193, 0.9656183123588562, 0.9980296492576599, 0.9965050220489502, 0.9983291029930115, 0.9995476603507996, 0.9983981251716614, 0.998607337474823, 0.8665869235992432, 0.9102798104286194, 0.934410035610199, 0.9995707869529724, 0.9994034767150879, 0.9990745782852173, 0.9984431862831116, 0.9951153993606567, 0.9804850816726685, 0.6310920119285583, 0.4925338923931122, 0.4374648630619049, 0.9808872938156128, 0.9186288118362427, 0.957531750202179, 0.637174665927887, 0.70749831199646, 0.710197925567627, 0.42596128582954407, 0.6537368893623352, 0.5910662412643433, 0.9819629192352295, 0.9844282269477844, 0.891087532043457, 0.8406636714935303, 0.9537967443466187, 0.8314835429191589, 0.0009055526461452246, 0.029619278386235237, 0.0009705450502224267, 0.9654051661491394, 0.9350541234016418, 0.8546467423439026, 0.8379034399986267, 0.9736809730529785, 0.9413271546363831, 0.4309505224227905, 0.9004702568054199, 0.35427388548851013, 0.9655686020851135, 0.9704180359840393, 0.9095833897590637, 0.9425690174102783, 0.9823436737060547, 0.9740239381790161, 0.9994397759437561, 0.9998176693916321, 0.9997082352638245, 0.8383850455284119, 0.7848756313323975, 0.6585043668746948, 0.6385700702667236, 0.5423804521560669, 0.8753641843795776, 0.732766330242157, 0.6359524726867676, 0.7625292539596558, 0.8212173581123352, 0.11705918610095978, 0.8652222156524658, 0.9102587699890137, 0.9196300506591797, 0.9737518429756165, 0.9776536822319031, 0.9756010174751282, 0.9212267398834229, 0.9992740750312805, 0.9975312352180481, 0.9967331886291504, 0.9999743700027466, 0.9999542236328125, 0.9999973773956299, 0.6512118577957153, 0.22892218828201294, 0.4092002809047699, 0.17215590178966522, 0.14864671230316162, 0.0007259995909407735, 0.9999641180038452, 0.999962568283081, 0.9998689889907837, 0.9937784075737, 0.9928675889968872, 0.9883486032485962, 0.6788796782493591, 0.5904794931411743, 0.5650668144226074, 0.8680938482284546, 0.6355900764465332, 0.44315725564956665, 0.9995632767677307, 0.9973588585853577, 0.9995960593223572, 0.9981244206428528, 0.9810311198234558, 0.9913960099220276, 0.9253461360931396, 0.9835773706436157, 0.563185453414917, 0.9161015152931213, 0.8578208088874817, 0.7942823171615601, 0.5117859840393066, 0.6000229120254517, 0.6110525727272034, 0.9549239873886108, 0.5401516556739807, 0.9555858969688416, 0.7354704141616821, 0.8270170092582703, 0.8696510791778564, 0.4741208851337433, 0.46251001954078674, 0.4985361099243164, 0.6141524314880371, 0.5771761536598206, 0.5856173634529114, 0.1125413030385971, 0.9731563925743103, 0.9515812993049622, 0.9787399768829346, 0.989871084690094, 0.9961666464805603, 0.94477379322052, 0.8960367441177368, 0.8345122337341309, 0.9985882639884949, 0.8975287675857544, 0.9889278411865234, 0.9595134854316711, 0.9094861149787903, 0.9763516187667847, 0.9941058158874512, 0.9965364933013916, 0.9765222072601318, 0.9770127534866333, 0.9509215950965881, 0.9823228716850281, 0.9632203578948975, 0.9987339377403259, 0.9793480634689331, 0.9861056804656982, 0.9859195947647095, 0.987727165222168, 0.9633209109306335, 0.8045425415039062, 0.8842135071754456, 0.9951221346855164, 0.7724618315696716, 0.9533464312553406, 0.9806482195854187, 0.9979403614997864, 0.9723275303840637, 0.999786913394928, 0.9997188448905945, 0.9992828965187073, 0.9279277324676514, 0.9303634166717529, 0.872368574142456, 0.919461727142334, 0.8884122371673584, 0.9562082290649414, 0.9996380805969238, 0.9997496008872986, 0.9990566372871399, 0.986677885055542, 0.9994465708732605, 0.999566376209259, 0.6651096940040588, 0.5527064204216003, 0.7624334096908569, 0.34169065952301025, 0.9469629526138306, 0.4833490550518036, 0.9999914169311523, 0.9999831914901733, 0.9999784231185913, 0.9619956612586975, 0.4391608238220215, 0.5740798711776733, 0.3539835810661316, 0.48285821080207825, 0.5371236205101013, 0.9999614953994751, 0.999980092048645, 0.9999723434448242, 0.9919314980506897, 0.9908376336097717, 0.9932786822319031, 0.675650417804718, 0.4359276592731476, 0.7571223974227905, 0.6247730851173401, 0.809048056602478, 0.4869582951068878, 0.9475153088569641, 0.951598584651947, 0.7009941935539246, 0.9611502289772034, 0.9823969602584839, 0.981467068195343, 0.8135129809379578, 0.774700939655304, 0.972871720790863, 0.17411310970783234, 0.6652093529701233, 0.785819411277771, 0.9978393316268921, 0.9978347420692444, 0.9991887211799622, 0.5143252611160278, 0.47546249628067017, 0.5336116552352905, 0.1676444113254547, 0.008225351572036743, 0.6153576374053955, 0.9924029111862183, 0.988237202167511, 0.9698491096496582, 0.24151939153671265, 0.7150141596794128, 0.7451751232147217, 0.58341383934021, 0.9586536884307861, 0.0559365339577198, 0.9980765581130981, 0.9857786893844604, 0.9992893934249878, 0.9924793243408203, 0.8706427216529846, 0.9980652928352356, 0.959970235824585, 0.8840649724006653, 0.9883635640144348, 0.8997098207473755, 0.008895361796021461, 0.8562850952148438, 0.7158913016319275, 0.8034545183181763, 0.8659782409667969, 0.031506672501564026, 0.9932496547698975, 0.23031069338321686, 0.7497101426124573, 0.837375819683075, 0.48054957389831543, 0.9960286617279053, 0.9925709366798401, 0.9842051863670349, 0.6498824954032898, 0.48323923349380493, 0.5284236073493958, 0.9476768374443054, 0.9332055449485779, 0.8726440072059631, 0.9804374575614929, 0.9905673861503601, 0.987600564956665, 0.9959872364997864, 0.9951980710029602, 0.9912860989570618, 0.4835430085659027, 0.6851194500923157, 0.4029543995857239, 0.1236719861626625, 0.13734008371829987, 0.3973076343536377, 0.7047004103660583, 0.06082606315612793, 0.1228705421090126, 0.9710100293159485, 0.9264395236968994, 0.9429928660392761, 0.6296966075897217, 0.9387162923812866, 0.912956953048706, 0.9590694904327393, 0.9421502351760864, 0.9380912184715271, 0.60323166847229, 0.8158379197120667, 0.8958150148391724, 0.6551173329353333, 0.9713819622993469, 0.957204282283783, 0.9843922853469849, 0.9850255846977234, 0.9930846691131592, 0.9963818788528442, 0.998307466506958, 0.9987719655036926, 0.09588505327701569, 0.9553056955337524, 0.9880474805831909, 0.9289746880531311, 0.9869676232337952, 0.9488592147827148, 0.9800060987472534, 0.9828245639801025, 0.4881092607975006, 0.9865748286247253, 0.9854854941368103, 0.9827967882156372, 0.6090140342712402, 0.6031761169433594, 0.346174955368042, 0.948103666305542, 0.9508306980133057, 0.9429970979690552, 0.43267473578453064, 0.26316529512405396, 0.36367589235305786, 0.6679554581642151, 0.7673311233520508, 0.6891053318977356, 0.9883525967597961, 0.5465512275695801, 0.9998946189880371, 0.907686173915863, 0.9419436454772949, 0.3114522695541382, 0.7514263391494751, 0.6639309525489807, 0.6631780862808228, 0.5361356139183044, 0.4464097321033478, 0.497233510017395, 0.9996397495269775, 0.9969215989112854, 0.9996145963668823, 0.44144898653030396, 0.6436446905136108, 0.4166458547115326, 0.4984821081161499, 0.5435376167297363, 0.49898481369018555, 0.5890449285507202, 0.9751158952713013, 0.7627744078636169, 0.7602001428604126, 0.6940763592720032, 0.4224088191986084, 0.7884323596954346, 0.6320403814315796, 0.7426793575286865, 0.7356664538383484, 0.8911908268928528, 0.6079978942871094, 0.9870471954345703, 0.9915956854820251, 0.8974714279174805, 0.9995042085647583, 0.9514618515968323, 0.9996602535247803, 0.417091429233551, 0.4400644302368164, 0.39303356409072876, 0.9772469997406006, 0.9654296040534973, 0.547843873500824, 0.9970254302024841, 0.9851948618888855, 0.9941616654396057, 0.9355183839797974, 0.8954127430915833, 0.9892168045043945, 0.9564470648765564, 0.9400984048843384, 0.955315887928009, 0.9603729248046875, 0.9913148283958435, 0.9798077344894409, 0.6817052364349365, 0.5417571067810059, 0.4263080656528473, 0.8194852471351624, 0.6752426028251648, 0.9849148988723755, 0.9635273814201355, 0.9744645357131958, 0.7404565811157227, 0.2977635860443115, 0.20386259257793427, 0.46867233514785767, 0.9738361239433289, 0.9531043767929077, 0.6334224343299866, 0.9998207688331604, 0.9965136647224426, 0.9990161657333374, 0.9170734286308289, 0.9926355481147766, 0.978865385055542, 0.7085341215133667, 0.7438916563987732, 0.5301404595375061, 0.9338966608047485, 0.969135046005249, 0.9385656714439392, 0.9445363879203796, 0.8947834372520447, 0.28614670038223267, 0.990917980670929, 0.9910455346107483, 0.9897929430007935, 0.1672135591506958, 0.950958251953125, 0.8695336580276489, 0.7770122289657593, 0.8807089328765869, 0.8260342478752136, 0.9968299269676208, 0.9960094690322876, 0.9997007846832275, 0.9586477875709534, 0.9053156971931458, 0.923352062702179, 0.1563415378332138, 0.002003453439101577, 0.13627783954143524, 0.9245595932006836, 0.803291916847229, 0.9196100831031799, 0.7406015992164612, 0.4807405471801758, 0.6529648303985596, 0.4399782121181488, 0.8142197132110596, 0.6627914309501648, 0.3087478578090668, 0.12539826333522797, 0.18148313462734222, 0.6181093454360962, 0.6652869582176208, 0.486186683177948, 0.977999746799469, 0.9860544800758362, 0.995832622051239, 0.9998654127120972, 0.8452519774436951, 0.9727556705474854, 0.4017540216445923, 0.5111969113349915, 0.2867123782634735, 0.9895524382591248, 0.9865810871124268, 0.9928285479545593, 0.9977977275848389, 0.9896787405014038, 0.8037351369857788, 0.8173794746398926, 0.7876136302947998, 0.373805969953537, 0.38773632049560547, 0.33671411871910095, 0.4831717312335968, 0.9743400812149048, 0.9805911183357239, 0.9997939467430115, 0.7104775905609131, 0.6915130615234375, 0.40574759244918823 ], "eval_math_runtime": 201.0086, "eval_math_samples_per_second": 3.731, "eval_math_score": -0.12212485074996948, "eval_math_steps_per_second": 0.119, "step": 50 }, { "epoch": 0.89, "learning_rate": 0.0002, "loss": 0.3559, "step": 51 }, { "epoch": 0.91, "learning_rate": 0.0002, "loss": 0.2321, "step": 52 }, { "epoch": 0.93, "learning_rate": 0.0002, "loss": 0.3617, "step": 53 }, { "epoch": 0.95, "learning_rate": 0.0002, "loss": 0.3475, "step": 54 }, { "epoch": 0.96, "learning_rate": 0.0002, "loss": 0.3019, "step": 55 }, { "epoch": 0.98, "learning_rate": 0.0002, "loss": 0.3041, "step": 56 }, { "epoch": 1.0, "learning_rate": 0.0002, "loss": 0.296, "step": 57 }, { "epoch": 1.02, "learning_rate": 0.0002, "loss": 0.3194, "step": 58 }, { "epoch": 1.04, "learning_rate": 0.0002, "loss": 0.2018, "step": 59 }, { "epoch": 1.05, "learning_rate": 0.0002, "loss": 0.2523, "step": 60 }, { "epoch": 1.07, "learning_rate": 0.0002, "loss": 0.2728, "step": 61 }, { "epoch": 1.09, "learning_rate": 0.0002, "loss": 0.1898, "step": 62 }, { "epoch": 1.11, "learning_rate": 0.0002, "loss": 0.2239, "step": 63 }, { "epoch": 1.12, "learning_rate": 0.0002, "loss": 0.1369, "step": 64 }, { "epoch": 1.14, "learning_rate": 0.0002, "loss": 0.1841, "step": 65 }, { "epoch": 1.16, "learning_rate": 0.0002, "loss": 0.0944, "step": 66 }, { "epoch": 1.18, "learning_rate": 0.0002, "loss": 0.2633, "step": 67 }, { "epoch": 1.19, "learning_rate": 0.0002, "loss": 0.2522, "step": 68 }, { "epoch": 1.21, "learning_rate": 0.0002, "loss": 0.1845, "step": 69 }, { "epoch": 1.23, "learning_rate": 0.0002, "loss": 0.6052, "step": 70 }, { "epoch": 1.25, "learning_rate": 0.0002, "loss": 0.1424, "step": 71 }, { "epoch": 1.26, "learning_rate": 0.0002, "loss": 0.1756, "step": 72 }, { "epoch": 1.28, "learning_rate": 0.0002, "loss": 0.1089, "step": 73 }, { "epoch": 1.3, "learning_rate": 0.0002, "loss": 0.1282, "step": 74 }, { "epoch": 1.32, "learning_rate": 0.0002, "loss": 0.1903, "step": 75 }, { "epoch": 1.32, "eval_math_accuracy": 0.836, "eval_math_average_probability": 0.8027346134185791, "eval_math_brier_score": 0.12285017967224121, "eval_math_loss": 0.47426244616508484, "eval_math_probabilities": [ 0.9616103768348694, 0.9777390360832214, 0.9263269901275635, 0.9547826647758484, 0.9897022247314453, 0.9868230819702148, 0.9999814033508301, 0.999953031539917, 0.9999668598175049, 0.9020634293556213, 0.6200502514839172, 0.8411897420883179, 0.7032442092895508, 0.10504203289747238, 0.9659855365753174, 0.5407034158706665, 0.6209026575088501, 0.8128259181976318, 0.9672952890396118, 0.2824172377586365, 0.25982463359832764, 0.6108538508415222, 0.39588451385498047, 0.46226173639297485, 0.37387093901634216, 0.9937414526939392, 0.9840722680091858, 0.6747256517410278, 0.1888180673122406, 0.34788623452186584, 0.31137150526046753, 0.12450224906206131, 0.010354206897318363, 0.6879879832267761, 0.9971621036529541, 0.9841330051422119, 0.9999958276748657, 0.9999974966049194, 0.9999927282333374, 0.37846872210502625, 0.004803119692951441, 0.005940170492976904, 0.9999921321868896, 0.9999728202819824, 0.999535083770752, 0.4809458553791046, 0.11902621388435364, 0.622745931148529, 0.9999984502792358, 0.999996542930603, 0.9998542070388794, 0.97740638256073, 0.8996613621711731, 0.9838483929634094, 0.9796146750450134, 0.9940411448478699, 0.9990707039833069, 0.999849796295166, 0.9998860359191895, 0.999991774559021, 0.9590617418289185, 0.8085365295410156, 0.5599466562271118, 0.9992380142211914, 0.9960553646087646, 0.9991949200630188, 0.0018545275088399649, 0.9733086824417114, 0.9608615636825562, 0.9890915155410767, 0.9968781471252441, 0.9988301396369934, 0.9659545421600342, 0.9978916049003601, 0.9996689558029175, 0.9999884366989136, 0.9999542236328125, 0.9999054670333862, 0.7933868765830994, 0.7309855222702026, 0.500259280204773, 0.85321444272995, 0.9754963517189026, 0.9570429921150208, 0.9947916269302368, 0.998795747756958, 0.9996286630630493, 0.7474744915962219, 0.8898021578788757, 0.9503018260002136, 0.9999951124191284, 0.9999133348464966, 0.9999891519546509, 0.512779176235199, 0.9794629216194153, 0.7001636624336243, 0.8228245377540588, 0.9887117147445679, 0.9956998825073242, 0.9169439673423767, 0.9870864152908325, 0.8614763021469116, 0.9944766163825989, 0.9996436834335327, 0.9998750686645508, 0.9999386072158813, 0.999779999256134, 0.9998420476913452, 0.9997830986976624, 0.9952991008758545, 0.9999264478683472, 0.9333474040031433, 0.34119364619255066, 0.27665069699287415, 0.54599529504776, 0.10532116889953613, 0.1371345818042755, 0.999987006187439, 0.999953031539917, 0.9999170303344727, 0.999994158744812, 0.999992847442627, 0.9999840259552002, 0.9312161207199097, 0.9753838181495667, 0.897465169429779, 0.18020963668823242, 0.6805407404899597, 0.9487439393997192, 0.9996782541275024, 0.9993441700935364, 0.9962584972381592, 0.9973415732383728, 0.9817659854888916, 0.97055983543396, 0.4640359878540039, 0.8658984899520874, 0.9638795256614685, 0.9964255690574646, 0.9989262223243713, 0.9996436834335327, 0.0006655855686403811, 0.7774356007575989, 0.6284235119819641, 0.9812864661216736, 0.9993892908096313, 0.9976217150688171, 0.9998873472213745, 0.9992232322692871, 0.9998394250869751, 0.02585442177951336, 0.8765549659729004, 0.5663195252418518, 0.9999856948852539, 0.9999985694885254, 0.9999998807907104, 0.22014467418193817, 0.68534916639328, 0.5673434734344482, 0.9249856472015381, 0.884716272354126, 0.9268526434898376, 0.9968695044517517, 0.339991956949234, 0.9891712069511414, 0.9999780654907227, 0.8726098537445068, 0.9999003410339355, 0.8338379859924316, 4.09116319133318e-06, 0.6740800738334656, 0.3950447142124176, 0.5736073851585388, 0.5454285144805908, 0.9989768266677856, 0.9874175786972046, 0.9756374359130859, 0.8555288910865784, 0.904450535774231, 0.7581718564033508, 0.7325549721717834, 0.7028653621673584, 0.5542841553688049, 0.7407044768333435, 0.9944004416465759, 0.9999418258666992, 0.9999920129776001, 0.999993085861206, 0.9999892711639404, 0.9998924732208252, 0.9999027252197266, 0.9999561309814453, 0.9790157079696655, 0.7475374341011047, 0.6588977575302124, 0.998623251914978, 0.9952036142349243, 0.9988403916358948, 0.9773750901222229, 0.9852950572967529, 0.33342546224594116, 0.9999450445175171, 0.9374085068702698, 0.9999899864196777, 0.5551424622535706, 0.3777192533016205, 0.6178329586982727, 0.9999898672103882, 0.6861721277236938, 0.3658721148967743, 0.9620970487594604, 0.9909302592277527, 0.9001444578170776, 0.9988125562667847, 0.9999575614929199, 0.999975323677063, 0.9425793886184692, 0.0035807753447443247, 0.9408767819404602, 0.46566227078437805, 0.9470212459564209, 0.2562110424041748, 0.634774386882782, 0.9092840552330017, 0.38700979948043823, 0.9999985694885254, 0.9999997615814209, 0.9999997615814209, 0.9999020099639893, 0.9199821352958679, 0.18736359477043152, 0.9738328456878662, 0.7494648098945618, 0.8496094346046448, 0.9999994039535522, 0.9999998807907104, 0.9999964237213135, 0.7976861000061035, 0.9804123640060425, 0.8835974931716919, 0.8938279747962952, 0.7995594143867493, 0.6249706149101257, 0.9914549589157104, 0.9999350309371948, 0.99994957447052, 0.975982666015625, 0.9702451825141907, 0.43418264389038086, 0.9935144186019897, 0.9943291544914246, 0.9888448119163513, 0.9939238429069519, 0.9998749494552612, 0.9993149042129517, 0.512698233127594, 0.6980327367782593, 0.9500287771224976, 0.9659674167633057, 0.9347702860832214, 0.6070705056190491, 0.9948592185974121, 0.9994342923164368, 0.996736466884613, 0.7936747074127197, 0.9303926229476929, 0.9700731635093689, 0.9982532858848572, 0.999664306640625, 0.9993990659713745, 0.9460805058479309, 0.7770049571990967, 0.9622872471809387, 0.9188669323921204, 0.008583828806877136, 0.7199167609214783, 0.5069194436073303, 0.6535472273826599, 0.6333915591239929, 0.8869540095329285, 0.9759289622306824, 0.9829748272895813, 0.9999711513519287, 0.9999535083770752, 0.9999791383743286, 0.9999644756317139, 0.9999152421951294, 0.9999382495880127, 0.9942936301231384, 0.9957635402679443, 0.9979026317596436, 0.9992662072181702, 0.9972594976425171, 0.9965948462486267, 0.9998446702957153, 0.9996365308761597, 0.996507465839386, 0.7331793904304504, 0.5202239751815796, 0.3624313175678253, 0.9824156761169434, 0.8202564120292664, 0.833457887172699, 0.562144935131073, 0.8174747824668884, 0.6805662512779236, 0.40537989139556885, 0.6105422377586365, 0.4814479947090149, 0.9988216757774353, 0.9993789196014404, 0.9917038679122925, 0.9987701773643494, 0.9999716281890869, 0.9983593821525574, 6.358225073199719e-05, 0.00935890432447195, 0.00017105160804931074, 0.9996293783187866, 0.9980521202087402, 0.9937124848365784, 0.6002519130706787, 0.9983401298522949, 0.8870399594306946, 0.6542457342147827, 0.9968175888061523, 0.25101590156555176, 0.9921407699584961, 0.9180073738098145, 0.9385048747062683, 0.9957907795906067, 0.9999065399169922, 0.9981562495231628, 0.999789297580719, 0.9999570846557617, 0.9997466206550598, 0.9829743504524231, 0.9559981822967529, 0.9454857707023621, 0.8298242688179016, 0.8851228952407837, 0.9324082136154175, 0.787430465221405, 0.6881181597709656, 0.857126772403717, 0.9996873140335083, 0.2410677671432495, 0.9997380375862122, 0.9910537600517273, 0.9941931366920471, 0.9987578392028809, 0.9984992742538452, 0.9969099164009094, 0.9584302306175232, 0.9999985694885254, 0.9999899864196777, 0.9999926090240479, 0.999998927116394, 0.9999991655349731, 1.0, 0.7874346375465393, 0.0061043743044137955, 0.04288526996970177, 0.18225817382335663, 0.06019359827041626, 0.016468074172735214, 0.9999972581863403, 0.9999996423721313, 0.9999982118606567, 0.9998838901519775, 0.9998937845230103, 0.9943363070487976, 0.5621864795684814, 0.7360866069793701, 0.8595901727676392, 0.9951778650283813, 0.8998104333877563, 0.4531249403953552, 0.9999992847442627, 0.9999933242797852, 0.9999998807907104, 0.9999839067459106, 0.9989839196205139, 0.9997517466545105, 0.997350811958313, 0.9996111989021301, 0.824498176574707, 0.9874978065490723, 0.9841672778129578, 0.9616992473602295, 0.5175262093544006, 0.6283077001571655, 0.546360433101654, 0.999358594417572, 0.9524742364883423, 0.9994237422943115, 0.9642894864082336, 0.994175136089325, 0.985412061214447, 0.491251677274704, 0.3416208028793335, 0.42886272072792053, 0.7841136455535889, 0.6734838485717773, 0.7526051998138428, 0.016812937334179878, 0.9658491015434265, 0.9727159738540649, 0.9945705533027649, 0.9932199716567993, 0.9996683597564697, 0.9994562268257141, 0.9915756583213806, 0.9982116222381592, 0.9999691247940063, 0.9883553981781006, 0.9992305040359497, 0.9999300241470337, 0.9996969699859619, 0.9999808073043823, 0.998924195766449, 0.9996945858001709, 0.994415283203125, 0.8847984671592712, 0.5541564226150513, 0.66079181432724, 0.9997749924659729, 0.9999837875366211, 0.9993342757225037, 0.9988571405410767, 0.9995856881141663, 0.9997518658638, 0.9963299632072449, 0.9500681757926941, 0.6518329977989197, 0.9999961853027344, 0.9785908460617065, 0.9999020099639893, 0.9788873195648193, 0.9994890689849854, 0.9929587841033936, 0.9999991655349731, 0.9999980926513672, 0.9999960660934448, 0.9969452023506165, 0.9692269563674927, 0.9684847593307495, 0.8235099911689758, 0.8225049376487732, 0.9579454064369202, 0.9999785423278809, 0.999997615814209, 0.9999775886535645, 0.9998984336853027, 0.9999974966049194, 0.9999994039535522, 0.7901800274848938, 0.5494765639305115, 0.9403153657913208, 0.008660477586090565, 0.8930303454399109, 0.006859771441668272, 0.9999998807907104, 0.9999992847442627, 0.9999985694885254, 0.9948664903640747, 0.5008512735366821, 0.8508425354957581, 0.4912760555744171, 0.7454321384429932, 0.8228439688682556, 0.9999969005584717, 0.9999953508377075, 0.9999703168869019, 0.9999094009399414, 0.9999574422836304, 0.9999868869781494, 0.731691300868988, 0.7642431259155273, 0.8792497515678406, 0.5824012160301208, 0.9118309020996094, 0.44087207317352295, 0.9818544387817383, 0.9848768711090088, 0.1831178069114685, 0.998088538646698, 0.9997708201408386, 0.9995538592338562, 0.8931752443313599, 0.9836447238922119, 0.9993769526481628, 0.015053881332278252, 0.5267915725708008, 0.969816267490387, 0.9999029636383057, 0.9999336004257202, 0.9999829530715942, 0.6167547106742859, 0.5676248669624329, 0.5696904063224792, 0.035768236964941025, 0.0004263324080966413, 0.4241045117378235, 0.9995738863945007, 0.9983693957328796, 0.9953497052192688, 0.03733458369970322, 0.719172477722168, 0.8833697438240051, 0.2553568482398987, 0.8218716979026794, 9.55943251028657e-05, 0.9998821020126343, 0.9988094568252563, 0.999967098236084, 0.999990701675415, 0.9958001971244812, 0.9999986886978149, 0.999616265296936, 0.977737545967102, 0.9988262057304382, 0.3764190971851349, 0.0009547158842906356, 0.4543500542640686, 0.7623953223228455, 0.9120107889175415, 0.9350723624229431, 0.6007090210914612, 0.9999911785125732, 0.9584690928459167, 0.7934396266937256, 0.846391499042511, 0.6466822624206543, 0.999954342842102, 0.9998090863227844, 0.9992076754570007, 0.7808103561401367, 0.6292740106582642, 0.3720255196094513, 0.9967045187950134, 0.965789258480072, 0.9823498129844666, 0.999984622001648, 0.9999942779541016, 0.9999924898147583, 0.999993085861206, 0.9999891519546509, 0.9999618530273438, 0.2143656313419342, 0.3507053256034851, 0.014185876585543156, 0.0685742199420929, 0.32263892889022827, 0.3027118742465973, 0.9694278836250305, 0.4262120723724365, 0.5605895519256592, 0.9896355271339417, 0.8920578956604004, 0.9628991484642029, 0.7188137769699097, 0.9931932091712952, 0.9797579050064087, 0.8190539479255676, 0.71856689453125, 0.8799605965614319, 0.3041703701019287, 0.945320725440979, 0.9322957396507263, 0.9028697609901428, 0.9990310668945312, 0.9984170198440552, 0.9683218598365784, 0.9300368428230286, 0.9942785501480103, 0.9982202649116516, 0.9994456171989441, 0.9992300271987915, 0.15405893325805664, 0.9928821325302124, 0.9996395111083984, 0.9917131662368774, 0.9999337196350098, 0.9988447427749634, 0.9992251396179199, 0.9994699358940125, 0.7336649894714355, 0.9999599456787109, 0.9998645782470703, 0.999771773815155, 0.43057453632354736, 0.5421355962753296, 0.06212695315480232, 0.996394693851471, 0.9963604807853699, 0.9772237539291382, 0.39635393023490906, 0.3845742344856262, 0.32552337646484375, 0.708629846572876, 0.7940416932106018, 0.8598116636276245, 0.999942421913147, 0.5154693126678467, 0.9999110698699951, 0.9967346787452698, 0.9996838569641113, 0.3025572896003723, 0.9975831508636475, 0.9961205124855042, 0.9978992938995361, 0.36784228682518005, 0.14743652939796448, 0.23945601284503937, 0.9999969005584717, 0.9998874664306641, 0.9999951124191284, 0.22594881057739258, 0.5327080488204956, 0.19016627967357635, 0.4267323315143585, 0.7181272506713867, 0.4601338505744934, 0.5814968943595886, 0.9991042017936707, 0.86968994140625, 0.7940104603767395, 0.6974850296974182, 0.026257993653416634, 0.8587540984153748, 0.7346211671829224, 0.8723004460334778, 0.6434869766235352, 0.8818493485450745, 0.04828319326043129, 0.998462438583374, 0.9985895752906799, 0.99613356590271, 0.999970555305481, 0.9999641180038452, 0.9999760389328003, 0.2821114957332611, 0.34214144945144653, 0.1562288999557495, 0.9937607645988464, 0.9977582097053528, 0.6382438540458679, 0.9998862743377686, 0.9992699027061462, 0.9998904466629028, 0.9636162519454956, 0.9482669234275818, 0.9946883916854858, 0.9072889089584351, 0.9276882410049438, 0.9478370547294617, 0.898289680480957, 0.9986287355422974, 0.9752339124679565, 0.40680989623069763, 0.3912314474582672, 0.08897563070058823, 0.9424015879631042, 0.42675265669822693, 0.9999076128005981, 0.9046557545661926, 0.9833462238311768, 0.589844822883606, 0.18730147182941437, 0.28148153424263, 0.5734831690788269, 0.9949612617492676, 0.9960654377937317, 0.45221391320228577, 0.9998648166656494, 0.9970831274986267, 0.9997900128364563, 0.8509729504585266, 0.9996299743652344, 0.9362675547599792, 0.9009715914726257, 0.9451128244400024, 0.6338557600975037, 0.950371503829956, 0.9912466406822205, 0.9598905444145203, 0.9769330024719238, 0.9683899283409119, 0.009968730621039867, 0.9999829530715942, 0.9999841451644897, 0.9999769926071167, 0.2102336287498474, 0.9997462630271912, 0.9980948567390442, 0.9894351363182068, 0.9978675842285156, 0.9974122643470764, 0.9352248907089233, 0.899463415145874, 0.873665988445282, 0.9997214674949646, 0.9978875517845154, 0.99846351146698, 0.08270219713449478, 5.026158760301769e-05, 0.06453957408666611, 0.9940483570098877, 0.9679574966430664, 0.9951175451278687, 0.9958827495574951, 0.26131582260131836, 0.8625807166099548, 0.038239989429712296, 0.947502076625824, 0.812287449836731, 0.5288971066474915, 0.7602019906044006, 0.06311137229204178, 0.3896898925304413, 0.7517817616462708, 0.5311471223831177, 0.9851204752922058, 0.996356725692749, 0.9988695979118347, 0.9999971389770508, 0.999735414981842, 0.9992386102676392, 0.29192960262298584, 0.479218989610672, 0.06572479009628296, 0.9999774694442749, 0.999933123588562, 0.9999852180480957, 0.9999809265136719, 0.9999994039535522, 0.8326940536499023, 0.8589992523193359, 0.2963012754917145, 0.5035292506217957, 0.28127846121788025, 0.20305541157722473, 0.7795776724815369, 0.6862480640411377, 0.9073684811592102, 0.999826967716217, 0.9319025278091431, 0.9470246434211731, 0.3268917500972748 ], "eval_math_runtime": 201.1044, "eval_math_samples_per_second": 3.729, "eval_math_score": -0.12285017967224121, "eval_math_steps_per_second": 0.119, "step": 75 }, { "epoch": 1.33, "learning_rate": 0.0002, "loss": 0.1415, "step": 76 }, { "epoch": 1.35, "learning_rate": 0.0002, "loss": 0.0916, "step": 77 }, { "epoch": 1.37, "learning_rate": 0.0002, "loss": 0.5743, "step": 78 }, { "epoch": 1.39, "learning_rate": 0.0002, "loss": 0.1566, "step": 79 }, { "epoch": 1.4, "learning_rate": 0.0002, "loss": 0.3156, "step": 80 }, { "epoch": 1.42, "learning_rate": 0.0002, "loss": 0.1345, "step": 81 }, { "epoch": 1.44, "learning_rate": 0.0002, "loss": 0.2403, "step": 82 }, { "epoch": 1.46, "learning_rate": 0.0002, "loss": 0.1342, "step": 83 }, { "epoch": 1.47, "learning_rate": 0.0002, "loss": 0.3069, "step": 84 }, { "epoch": 1.49, "learning_rate": 0.0002, "loss": 0.0994, "step": 85 }, { "epoch": 1.51, "learning_rate": 0.0002, "loss": 0.1322, "step": 86 }, { "epoch": 1.53, "learning_rate": 0.0002, "loss": 0.1474, "step": 87 }, { "epoch": 1.54, "learning_rate": 0.0002, "loss": 0.1289, "step": 88 }, { "epoch": 1.56, "learning_rate": 0.0002, "loss": 0.3391, "step": 89 }, { "epoch": 1.58, "learning_rate": 0.0002, "loss": 0.1304, "step": 90 }, { "epoch": 1.6, "learning_rate": 0.0002, "loss": 0.0875, "step": 91 }, { "epoch": 1.61, "learning_rate": 0.0002, "loss": 0.1721, "step": 92 }, { "epoch": 1.63, "learning_rate": 0.0002, "loss": 0.2668, "step": 93 }, { "epoch": 1.65, "learning_rate": 0.0002, "loss": 0.3303, "step": 94 }, { "epoch": 1.67, "learning_rate": 0.0002, "loss": 0.1032, "step": 95 }, { "epoch": 1.68, "learning_rate": 0.0002, "loss": 0.1306, "step": 96 }, { "epoch": 1.7, "learning_rate": 0.0002, "loss": 0.1536, "step": 97 }, { "epoch": 1.72, "learning_rate": 0.0002, "loss": 0.1029, "step": 98 }, { "epoch": 1.74, "learning_rate": 0.0002, "loss": 0.1291, "step": 99 }, { "epoch": 1.75, "learning_rate": 0.0002, "loss": 0.0983, "step": 100 }, { "epoch": 1.75, "eval_math_accuracy": 0.8266666666666667, "eval_math_average_probability": 0.804977297782898, "eval_math_brier_score": 0.12344212085008621, "eval_math_loss": 0.45978617668151855, "eval_math_probabilities": [ 0.9475333094596863, 0.9327775239944458, 0.8341836929321289, 0.9640377163887024, 0.993699312210083, 0.9906257390975952, 0.9999922513961792, 0.9999881982803345, 0.9999748468399048, 0.8802229166030884, 0.5863076448440552, 0.8300166130065918, 0.6269857883453369, 0.23321159183979034, 0.9368520379066467, 0.464248389005661, 0.57252436876297, 0.7837892770767212, 0.9481528401374817, 0.2216273695230484, 0.4848330616950989, 0.6196092367172241, 0.41316118836402893, 0.4825407564640045, 0.05769344046711922, 0.9940010905265808, 0.9787469506263733, 0.7548518180847168, 0.30525118112564087, 0.02414878085255623, 0.2709668278694153, 0.08152783662080765, 0.04588330164551735, 0.9490468502044678, 0.9958735108375549, 0.9824467897415161, 0.999996542930603, 0.9999995231628418, 0.9999969005584717, 0.2890969514846802, 0.013576988130807877, 0.08965066075325012, 0.999995231628418, 0.9999867677688599, 0.9995125532150269, 0.1754913330078125, 0.09472552686929703, 0.6613370180130005, 0.9999967813491821, 0.9999933242797852, 0.9978646636009216, 0.9262825846672058, 0.8876777291297913, 0.9589400291442871, 0.9855661392211914, 0.9969171285629272, 0.9995866417884827, 0.9999561309814453, 0.9999504089355469, 0.9999997615814209, 0.9713318943977356, 0.8056635856628418, 0.8430995941162109, 0.9851846694946289, 0.9857168197631836, 0.9992393255233765, 0.0071811373345553875, 0.5700258612632751, 0.9394314289093018, 0.8952827453613281, 0.9713773727416992, 0.9944033622741699, 0.91172194480896, 0.9976688027381897, 0.9993497729301453, 0.9999896287918091, 0.9999752044677734, 0.9999308586120605, 0.9493915438652039, 0.9053030014038086, 0.7881652116775513, 0.8593658804893494, 0.9460667371749878, 0.9194446206092834, 0.9932243227958679, 0.9996610879898071, 0.9998859167098999, 0.3371586501598358, 0.5271449089050293, 0.8565431237220764, 0.999997615814209, 0.9996390342712402, 0.9999815225601196, 0.11997628211975098, 0.9245119094848633, 0.28198161721229553, 0.9306301474571228, 0.9974621534347534, 0.9940720200538635, 0.9694506525993347, 0.9929366707801819, 0.7030938863754272, 0.999821126461029, 0.9999599456787109, 0.9999912977218628, 0.9999874830245972, 0.999936580657959, 0.9998745918273926, 0.9999892711639404, 0.9908340573310852, 0.9999599456787109, 0.9739454984664917, 0.48124802112579346, 0.3832882046699524, 0.6865490674972534, 0.293915331363678, 0.34083542227745056, 0.9999737739562988, 0.9999891519546509, 0.9999570846557617, 0.9999997615814209, 0.9999992847442627, 0.9999990463256836, 0.9977312684059143, 0.997502863407135, 0.9972578883171082, 0.16920900344848633, 0.41363605856895447, 0.974782407283783, 0.9993467926979065, 0.9977909326553345, 0.9920322895050049, 0.9752835631370544, 0.840770959854126, 0.924100399017334, 0.494393914937973, 0.9397424459457397, 0.9632019996643066, 0.9997556805610657, 0.9986082911491394, 0.9998074173927307, 0.15084709227085114, 0.9914188385009766, 0.9579959511756897, 0.9407543540000916, 0.9981377124786377, 0.9871366024017334, 0.9999904632568359, 0.9997863173484802, 0.9999808073043823, 0.5182684063911438, 0.11314063519239426, 0.9794104099273682, 0.9969139099121094, 0.9999810457229614, 0.9999997615814209, 0.15249423682689667, 0.5996314883232117, 0.6362959742546082, 0.788130521774292, 0.7887936234474182, 0.8184621334075928, 0.9945932030677795, 0.45256832242012024, 0.9728187322616577, 0.9999679327011108, 0.943649172782898, 0.9999103546142578, 0.6699703931808472, 0.0007635295041836798, 0.5882190465927124, 0.672776997089386, 0.5857751965522766, 0.7232856750488281, 0.9951426982879639, 0.9641414284706116, 0.9736242294311523, 0.6389965415000916, 0.897779107093811, 0.845750093460083, 0.6551565527915955, 0.5497551560401917, 0.3237321078777313, 0.9536895155906677, 0.9972598552703857, 0.9998490810394287, 0.9999979734420776, 0.999996542930603, 0.9999994039535522, 0.9999638795852661, 0.9999692440032959, 0.9999949932098389, 0.9189188480377197, 0.7440605759620667, 0.9050955176353455, 0.9867180585861206, 0.9692326784133911, 0.9984978437423706, 0.9661572575569153, 0.9758480191230774, 0.3943697512149811, 0.9996451139450073, 0.9045859575271606, 0.9999538660049438, 0.4594781696796417, 0.3602261543273926, 0.5872560739517212, 0.9999575614929199, 0.8614200353622437, 0.28734374046325684, 0.9775461554527283, 0.9978785514831543, 0.9859311580657959, 0.9928693175315857, 0.9998912811279297, 0.9993153810501099, 0.9948833584785461, 0.11826580762863159, 0.9942231774330139, 0.4291130304336548, 0.9649617075920105, 0.19725492596626282, 0.5354161858558655, 0.8768001794815063, 0.1560966521501541, 0.9999992847442627, 0.9999998807907104, 0.9999995231628418, 0.999900221824646, 0.9751614332199097, 0.15761438012123108, 0.9921040534973145, 0.7633439302444458, 0.939431369304657, 1.0, 1.0, 0.9999998807907104, 0.8001546859741211, 0.9445754289627075, 0.8326126933097839, 0.9177573919296265, 0.8154159784317017, 0.6136552691459656, 0.9932760000228882, 0.9999897480010986, 0.9999959468841553, 0.953885018825531, 0.9887099862098694, 0.5024290084838867, 0.974915623664856, 0.9783918261528015, 0.9194811582565308, 0.9933170080184937, 0.9985724687576294, 0.9986332058906555, 0.772635281085968, 0.9154156446456909, 0.9817554950714111, 0.9977104663848877, 0.9986905455589294, 0.9942365288734436, 0.8996217846870422, 0.9901912212371826, 0.9879768490791321, 0.8399122953414917, 0.9257044792175293, 0.9643818736076355, 0.990798830986023, 0.9988424181938171, 0.9982503056526184, 0.9759376049041748, 0.9313430786132812, 0.981048583984375, 0.9852378964424133, 0.024589162319898605, 0.8642290234565735, 0.6292590498924255, 0.787860095500946, 0.7648295164108276, 0.8659924268722534, 0.9834965467453003, 0.9787317514419556, 0.9999681711196899, 0.9999419450759888, 0.999980092048645, 0.9999966621398926, 0.9999873638153076, 0.9999876022338867, 0.9935126900672913, 0.9827268123626709, 0.9948281645774841, 0.9992837309837341, 0.9979227185249329, 0.9957268238067627, 0.9998769760131836, 0.9999520778656006, 0.9993009567260742, 0.6762076616287231, 0.5375096797943115, 0.35038521885871887, 0.9998836517333984, 0.9900625348091125, 0.9910743832588196, 0.37446582317352295, 0.6258294582366943, 0.5254096984863281, 0.2717879116535187, 0.5280758738517761, 0.6579352021217346, 0.9993864297866821, 0.9996459484100342, 0.9899701476097107, 0.9999241828918457, 0.9999732971191406, 0.9999493360519409, 0.00010340674634790048, 0.00010476552415639162, 7.096266926964745e-05, 0.9998315572738647, 0.9994848966598511, 0.9967098236083984, 0.699204683303833, 0.9921912550926208, 0.7974449396133423, 0.528963029384613, 0.9965251088142395, 0.3116721212863922, 0.9941370487213135, 0.97870934009552, 0.983799934387207, 0.9901623725891113, 0.9994006156921387, 0.9907859563827515, 0.9999831914901733, 0.9999992847442627, 0.9999488592147827, 0.9854050278663635, 0.9650493860244751, 0.8661375641822815, 0.7558331489562988, 0.6982961297035217, 0.9173397421836853, 0.8143244981765747, 0.6262655854225159, 0.8395925760269165, 0.9988210797309875, 0.02095525898039341, 0.9987699389457703, 0.9885132908821106, 0.9921883344650269, 0.9983021020889282, 0.9986556768417358, 0.9945736527442932, 0.9731589555740356, 0.9999992847442627, 0.9999966621398926, 0.9999963045120239, 0.9999984502792358, 0.9999983310699463, 1.0, 0.7335387468338013, 0.015916068106889725, 0.18418586254119873, 0.41238388419151306, 0.0656566247344017, 0.0010977339698001742, 0.9999984502792358, 0.9999998807907104, 0.9999977350234985, 0.9999608993530273, 0.9999735355377197, 0.9935814142227173, 0.47647547721862793, 0.7749339938163757, 0.6905574202537537, 0.9909040331840515, 0.6791723966598511, 0.4343525469303131, 0.9999984502792358, 0.999984860420227, 0.9999992847442627, 0.9999982118606567, 0.9993627667427063, 0.9999358654022217, 0.9907469749450684, 0.9988529682159424, 0.7688943147659302, 0.982776403427124, 0.9615985751152039, 0.9384880661964417, 0.5606516003608704, 0.47190412878990173, 0.7252959609031677, 0.9961718916893005, 0.8529340624809265, 0.9968836903572083, 0.9549634456634521, 0.9921883344650269, 0.9860765933990479, 0.2598068416118622, 0.3178275227546692, 0.39694616198539734, 0.9178012609481812, 0.6848565936088562, 0.8790230751037598, 0.0052022188901901245, 0.9799976348876953, 0.9667891263961792, 0.9986133575439453, 0.9979270696640015, 0.9993959665298462, 0.9998798370361328, 0.9969327449798584, 0.9992977380752563, 0.9999841451644897, 0.9873706102371216, 0.999184787273407, 0.999586284160614, 0.9871276617050171, 0.9997830986976624, 0.9966732263565063, 0.9992958307266235, 0.9779936075210571, 0.7954171299934387, 0.8956907391548157, 0.8188077211380005, 0.9992421865463257, 0.9999839067459106, 0.9987586736679077, 0.9996424913406372, 0.9993318915367126, 0.9996517896652222, 0.9997922778129578, 0.9984320998191833, 0.9997292160987854, 0.9999830722808838, 0.9745162725448608, 0.9992594122886658, 0.9999892711639404, 0.9999840259552002, 0.99856036901474, 0.999998927116394, 0.999998927116394, 0.9999964237213135, 0.9912416934967041, 0.9967465400695801, 0.9911262392997742, 0.9593307971954346, 0.8816831111907959, 0.9820114374160767, 0.9999856948852539, 0.9999990463256836, 0.9999876022338867, 0.9968639612197876, 0.9999830722808838, 0.9999936819076538, 0.5136188864707947, 0.5513888001441956, 0.8775236010551453, 0.02919785864651203, 0.8539873957633972, 0.020717766135931015, 1.0, 1.0, 0.9999996423721313, 0.9987290501594543, 0.4123147428035736, 0.9088837504386902, 0.6614423990249634, 0.7866751551628113, 0.8723801970481873, 0.9999992847442627, 0.9999990463256836, 0.9999973773956299, 0.9999991655349731, 0.9999990463256836, 0.9999995231628418, 0.6896315217018127, 0.5674806833267212, 0.8334212899208069, 0.5394514203071594, 0.4687158167362213, 0.26399853825569153, 0.9928597807884216, 0.9969013929367065, 0.2951197922229767, 0.993961751461029, 0.9989247918128967, 0.999881386756897, 0.5888901352882385, 0.9866610169410706, 0.9992783665657043, 0.07201408594846725, 0.2778617739677429, 0.9474989175796509, 0.999909520149231, 0.9999281167984009, 0.9999879598617554, 0.49688342213630676, 0.4218936860561371, 0.44929659366607666, 0.0018286496633663774, 1.8571909095044248e-06, 0.47513511776924133, 0.9945547580718994, 0.9972214698791504, 0.9935603141784668, 0.01943197287619114, 0.8311030268669128, 0.9550625681877136, 0.4061180651187897, 0.9351599216461182, 0.0008598004351370037, 0.9999821186065674, 0.9997472167015076, 0.9999949932098389, 0.9997113347053528, 0.6024402379989624, 0.9999672174453735, 0.9998835325241089, 0.999872088432312, 0.9978391528129578, 0.6245144605636597, 0.000171612948179245, 0.644734799861908, 0.5504216551780701, 0.9453369379043579, 0.9635985493659973, 0.1792806088924408, 0.9999797344207764, 0.8681767582893372, 0.892272412776947, 0.9809189438819885, 0.45401883125305176, 0.9998794794082642, 0.9995294809341431, 0.9977253079414368, 0.5810263752937317, 0.28023815155029297, 0.34294676780700684, 0.9560766816139221, 0.8341329097747803, 0.7069963216781616, 0.9999701976776123, 0.9999701976776123, 0.999954104423523, 0.999996542930603, 0.9999959468841553, 0.9999487400054932, 0.18719367682933807, 0.6635345220565796, 0.07233071327209473, 0.1440533995628357, 0.1732211410999298, 0.670236349105835, 0.9510051608085632, 0.05763239786028862, 0.4148212671279907, 0.996908962726593, 0.9753775596618652, 0.9774754047393799, 0.5231315493583679, 0.9927646517753601, 0.9508025646209717, 0.965073823928833, 0.9230091571807861, 0.9748613834381104, 0.8671842813491821, 0.9612912535667419, 0.9367452263832092, 0.9191805124282837, 0.9958440661430359, 0.9960203766822815, 0.996840238571167, 0.9973291158676147, 0.9988030195236206, 0.9997312426567078, 0.9995114803314209, 0.9998950958251953, 0.19462786614894867, 0.9986708164215088, 0.9992844462394714, 0.9986629486083984, 0.999993085861206, 0.9993676543235779, 0.9963127970695496, 0.9975494742393494, 0.6982600688934326, 0.9999333620071411, 0.9998518228530884, 0.999765932559967, 0.5663544535636902, 0.4996521770954132, 0.12108130007982254, 0.9874479174613953, 0.993889570236206, 0.9386891722679138, 0.3487769663333893, 0.2534719407558441, 0.20359940826892853, 0.776786208152771, 0.8626043200492859, 0.9122551679611206, 0.999937891960144, 0.7944570779800415, 0.9999947547912598, 0.9974974989891052, 0.9983175992965698, 0.28119754791259766, 0.9841620922088623, 0.9886300563812256, 0.989258348941803, 0.5012166500091553, 0.24869897961616516, 0.25906550884246826, 0.9999986886978149, 0.9999126195907593, 0.9999977350234985, 0.4772639572620392, 0.5981103181838989, 0.4021296799182892, 0.46893835067749023, 0.5952679514884949, 0.48440518975257874, 0.6431782841682434, 0.994263231754303, 0.6724222302436829, 0.7102087140083313, 0.6053889989852905, 0.08855386823415756, 0.9816499352455139, 0.8585788607597351, 0.9894812107086182, 0.5347477793693542, 0.43282970786094666, 0.04138212651014328, 0.9993693232536316, 0.9961994290351868, 0.9930423498153687, 0.999795138835907, 0.9988994598388672, 0.9999436140060425, 0.2157648354768753, 0.3275116980075836, 0.16531121730804443, 0.9990621209144592, 0.9984481334686279, 0.7156533598899841, 0.9999597072601318, 0.9997124075889587, 0.9999834299087524, 0.8027123212814331, 0.8944212794303894, 0.9910338521003723, 0.9645297527313232, 0.9467929005622864, 0.9533606767654419, 0.9590015411376953, 0.9977242350578308, 0.9823580384254456, 0.4976138770580292, 0.42694467306137085, 0.11163276433944702, 0.9914510846138, 0.8926071524620056, 0.999995231628418, 0.9927600622177124, 0.9994768500328064, 0.9221163988113403, 0.20683687925338745, 0.19798173010349274, 0.5254963636398315, 0.9974754452705383, 0.9976434111595154, 0.7375270128250122, 0.9998003840446472, 0.9963510036468506, 0.9999241828918457, 0.7944461703300476, 0.9996541738510132, 0.9815426468849182, 0.8329529762268066, 0.9255755543708801, 0.649965763092041, 0.9816361665725708, 0.9969000816345215, 0.9858155250549316, 0.9531360864639282, 0.9841613173484802, 0.00957278162240982, 0.9999836683273315, 0.9999887943267822, 0.9999659061431885, 0.049189742654561996, 0.9950551986694336, 0.9937531352043152, 0.9755020141601562, 0.9884998202323914, 0.9888747930526733, 0.9992043375968933, 0.997605562210083, 0.9994422793388367, 0.9999804496765137, 0.9982569813728333, 0.9991681575775146, 0.12187449634075165, 0.0007524779066443443, 0.02459927462041378, 0.982568621635437, 0.9168364405632019, 0.9893787503242493, 0.9542142152786255, 0.3557262420654297, 0.5960555672645569, 0.06133385747671127, 0.984184741973877, 0.9238367676734924, 0.3577895164489746, 0.5225395560264587, 0.0338018462061882, 0.6434614658355713, 0.829712450504303, 0.5059069991111755, 0.9933298230171204, 0.9973533153533936, 0.9997368454933167, 0.9999994039535522, 0.9986348748207092, 0.9997571110725403, 0.4306027591228485, 0.4954569339752197, 0.3053145706653595, 0.9999266862869263, 0.9997121691703796, 0.9999279975891113, 0.9999856948852539, 0.9999991655349731, 0.9606157541275024, 0.944769024848938, 0.9013367891311646, 0.5184392333030701, 0.5311821103096008, 0.28476089239120483, 0.6236992478370667, 0.9392392635345459, 0.9874454736709595, 0.9999157190322876, 0.8583700060844421, 0.8839094042778015, 0.349273681640625 ], "eval_math_runtime": 201.0565, "eval_math_samples_per_second": 3.73, "eval_math_score": -0.12344212085008621, "eval_math_steps_per_second": 0.119, "step": 100 }, { "epoch": 1.77, "learning_rate": 0.0002, "loss": 0.1371, "step": 101 }, { "epoch": 1.79, "learning_rate": 0.0002, "loss": 0.2524, "step": 102 }, { "epoch": 1.81, "learning_rate": 0.0002, "loss": 0.1579, "step": 103 }, { "epoch": 1.82, "learning_rate": 0.0002, "loss": 0.0881, "step": 104 }, { "epoch": 1.84, "learning_rate": 0.0002, "loss": 0.1482, "step": 105 }, { "epoch": 1.86, "learning_rate": 0.0002, "loss": 0.0699, "step": 106 }, { "epoch": 1.88, "learning_rate": 0.0002, "loss": 0.1098, "step": 107 }, { "epoch": 1.89, "learning_rate": 0.0002, "loss": 0.0058, "step": 108 }, { "epoch": 1.91, "learning_rate": 0.0002, "loss": 0.0782, "step": 109 }, { "epoch": 1.93, "learning_rate": 0.0002, "loss": 0.0563, "step": 110 }, { "epoch": 1.95, "learning_rate": 0.0002, "loss": 0.1709, "step": 111 }, { "epoch": 1.96, "learning_rate": 0.0002, "loss": 0.1019, "step": 112 }, { "epoch": 1.98, "learning_rate": 0.0002, "loss": 0.1572, "step": 113 }, { "epoch": 2.0, "learning_rate": 0.0002, "loss": 0.0638, "step": 114 }, { "epoch": 2.02, "learning_rate": 0.0002, "loss": 0.0045, "step": 115 }, { "epoch": 2.04, "learning_rate": 0.0002, "loss": 0.0119, "step": 116 }, { "epoch": 2.05, "learning_rate": 0.0002, "loss": 0.0043, "step": 117 }, { "epoch": 2.07, "learning_rate": 0.0002, "loss": 0.0322, "step": 118 }, { "epoch": 2.09, "learning_rate": 0.0002, "loss": 0.0713, "step": 119 }, { "epoch": 2.11, "learning_rate": 0.0002, "loss": 0.0384, "step": 120 }, { "epoch": 2.12, "learning_rate": 0.0002, "loss": 0.036, "step": 121 }, { "epoch": 2.14, "learning_rate": 0.0002, "loss": 0.0075, "step": 122 }, { "epoch": 2.16, "learning_rate": 0.0002, "loss": 0.0229, "step": 123 }, { "epoch": 2.18, "learning_rate": 0.0002, "loss": 0.0361, "step": 124 }, { "epoch": 2.19, "learning_rate": 0.0002, "loss": 0.0419, "step": 125 }, { "epoch": 2.19, "eval_math_accuracy": 0.812, "eval_math_average_probability": 0.8111705780029297, "eval_math_brier_score": 0.14748883247375488, "eval_math_loss": 0.8266459703445435, "eval_math_probabilities": [ 0.7277971506118774, 0.8027830123901367, 0.4868547320365906, 0.9999939203262329, 0.9999986886978149, 0.9999972581863403, 1.0, 1.0, 1.0, 0.9872032999992371, 0.8311556577682495, 0.9832150340080261, 0.18153256177902222, 0.0025412901304662228, 0.9529481530189514, 0.6011979579925537, 0.7700560688972473, 0.9257276654243469, 0.9997406601905823, 0.0307023823261261, 0.9148809313774109, 0.6387721300125122, 0.3300309479236603, 0.29847028851509094, 0.007153147831559181, 0.9998143315315247, 0.9984020590782166, 0.7399280071258545, 0.32706624269485474, 0.016767162829637527, 0.07364696264266968, 0.007332431152462959, 0.0012797487433999777, 0.12126252055168152, 0.9999532699584961, 0.9950354099273682, 1.0, 1.0, 1.0, 0.024065298959612846, 2.2653486666968092e-05, 0.0007619442185387015, 1.0, 1.0, 0.9999995231628418, 0.1580563634634018, 0.07029100507497787, 0.27928298711776733, 1.0, 1.0, 0.9999934434890747, 0.9973445534706116, 0.8740033507347107, 0.9953084588050842, 0.9999996423721313, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9998062252998352, 0.9885712265968323, 0.9369679093360901, 0.9999309778213501, 0.9995647072792053, 0.9999864101409912, 0.006392901763319969, 0.19513407349586487, 0.92803555727005, 0.9138030409812927, 0.9702478051185608, 0.9994045495986938, 0.9999805688858032, 0.9999998807907104, 1.0, 1.0, 1.0, 0.9999998807907104, 0.999699592590332, 0.9980478286743164, 0.9988729357719421, 0.9502097964286804, 0.9919044971466064, 0.9842649698257446, 0.9997765421867371, 1.0, 1.0, 0.009243395179510117, 0.7061121463775635, 0.9684865474700928, 1.0, 0.9999995231628418, 1.0, 0.07281903922557831, 0.9991586208343506, 0.4091057777404785, 0.9999932050704956, 0.9999966621398926, 0.9999990463256836, 0.9951953291893005, 0.9993054866790771, 0.27003559470176697, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9999836683273315, 0.9999995231628418, 0.9714744687080383, 0.34408533573150635, 0.5044399499893188, 0.7383089065551758, 0.1716051548719406, 0.036765363067388535, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999256134033203, 0.9999474287033081, 0.9999390840530396, 0.03440934047102928, 0.022082384675741196, 0.9995065927505493, 0.9999998807907104, 0.9999982118606567, 0.9999592304229736, 0.9947860240936279, 0.9581873416900635, 0.9853852391242981, 0.0754304751753807, 0.7412813305854797, 0.9746203422546387, 0.9999997615814209, 0.9999997615814209, 1.0, 0.018211551010608673, 0.9999979734420776, 0.9999473094940186, 0.9992794394493103, 0.9999896287918091, 0.9998177886009216, 1.0, 1.0, 1.0, 9.234049684891943e-06, 0.9469889402389526, 0.9384269714355469, 0.9993649125099182, 1.0, 1.0, 0.010917234234511852, 0.5184338092803955, 0.7696806192398071, 0.4510691463947296, 0.685877799987793, 0.7071782946586609, 0.9999991655349731, 0.23762810230255127, 0.998090922832489, 0.9999949932098389, 0.7707432508468628, 1.0, 0.9506340622901917, 3.1603184424966457e-07, 0.8635208010673523, 0.9187722206115723, 0.8805140256881714, 0.8915034532546997, 0.9999997615814209, 0.9999842643737793, 0.9999346733093262, 0.9647281169891357, 0.955845296382904, 0.9978925585746765, 0.5895772576332092, 0.46168532967567444, 0.05893128365278244, 0.9928586483001709, 0.999943733215332, 0.9997604489326477, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9995067119598389, 0.9539420008659363, 0.9997590184211731, 0.7703603506088257, 0.004265848081558943, 0.8577179908752441, 0.9999489784240723, 0.9999229907989502, 0.9239717125892639, 0.9999998807907104, 0.9958641529083252, 1.0, 0.49938252568244934, 0.3165890872478485, 0.7180919647216797, 1.0, 0.9086061120033264, 0.339048832654953, 0.9999926090240479, 0.9999998807907104, 0.9993600249290466, 0.9991040825843811, 0.9999979734420776, 0.999990701675415, 0.9997765421867371, 0.014967636205255985, 0.9997727274894714, 0.27487891912460327, 0.9963118433952332, 0.09778929501771927, 0.96347975730896, 0.9892358183860779, 0.23288413882255554, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9846616387367249, 0.0072943586856126785, 1.0, 0.6282187700271606, 0.9998586177825928, 1.0, 1.0, 1.0, 0.9445847868919373, 0.9996905326843262, 0.993493378162384, 0.9996079802513123, 0.9891179203987122, 0.9099753499031067, 0.9999996423721313, 1.0, 1.0, 0.9994127750396729, 0.9998581409454346, 0.816500186920166, 0.9999966621398926, 0.9999886751174927, 0.9997439980506897, 0.9999955892562866, 1.0, 0.9999996423721313, 0.9470030665397644, 0.9798897504806519, 0.9998738765716553, 0.9999892711639404, 0.9999804496765137, 0.9999343156814575, 0.999377965927124, 0.9999974966049194, 0.9999412298202515, 0.9801212549209595, 0.9990443587303162, 0.9983291029930115, 0.9999696016311646, 1.0, 0.9999825954437256, 0.9999680519104004, 0.9990491271018982, 0.9999920129776001, 0.9177113175392151, 0.0005472943303175271, 0.9128908514976501, 0.7918078303337097, 0.9780992865562439, 0.889995276927948, 0.9951162338256836, 0.9999500513076782, 0.9999473094940186, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999932050704956, 0.999916672706604, 0.9999974966049194, 0.9999539852142334, 0.9999284744262695, 0.997368574142456, 0.9999996423721313, 0.9999961853027344, 0.999923825263977, 0.9194271564483643, 0.6994236707687378, 0.20338143408298492, 1.0, 0.9999685287475586, 0.9999712705612183, 0.14616964757442474, 0.4049328565597534, 0.7785970568656921, 0.3073568046092987, 0.5017445087432861, 0.4990394115447998, 0.9999994039535522, 0.9999996423721313, 0.9999864101409912, 0.9999914169311523, 1.0, 0.9999865293502808, 5.732247454481865e-10, 9.775079234941586e-08, 2.317611658142482e-09, 0.9999970197677612, 0.9999808073043823, 0.999922513961792, 0.11552117019891739, 0.9996792078018188, 0.9857979416847229, 0.14953464269638062, 0.9999487400054932, 0.27354156970977783, 0.9999901056289673, 0.9999529123306274, 0.9998986721038818, 0.999152421951294, 1.0, 0.9999967813491821, 1.0, 1.0, 1.0, 0.9994007349014282, 0.9977643489837646, 0.9958204030990601, 0.6717868447303772, 0.4052655100822449, 0.991876482963562, 0.9529387950897217, 0.710481584072113, 0.973517894744873, 0.9999570846557617, 3.17766607622616e-05, 0.9999548196792603, 0.9999990463256836, 0.9999990463256836, 0.9999997615814209, 0.9999998807907104, 1.0, 0.9999978542327881, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.6897718906402588, 2.540655987104401e-05, 0.12953504920005798, 0.1890857070684433, 0.0011713765561580658, 8.347011970499807e-09, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999899864196777, 0.40362414717674255, 0.7868751287460327, 0.9350650906562805, 0.9980692267417908, 0.2649793028831482, 0.046439286321401596, 1.0, 0.9999998807907104, 1.0, 1.0, 0.9999816417694092, 0.9999997615814209, 0.999970555305481, 0.9999945163726807, 0.9933852553367615, 0.8582093715667725, 0.9413446187973022, 0.8972650170326233, 0.23370620608329773, 0.4547395706176758, 0.7543732523918152, 0.9999995231628418, 0.9986948370933533, 0.9999991655349731, 0.9999659061431885, 0.9999918937683105, 0.9999983310699463, 0.24331289529800415, 0.35917404294013977, 0.3480682075023651, 0.9980910420417786, 0.8933518528938293, 0.9935763478279114, 0.0010665151057764888, 0.9999967813491821, 0.9999957084655762, 1.0, 1.0, 1.0, 0.9999995231628418, 0.9973215460777283, 0.9999958276748657, 1.0, 0.992084801197052, 0.9999964237213135, 0.9999994039535522, 0.9996059536933899, 0.9999998807907104, 0.9999998807907104, 1.0, 0.9999966621398926, 0.9588165283203125, 0.9297915101051331, 0.9129531383514404, 0.9999994039535522, 1.0, 0.9999991655349731, 0.9999997615814209, 0.9999997615814209, 0.9999995231628418, 0.999998927116394, 0.9998526573181152, 0.9999998807907104, 1.0, 0.9999990463256836, 1.0, 0.9999998807907104, 1.0, 0.9999586343765259, 1.0, 1.0, 1.0, 0.9999990463256836, 0.9999998807907104, 0.9999982118606567, 0.9938641786575317, 0.9775616526603699, 0.9950580596923828, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9953336119651794, 0.38931262493133545, 0.9937404990196228, 2.0912439140374772e-06, 0.8074235320091248, 6.441356958930555e-07, 1.0, 1.0, 1.0, 1.0, 0.9824858903884888, 0.9898354411125183, 0.6535958051681519, 0.7434094548225403, 0.9584407806396484, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9195433855056763, 0.9986894726753235, 0.99977046251297, 0.8355464339256287, 0.16151851415634155, 0.009712218306958675, 0.9997686743736267, 0.9999891519546509, 0.1688336730003357, 0.999997615814209, 1.0, 1.0, 0.9985625147819519, 0.9998540878295898, 0.999992847442627, 4.246909668381704e-07, 0.09365885704755783, 0.7989708781242371, 0.9999998807907104, 0.9999997615814209, 1.0, 0.5823290944099426, 0.5787104964256287, 0.3905923068523407, 0.012789128348231316, 9.450325819670979e-07, 0.5102953910827637, 0.9999998807907104, 0.9999998807907104, 0.9999991655349731, 1.4655699942522915e-07, 0.043061595410108566, 0.894737720489502, 0.9530744552612305, 0.996482253074646, 4.545294359559193e-06, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9335569739341736, 1.0, 0.9999991655349731, 0.9999382495880127, 0.995098888874054, 0.6982179284095764, 7.006291657951635e-10, 0.03611199930310249, 0.7709771990776062, 0.9992548823356628, 0.9991263747215271, 0.99649578332901, 0.9999998807907104, 0.9998606443405151, 0.8710408210754395, 0.9986395239830017, 0.6320503950119019, 1.0, 1.0, 1.0, 0.9456174969673157, 0.00874006561934948, 0.03486586734652519, 0.9997621178627014, 0.35946205258369446, 0.812251627445221, 0.9999997615814209, 0.9999998807907104, 0.9999996423721313, 1.0, 1.0, 1.0, 0.09941577166318893, 0.12122482806444168, 0.0003380720445420593, 0.025679737329483032, 0.011161072179675102, 0.005199791397899389, 0.7904964685440063, 0.01461328100413084, 0.0019724369049072266, 0.9999963045120239, 0.9998513460159302, 0.9999454021453857, 0.4777214229106903, 0.9999966621398926, 0.9986541271209717, 0.9864298105239868, 0.9995619654655457, 0.8800662755966187, 0.9935113787651062, 0.9922391176223755, 0.9676616191864014, 0.9363653659820557, 0.998895525932312, 0.9955884218215942, 0.9897408485412598, 0.9966855645179749, 0.9983068704605103, 1.0, 0.9999998807907104, 1.0, 0.011425504460930824, 0.9999970197677612, 0.9999778270721436, 0.9999719858169556, 1.0, 0.9999971389770508, 0.9999995231628418, 0.9999998807907104, 0.8046973943710327, 1.0, 1.0, 1.0, 0.8469757437705994, 0.25426504015922546, 0.0030303478706628084, 0.9979897737503052, 0.9997308850288391, 0.995685338973999, 0.26064229011535645, 0.9639202952384949, 0.4481111764907837, 0.9917418956756592, 0.9949871301651001, 0.9752479791641235, 1.0, 0.5169793367385864, 0.9999990463256836, 0.9673287272453308, 0.9947957396507263, 0.33220523595809937, 0.9952399730682373, 0.9978243112564087, 0.9346486330032349, 0.551794171333313, 0.03983592987060547, 0.4048302173614502, 1.0, 1.0, 1.0, 0.5118873119354248, 0.9485242366790771, 0.7833495140075684, 0.4080224335193634, 0.677769660949707, 0.41923946142196655, 0.8634167313575745, 0.9999954700469971, 0.7916945219039917, 0.9753586053848267, 0.6623606085777283, 0.18700705468654633, 0.99172043800354, 0.95611172914505, 0.9956606030464172, 0.18439820408821106, 0.019669663161039352, 5.894539935979992e-05, 0.9999973773956299, 0.9999977350234985, 0.9999889135360718, 0.9999994039535522, 0.999962329864502, 1.0, 0.10403933376073837, 0.5071848630905151, 0.07808573544025421, 0.9999998807907104, 1.0, 0.4725123345851898, 0.9999786615371704, 0.9997150301933289, 0.9999921321868896, 0.9878941178321838, 0.9240275621414185, 0.9999226331710815, 0.9610640406608582, 0.896691083908081, 0.9889174699783325, 0.9951319694519043, 0.9999707937240601, 0.9986928105354309, 0.9761465191841125, 0.35523721575737, 0.07045489549636841, 0.9999982118606567, 0.9930887818336487, 1.0, 0.9999963045120239, 0.9999998807907104, 0.99730384349823, 0.13448703289031982, 0.036562323570251465, 0.20502273738384247, 0.999998927116394, 0.9999960660934448, 0.7244946956634521, 0.9998494386672974, 0.9829078316688538, 0.9999972581863403, 0.9959750771522522, 1.0, 0.9999250173568726, 0.875101625919342, 0.9730218052864075, 0.4168318808078766, 0.9999440908432007, 0.9999988079071045, 0.9999649524688721, 0.9997833371162415, 0.9999350309371948, 0.0009762503323145211, 1.0, 1.0, 1.0, 8.175714901881292e-05, 0.9999994039535522, 0.9998981952667236, 0.9980091452598572, 0.9998949766159058, 0.9995429515838623, 0.9989878535270691, 0.999470055103302, 0.9999805688858032, 1.0, 0.9999974966049194, 0.9999994039535522, 0.10120324790477753, 3.2999903396557784e-06, 0.03002418763935566, 0.9999872446060181, 0.9987792372703552, 0.9999834299087524, 0.9966452717781067, 0.31122347712516785, 0.3828766644001007, 0.16436617076396942, 0.9977967739105225, 0.9824017882347107, 0.9678383469581604, 0.9945905208587646, 0.0015231240540742874, 0.9774705171585083, 0.9907748103141785, 0.4141817092895508, 0.9998809099197388, 0.9999932050704956, 1.0, 1.0, 0.9999990463256836, 0.9999994039535522, 0.13549046218395233, 0.4492356479167938, 0.048590127378702164, 1.0, 1.0, 1.0, 0.999992847442627, 1.0, 0.9999991655349731, 0.9978771209716797, 0.9807857871055603, 0.852462112903595, 0.744598388671875, 0.7609797120094299, 0.9712187647819519, 0.9996422529220581, 0.999982476234436, 1.0, 0.9901279807090759, 0.9975380897521973, 0.06286962330341339 ], "eval_math_runtime": 201.2239, "eval_math_samples_per_second": 3.727, "eval_math_score": -0.14748883247375488, "eval_math_steps_per_second": 0.119, "step": 125 }, { "epoch": 2.21, "learning_rate": 0.0002, "loss": 0.0069, "step": 126 }, { "epoch": 2.23, "learning_rate": 0.0002, "loss": 0.0193, "step": 127 }, { "epoch": 2.25, "learning_rate": 0.0002, "loss": 0.0289, "step": 128 }, { "epoch": 2.26, "learning_rate": 0.0002, "loss": 0.0324, "step": 129 }, { "epoch": 2.28, "learning_rate": 0.0002, "loss": 0.0638, "step": 130 }, { "epoch": 2.3, "learning_rate": 0.0002, "loss": 0.0044, "step": 131 }, { "epoch": 2.32, "learning_rate": 0.0002, "loss": 0.0319, "step": 132 }, { "epoch": 2.33, "learning_rate": 0.0002, "loss": 0.0333, "step": 133 }, { "epoch": 2.35, "learning_rate": 0.0002, "loss": 0.0013, "step": 134 }, { "epoch": 2.37, "learning_rate": 0.0002, "loss": 0.0123, "step": 135 }, { "epoch": 2.39, "learning_rate": 0.0002, "loss": 0.0203, "step": 136 }, { "epoch": 2.4, "learning_rate": 0.0002, "loss": 0.0115, "step": 137 }, { "epoch": 2.42, "learning_rate": 0.0002, "loss": 0.0012, "step": 138 }, { "epoch": 2.44, "learning_rate": 0.0002, "loss": 0.0195, "step": 139 }, { "epoch": 2.46, "learning_rate": 0.0002, "loss": 0.0661, "step": 140 }, { "epoch": 2.47, "learning_rate": 0.0002, "loss": 0.4407, "step": 141 }, { "epoch": 2.49, "learning_rate": 0.0002, "loss": 0.0028, "step": 142 }, { "epoch": 2.51, "learning_rate": 0.0002, "loss": 0.0051, "step": 143 }, { "epoch": 2.53, "learning_rate": 0.0002, "loss": 0.015, "step": 144 }, { "epoch": 2.54, "learning_rate": 0.0002, "loss": 0.0053, "step": 145 }, { "epoch": 2.56, "learning_rate": 0.0002, "loss": 0.0203, "step": 146 }, { "epoch": 2.58, "learning_rate": 0.0002, "loss": 0.066, "step": 147 }, { "epoch": 2.6, "learning_rate": 0.0002, "loss": 0.0094, "step": 148 }, { "epoch": 2.61, "learning_rate": 0.0002, "loss": 0.0171, "step": 149 }, { "epoch": 2.63, "learning_rate": 0.0002, "loss": 0.0228, "step": 150 }, { "epoch": 2.63, "eval_math_accuracy": 0.8173333333333334, "eval_math_average_probability": 0.8123735189437866, "eval_math_brier_score": 0.1503276824951172, "eval_math_loss": 0.9861154556274414, "eval_math_probabilities": [ 0.8013375401496887, 0.9314551949501038, 0.8548316359519958, 0.9999860525131226, 0.9999995231628418, 0.9999992847442627, 1.0, 1.0, 1.0, 0.9875834584236145, 0.806584358215332, 0.9830207824707031, 0.09412826597690582, 0.004626914858818054, 0.9927252531051636, 0.3837220370769501, 0.5901761651039124, 0.8840576410293579, 0.9997900128364563, 0.6723666191101074, 0.9945763349533081, 0.2588123083114624, 0.17747525870800018, 0.24405743181705475, 0.00030546743073500693, 0.9998364448547363, 0.9997673630714417, 0.5942893624305725, 0.13413985073566437, 0.0001264838792849332, 0.13368922472000122, 0.03371625766158104, 0.0003731609904207289, 0.9993495345115662, 0.999998927116394, 0.9999840259552002, 1.0, 1.0, 1.0, 0.12500107288360596, 9.706079436000437e-05, 0.0015377093805000186, 1.0, 1.0, 1.0, 0.423324853181839, 0.04738793149590492, 0.9595783352851868, 1.0, 1.0, 0.9999997615814209, 0.9982461929321289, 0.9666613340377808, 0.9983869791030884, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999741315841675, 0.9934752583503723, 0.999530553817749, 0.9994489550590515, 0.9990997314453125, 0.999998927116394, 3.628988224591012e-06, 3.874532922054641e-05, 0.9594030976295471, 0.9996076226234436, 0.9999603033065796, 0.9999977350234985, 0.9998897314071655, 0.9999994039535522, 1.0, 1.0, 1.0, 1.0, 0.9999293088912964, 0.9924254417419434, 0.9995608925819397, 0.9961872696876526, 0.9998784065246582, 0.9998165965080261, 0.9998631477355957, 1.0, 1.0, 0.1038157269358635, 0.6706569790840149, 0.9998112320899963, 1.0, 1.0, 1.0, 0.00016339831927325577, 0.9991287589073181, 0.0037795265670865774, 0.9994576573371887, 0.9998612403869629, 0.9999724626541138, 0.956009566783905, 0.993010938167572, 0.7039796710014343, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999765932559967, 0.2820528745651245, 0.6299279928207397, 0.6336652040481567, 0.3558039665222168, 0.09370282292366028, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999020099639893, 0.9999381303787231, 0.999626874923706, 0.008285761810839176, 0.28629860281944275, 0.9986972212791443, 1.0, 0.9999996423721313, 0.9999862909317017, 0.9999994039535522, 0.9999887943267822, 0.9999874830245972, 0.042044878005981445, 0.9321061968803406, 0.9963555335998535, 1.0, 1.0, 1.0, 0.3860200047492981, 1.0, 0.9999998807907104, 0.9999916553497314, 1.0, 0.9999995231628418, 1.0, 1.0, 1.0, 0.002757691778242588, 0.9786230325698853, 0.9999314546585083, 0.9999998807907104, 1.0, 1.0, 0.0063841575756669044, 0.22733429074287415, 0.7775404453277588, 0.8725534081459045, 0.8787643313407898, 0.7998197674751282, 0.9999914169311523, 0.9537715911865234, 0.9986417889595032, 1.0, 0.9810090065002441, 1.0, 0.886431097984314, 9.694071934074344e-12, 0.6367807388305664, 0.9894037246704102, 0.8618413805961609, 0.8510802984237671, 1.0, 0.9999996423721313, 0.9999984502792358, 0.999876856803894, 0.9986609220504761, 0.9999315738677979, 0.8292967081069946, 0.7019312381744385, 0.05313243716955185, 0.9941936135292053, 0.999957799911499, 0.9999901056289673, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999934434890747, 0.9995505213737488, 0.999998927116394, 0.9547871351242065, 0.20637467503547668, 0.970639705657959, 0.9983748197555542, 0.9975347518920898, 0.00016294897068291903, 0.999854564666748, 0.9901902675628662, 1.0, 0.7507430911064148, 0.4289851784706116, 0.7692642211914062, 1.0, 0.987250030040741, 0.37637728452682495, 0.9999990463256836, 1.0, 0.9999799728393555, 0.9999802112579346, 1.0, 0.9999923706054688, 0.9999997615814209, 0.3259419798851013, 0.9999991655349731, 0.2552535831928253, 0.9980631470680237, 0.06544894725084305, 0.9999732971191406, 0.9999955892562866, 0.9998372793197632, 1.0, 1.0, 1.0, 0.9999996423721313, 0.9975197911262512, 0.5841714143753052, 1.0, 0.9574158787727356, 0.9998970031738281, 1.0, 1.0, 1.0, 0.6411216855049133, 0.9985402822494507, 0.9859752058982849, 0.9994297623634338, 0.964752197265625, 0.5752678513526917, 1.0, 1.0, 1.0, 0.9989848732948303, 0.9999115467071533, 0.6878409385681152, 0.9999189376831055, 0.9999120235443115, 0.995975911617279, 0.9999997615814209, 1.0, 1.0, 0.1681661754846573, 0.7973651885986328, 0.9994065761566162, 0.9999799728393555, 0.999944806098938, 0.999813973903656, 0.9999018907546997, 0.9999984502792358, 0.9999896287918091, 0.9988738894462585, 0.9998786449432373, 0.9999608993530273, 0.9999732971191406, 0.9999998807907104, 0.99998939037323, 0.9999760389328003, 0.9995062351226807, 0.9999954700469971, 0.9956061244010925, 0.024145647883415222, 0.9983270764350891, 0.6660557389259338, 0.9836204051971436, 0.6327917575836182, 0.9996160268783569, 0.9999996423721313, 0.9999996423721313, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9998818635940552, 0.9970947504043579, 0.9999696016311646, 0.9997180104255676, 0.9984706044197083, 0.9895830154418945, 1.0, 1.0, 0.9999867677688599, 0.9567256569862366, 0.835687518119812, 0.26758259534835815, 1.0, 0.9999995231628418, 0.9999997615814209, 0.3386020064353943, 0.02621171995997429, 0.09037907421588898, 0.884045422077179, 0.004892504774034023, 0.6903680562973022, 0.9999998807907104, 1.0, 0.9999938011169434, 1.0, 1.0, 0.9999998807907104, 1.3667625191338129e-11, 1.223246226533803e-10, 1.0703382624654978e-10, 0.9999991655349731, 0.9999902248382568, 0.9999276399612427, 0.013238473795354366, 0.9999037981033325, 0.9456169009208679, 0.15231184661388397, 0.9998143315315247, 0.2462969273328781, 0.9999982118606567, 0.9999011754989624, 0.9999822378158569, 0.9999998807907104, 1.0, 0.9999996423721313, 1.0, 1.0, 1.0, 0.9998801946640015, 0.9992941617965698, 0.9996227025985718, 0.49947381019592285, 0.773683488368988, 0.7495631575584412, 0.9914714694023132, 0.8433712124824524, 0.9930216670036316, 1.0, 0.12694352865219116, 1.0, 0.9999997615814209, 0.9999996423721313, 1.0, 1.0, 1.0, 0.9999754428863525, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.7310255765914917, 0.00015754048945382237, 0.18860241770744324, 0.36668017506599426, 0.0013610894093289971, 4.5892196709473865e-08, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9998258948326111, 0.5630912780761719, 0.9028489589691162, 0.5615326166152954, 0.9895362854003906, 0.2493039071559906, 0.004865061957389116, 1.0, 1.0, 1.0, 1.0, 0.9999997615814209, 1.0, 0.9999971389770508, 0.9999998807907104, 0.9999781847000122, 0.9443056583404541, 0.9885308146476746, 0.9916579127311707, 0.20568718016147614, 0.6671643853187561, 0.8548428416252136, 0.9999984502792358, 0.9999040365219116, 0.9999997615814209, 0.9999872446060181, 0.9999995231628418, 0.9999994039535522, 0.2364906519651413, 0.26867327094078064, 0.3899894654750824, 0.9994576573371887, 0.9731547832489014, 0.9930405616760254, 3.3906187582033454e-06, 0.9999938011169434, 0.9999898672103882, 1.0, 1.0, 1.0, 0.9999997615814209, 0.9947762489318848, 0.9999977350234985, 1.0, 0.9999970197677612, 1.0, 1.0, 0.9999780654907227, 1.0, 1.0, 1.0, 0.999996542930603, 0.9971051812171936, 0.9931198358535767, 0.9169993996620178, 0.9999996423721313, 1.0, 0.9999985694885254, 1.0, 1.0, 1.0, 1.0, 0.9999886751174927, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999996423721313, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9998375177383423, 0.9979928731918335, 0.9999395608901978, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.8662083745002747, 0.4484540820121765, 0.9451032876968384, 1.079612510501704e-09, 0.34920734167099, 4.0221700969844676e-10, 1.0, 1.0, 1.0, 1.0, 0.9271144866943359, 0.9859262704849243, 0.44345295429229736, 0.7953904867172241, 0.9704682230949402, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.04335547238588333, 0.9712350964546204, 0.999152421951294, 0.5257843136787415, 0.4494398832321167, 0.06004317104816437, 0.9999988079071045, 0.9999997615814209, 0.0011444150004535913, 0.9999996423721313, 1.0, 1.0, 0.9964385032653809, 0.9999990463256836, 1.0, 2.623837076498603e-07, 0.5280252695083618, 0.9992178678512573, 1.0, 1.0, 1.0, 0.1339375078678131, 0.13180135190486908, 0.1905062049627304, 0.000467888341518119, 3.064124939555768e-06, 0.13624770939350128, 1.0, 1.0, 1.0, 3.408656112924291e-08, 0.16251231729984283, 0.9798438549041748, 0.7015630006790161, 0.9041873216629028, 1.2836075258260138e-10, 1.0, 1.0, 1.0, 1.0, 0.9999871253967285, 1.0, 1.0, 0.9998838901519775, 0.9999394416809082, 0.8373131155967712, 1.4827262972971766e-08, 0.3150058388710022, 0.29522576928138733, 0.9995960593223572, 0.9994776844978333, 0.9988191723823547, 1.0, 0.9999843835830688, 0.5316330194473267, 0.9965636134147644, 0.5601105093955994, 1.0, 1.0, 1.0, 0.9167428016662598, 0.08630324900150299, 0.04801918566226959, 0.9999905824661255, 0.7210108637809753, 0.9632091522216797, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.001368520432151854, 0.44137340784072876, 4.46082367488998e-07, 0.014893393963575363, 7.927860860945657e-05, 3.0144636184559204e-05, 0.9219545125961304, 0.00040464577614329755, 0.0019052838906645775, 0.9999995231628418, 0.9998750686645508, 0.9999843835830688, 0.039543867111206055, 0.9999978542327881, 0.9997649788856506, 0.999862790107727, 0.9999538660049438, 0.9999476671218872, 0.9999995231628418, 0.9998470544815063, 0.998896598815918, 0.9310318231582642, 0.9706305861473083, 0.9547158479690552, 0.9997546076774597, 0.9999420642852783, 0.9999750852584839, 0.9999998807907104, 0.9999992847442627, 1.0, 0.05296103656291962, 0.9999997615814209, 0.999997615814209, 0.9999804496765137, 1.0, 0.9999982118606567, 0.9999881982803345, 0.9999953508377075, 0.3090629279613495, 1.0, 1.0, 1.0, 0.9641543030738831, 0.162003755569458, 1.1198824978464472e-08, 0.9999984502792358, 0.9999997615814209, 0.9999690055847168, 0.34002864360809326, 0.866601824760437, 0.31299951672554016, 0.9979495406150818, 0.999607264995575, 0.9919095635414124, 1.0, 0.7935293912887573, 1.0, 0.9996896982192993, 0.9999908208847046, 0.5728018879890442, 0.9970682263374329, 0.9433049559593201, 0.05691097676753998, 0.5190537571907043, 0.09756164997816086, 0.4926547706127167, 1.0, 1.0, 1.0, 0.140238419175148, 0.7690957188606262, 0.14415645599365234, 0.4156700074672699, 0.76800537109375, 0.3694034814834595, 0.9473482966423035, 0.9999995231628418, 0.9880309700965881, 0.9966617822647095, 0.9684865474700928, 0.5419439077377319, 0.9887546300888062, 0.9976277947425842, 0.9963235855102539, 0.10684535652399063, 0.049848590046167374, 2.2275351511780173e-05, 0.9999996423721313, 0.9999938011169434, 0.9999970197677612, 0.9999995231628418, 0.999998927116394, 1.0, 0.16500046849250793, 0.8352866768836975, 0.008565324358642101, 1.0, 1.0, 0.6229800581932068, 1.0, 0.9999996423721313, 1.0, 0.9503698945045471, 0.7764531373977661, 0.9998452663421631, 0.9988025426864624, 0.9984924793243408, 0.9997652173042297, 0.9981012940406799, 0.9999963045120239, 0.9991951584815979, 0.8756048679351807, 0.4760726988315582, 0.004721361678093672, 0.9999946355819702, 0.9974653720855713, 1.0, 0.9999890327453613, 1.0, 0.9988269209861755, 0.27219709753990173, 0.03230009227991104, 0.5680275559425354, 1.0, 1.0, 0.9999452829360962, 0.9999998807907104, 0.9999934434890747, 1.0, 0.9955700039863586, 1.0, 0.9999992847442627, 0.8627943992614746, 0.9095977544784546, 0.659582257270813, 0.9983355402946472, 0.9997095465660095, 0.9964626431465149, 0.9999984502792358, 1.0, 0.030000710859894753, 0.9999992847442627, 0.999998927116394, 0.9999984502792358, 0.0006043959874659777, 0.9999997615814209, 0.999984860420227, 0.9981796741485596, 0.9995179176330566, 0.9989068508148193, 0.999998927116394, 0.9999996423721313, 1.0, 0.9999998807907104, 0.9999887943267822, 0.9999960660934448, 0.00458217179402709, 4.050582447234774e-08, 0.032959192991256714, 0.9999997615814209, 0.9997100234031677, 0.9999862909317017, 0.9907854795455933, 0.041441790759563446, 0.5416333079338074, 0.0019115419127047062, 0.9876692891120911, 0.9675129055976868, 0.9583655595779419, 0.962476909160614, 0.00040163073572330177, 0.592214047908783, 0.6923621892929077, 0.04770148545503616, 0.9999997615814209, 1.0, 1.0, 1.0, 1.0, 1.0, 0.05341428145766258, 0.4959639012813568, 0.0387398861348629, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9700018763542175, 0.9987285733222961, 0.9567697644233704, 0.9788364768028259, 0.6728900671005249, 0.03654106333851814, 0.8037645220756531, 0.999988317489624, 0.9999910593032837, 1.0, 0.9988821148872375, 0.9999183416366577, 0.10121521353721619 ], "eval_math_runtime": 201.1127, "eval_math_samples_per_second": 3.729, "eval_math_score": -0.1503276824951172, "eval_math_steps_per_second": 0.119, "step": 150 }, { "epoch": 2.65, "learning_rate": 0.0002, "loss": 0.1084, "step": 151 }, { "epoch": 2.67, "learning_rate": 0.0002, "loss": 0.0068, "step": 152 }, { "epoch": 2.68, "learning_rate": 0.0002, "loss": 0.0192, "step": 153 }, { "epoch": 2.7, "learning_rate": 0.0002, "loss": 0.0007, "step": 154 }, { "epoch": 2.72, "learning_rate": 0.0002, "loss": 0.0093, "step": 155 }, { "epoch": 2.74, "learning_rate": 0.0002, "loss": 0.4069, "step": 156 }, { "epoch": 2.75, "learning_rate": 0.0002, "loss": 0.0231, "step": 157 }, { "epoch": 2.77, "learning_rate": 0.0002, "loss": 0.0249, "step": 158 }, { "epoch": 2.79, "learning_rate": 0.0002, "loss": 0.0465, "step": 159 }, { "epoch": 2.81, "learning_rate": 0.0002, "loss": 0.0339, "step": 160 }, { "epoch": 2.82, "learning_rate": 0.0002, "loss": 0.0126, "step": 161 }, { "epoch": 2.84, "learning_rate": 0.0002, "loss": 0.044, "step": 162 }, { "epoch": 2.86, "learning_rate": 0.0002, "loss": 0.0039, "step": 163 }, { "epoch": 2.88, "learning_rate": 0.0002, "loss": 0.0104, "step": 164 }, { "epoch": 2.89, "learning_rate": 0.0002, "loss": 0.0077, "step": 165 }, { "epoch": 2.91, "learning_rate": 0.0002, "loss": 0.0045, "step": 166 }, { "epoch": 2.93, "learning_rate": 0.0002, "loss": 0.0046, "step": 167 }, { "epoch": 2.95, "learning_rate": 0.0002, "loss": 0.0006, "step": 168 }, { "epoch": 2.96, "learning_rate": 0.0002, "loss": 0.0037, "step": 169 }, { "epoch": 2.98, "learning_rate": 0.0002, "loss": 0.0015, "step": 170 }, { "epoch": 3.0, "learning_rate": 0.0002, "loss": 0.0005, "step": 171 }, { "epoch": 3.02, "learning_rate": 0.0002, "loss": 0.0002, "step": 172 }, { "epoch": 3.04, "learning_rate": 0.0002, "loss": 0.0006, "step": 173 }, { "epoch": 3.05, "learning_rate": 0.0002, "loss": 0.0006, "step": 174 }, { "epoch": 3.07, "learning_rate": 0.0002, "loss": 0.0009, "step": 175 }, { "epoch": 3.07, "eval_math_accuracy": 0.8146666666666667, "eval_math_average_probability": 0.8137734532356262, "eval_math_brier_score": 0.15471577644348145, "eval_math_loss": 1.0626981258392334, "eval_math_probabilities": [ 0.9990401864051819, 0.9987272620201111, 0.992990255355835, 0.9999898672103882, 0.9999997615814209, 0.9999998807907104, 1.0, 1.0, 1.0, 0.9728721976280212, 0.8585329055786133, 0.9908590912818909, 0.14412620663642883, 0.001532719936221838, 0.9974506497383118, 0.9440782070159912, 0.8894739151000977, 0.9655789136886597, 0.9999969005584717, 0.046698544174432755, 0.84991055727005, 0.06470396369695663, 0.14673376083374023, 0.06983377039432526, 0.0008099137339740992, 0.9999977350234985, 0.9999711513519287, 0.7851619124412537, 0.10993026942014694, 0.001358301960863173, 0.12340006977319717, 0.06653755158185959, 0.001990212593227625, 0.3402368426322937, 0.9999992847442627, 0.9979918003082275, 1.0, 1.0, 1.0, 0.016542166471481323, 7.5074708547617774e-06, 0.006214377470314503, 1.0, 1.0, 1.0, 0.2964445650577545, 0.009193255566060543, 0.8081239461898804, 1.0, 1.0, 0.9999990463256836, 0.9991704225540161, 0.9817942380905151, 0.9994243383407593, 0.9999954700469971, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999980926513672, 0.9998148083686829, 0.9986660480499268, 0.9999996423721313, 0.9999556541442871, 1.0, 0.00495552783831954, 7.593000646011205e-07, 0.9921602606773376, 0.9999892711639404, 0.9999995231628418, 1.0, 0.9999784231185913, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9996719360351562, 0.9906655550003052, 0.8584807515144348, 0.9861146211624146, 0.9997432827949524, 0.9992426633834839, 1.0, 1.0, 1.0, 0.001492238137871027, 0.0008931801421567798, 0.9783450365066528, 1.0, 1.0, 1.0, 0.013829193077981472, 0.9998140931129456, 0.04624401032924652, 1.0, 1.0, 1.0, 0.9999955892562866, 0.9999996423721313, 0.9991575479507446, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.8526838421821594, 0.9136449098587036, 0.2602793574333191, 0.03755372390151024, 0.0015360014513134956, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.00029442523373290896, 0.0037117621395736933, 0.9921257495880127, 1.0, 1.0, 0.9999998807907104, 0.9999438524246216, 0.9969388246536255, 0.9983986020088196, 0.9545691013336182, 0.9993365406990051, 0.9999376535415649, 1.0, 1.0, 1.0, 0.8301631808280945, 1.0, 0.9999995231628418, 0.9999572038650513, 1.0, 0.9999995231628418, 1.0, 1.0, 1.0, 1.3713188309338875e-05, 0.06747108697891235, 0.9962239265441895, 1.0, 1.0, 1.0, 0.03728414326906204, 0.039646245539188385, 0.5828949809074402, 0.9998270869255066, 0.9995706677436829, 0.9993738532066345, 1.0, 0.037353385239839554, 0.9999655485153198, 1.0, 0.999991774559021, 1.0, 0.983221173286438, 1.7699909246604584e-11, 0.8077591061592102, 0.8392825126647949, 0.5420300960540771, 0.3936152756214142, 1.0, 0.9999488592147827, 0.999983549118042, 0.5788662433624268, 0.9992992877960205, 0.9998276233673096, 0.9443360567092896, 0.8417370915412903, 0.16528591513633728, 0.9905800223350525, 0.9983306527137756, 0.9999901056289673, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999023675918579, 0.9683210849761963, 0.999988317489624, 0.9999415874481201, 0.9999957084655762, 0.999997615814209, 0.9999998807907104, 1.0, 0.8416310548782349, 0.9999992847442627, 0.9978169202804565, 1.0, 0.503063976764679, 0.3205845057964325, 0.7619945406913757, 1.0, 0.9724015593528748, 0.040657006204128265, 0.9999880790710449, 1.0, 0.999943733215332, 0.9999992847442627, 1.0, 0.9999995231628418, 0.9999696016311646, 2.475651683653268e-07, 0.9999685287475586, 0.3144243657588959, 0.9996678829193115, 0.04895547777414322, 0.7712210416793823, 0.9998718500137329, 0.0006084964843466878, 1.0, 1.0, 1.0, 1.0, 0.9996429681777954, 0.22703875601291656, 1.0, 0.9224922060966492, 0.9984037280082703, 1.0, 1.0, 1.0, 0.978492796421051, 0.9999865293502808, 0.9955130219459534, 0.9955315589904785, 0.9883583188056946, 0.014311742968857288, 1.0, 1.0, 1.0, 0.999847412109375, 0.9999481439590454, 0.7282890677452087, 0.9999995231628418, 0.9999994039535522, 0.9999988079071045, 0.9999978542327881, 1.0, 1.0, 0.8281816244125366, 0.9703561663627625, 0.9999955892562866, 0.9993914365768433, 0.999782145023346, 0.9994189739227295, 0.9999938011169434, 1.0, 0.9999997615814209, 0.9984651803970337, 0.999846339225769, 0.9999393224716187, 0.9995711445808411, 0.9999995231628418, 0.9999943971633911, 0.9989761114120483, 0.8968200087547302, 0.9998999834060669, 0.9999997615814209, 0.03544827550649643, 0.9791728258132935, 0.7340118885040283, 0.9689418077468872, 0.6578278541564941, 0.9999951124191284, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999856948852539, 0.9999934434890747, 0.9999973773956299, 0.9999986886978149, 0.9999867677688599, 0.9998176693916321, 1.0, 1.0, 0.9999876022338867, 0.9880357384681702, 0.8985042572021484, 0.08799797296524048, 1.0, 0.9999872446060181, 0.9999966621398926, 0.4059300124645233, 0.43999266624450684, 0.4693898856639862, 0.05972497910261154, 0.06925104558467865, 0.17788393795490265, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 9.891370220723589e-14, 4.6595713398822625e-11, 1.0105333236865022e-09, 1.0, 1.0, 1.0, 0.9517166018486023, 1.0, 0.9956894516944885, 0.007123964373022318, 0.999930739402771, 0.041421979665756226, 0.9999998807907104, 0.999998927116394, 0.9999881982803345, 0.9997259974479675, 1.0, 0.9998683929443359, 1.0, 1.0, 1.0, 0.9999489784240723, 0.9993582367897034, 0.9999630451202393, 0.9851099252700806, 0.9946240782737732, 0.9523754715919495, 0.9971790313720703, 0.8289161324501038, 0.9971576929092407, 0.999502420425415, 1.455617564261047e-07, 0.9991152882575989, 1.0, 1.0, 1.0, 0.9999996423721313, 1.0, 0.9991115927696228, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.8905442357063293, 8.842635907058138e-06, 0.09604618698358536, 0.5051009058952332, 2.2474454453913495e-05, 1.7724465450896787e-08, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.0990268811583519, 0.9600505828857422, 0.009496508166193962, 0.9997155070304871, 0.32724931836128235, 6.584483799088048e-06, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999986886978149, 0.9999992847442627, 0.451722115278244, 0.9999934434890747, 0.9996824264526367, 0.9997389912605286, 0.19974850118160248, 0.538529634475708, 0.7431250214576721, 1.0, 1.0, 1.0, 0.9999982118606567, 0.9999994039535522, 0.9999995231628418, 0.18700622022151947, 0.14439693093299866, 0.32009536027908325, 0.9994550347328186, 0.998538613319397, 0.997115969657898, 1.333532782155089e-05, 0.9999998807907104, 0.9999973773956299, 1.0, 1.0, 1.0, 1.0, 0.9999676942825317, 1.0, 1.0, 0.9999706745147705, 0.9999995231628418, 1.0, 0.9997789263725281, 1.0, 1.0, 1.0, 0.9999997615814209, 0.05575035139918327, 0.8600127100944519, 0.03493482992053032, 1.0, 1.0, 0.9999997615814209, 0.999998927116394, 0.9999998807907104, 0.9999998807907104, 1.0, 0.9999998807907104, 0.9999971389770508, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999996423721313, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999059438705444, 0.9149354100227356, 0.9997159838676453, 1.0, 1.0, 1.0, 0.999970555305481, 1.0, 1.0, 0.047714415937662125, 0.7098724842071533, 0.9955945611000061, 3.4075087196328013e-10, 0.1154840886592865, 1.64075808495312e-09, 1.0, 1.0, 1.0, 1.0, 0.3473905026912689, 0.9999080896377563, 0.22831693291664124, 0.6795331239700317, 0.9389440417289734, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.7527579665184021, 0.7162756323814392, 0.9993732571601868, 0.1263236701488495, 0.8965207934379578, 0.37124794721603394, 0.9999523162841797, 0.9999991655349731, 0.0002532133075874299, 1.0, 1.0, 1.0, 0.9999583959579468, 1.0, 1.0, 7.745942980363907e-07, 1.1071019656583303e-07, 0.994113028049469, 1.0, 1.0, 1.0, 0.6711134314537048, 0.5298965573310852, 0.8271860480308533, 0.00017123730503953993, 1.8794050042907247e-14, 0.42171671986579895, 1.0, 1.0, 1.0, 4.546691023676885e-09, 0.3331426978111267, 0.9987671375274658, 0.4903581142425537, 0.9054309725761414, 6.642333211237528e-11, 1.0, 1.0, 1.0, 1.0, 0.9999744892120361, 1.0, 0.9999983310699463, 0.9996669292449951, 0.9999814033508301, 0.9889362454414368, 2.484112155798357e-05, 0.9980807304382324, 0.696157693862915, 0.9996155500411987, 0.99955815076828, 0.9976807832717896, 1.0, 0.9998243451118469, 0.9560290575027466, 0.9999905824661255, 0.5026838183403015, 1.0, 1.0, 1.0, 0.5209113955497742, 0.8488134145736694, 0.16006849706172943, 0.9987471103668213, 0.24784989655017853, 0.8073166012763977, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.261514914105646e-05, 0.0038095342461019754, 0.0002635067794471979, 0.0639372393488884, 0.11227517575025558, 0.5321599245071411, 0.989807665348053, 0.2414666712284088, 0.02018623985350132, 0.9999997615814209, 0.9999039173126221, 0.9999954700469971, 0.21458499133586884, 0.9999995231628418, 0.999990701675415, 0.881115734577179, 0.8066745400428772, 0.9924944639205933, 0.999907374382019, 0.9975889921188354, 0.9712552428245544, 0.9990943670272827, 0.9998785257339478, 0.9991596937179565, 0.9994702935218811, 0.9999079704284668, 0.9999827146530151, 1.0, 1.0, 1.0, 0.742490291595459, 1.0, 1.0, 0.999705970287323, 1.0, 1.0, 1.0, 1.0, 0.9995859265327454, 1.0, 1.0, 1.0, 0.9738973379135132, 0.03604697063565254, 0.00012342529953457415, 1.0, 1.0, 0.9999998807907104, 0.17038381099700928, 0.7521790266036987, 0.14294403791427612, 0.9999077320098877, 0.9999926090240479, 0.9999716281890869, 1.0, 0.9949796795845032, 1.0, 0.9999723434448242, 0.9999674558639526, 0.4444352686405182, 0.9997939467430115, 0.9997506737709045, 0.9994034767150879, 0.9726321697235107, 0.004706015344709158, 0.3484872877597809, 1.0, 1.0, 1.0, 0.10951845347881317, 0.37027284502983093, 0.1197509691119194, 0.3329557180404663, 0.6248264908790588, 0.4261712431907654, 0.9111721515655518, 1.0, 0.9980667233467102, 0.9162835478782654, 0.7125499248504639, 0.03716486319899559, 0.9926445484161377, 0.9387626051902771, 0.9858793616294861, 0.153243750333786, 0.28029054403305054, 0.00013486744137480855, 0.9999998807907104, 0.9999998807907104, 0.9999998807907104, 1.0, 1.0, 1.0, 0.17196521162986755, 0.9549118876457214, 0.00013849844981450588, 1.0, 1.0, 0.4793822765350342, 1.0, 1.0, 1.0, 0.943040132522583, 0.965853750705719, 0.9997691512107849, 0.9999496936798096, 0.9997149109840393, 0.9999384880065918, 0.9944784641265869, 0.9999992847442627, 0.9965695142745972, 0.9976879358291626, 0.9313705563545227, 0.715369462966919, 0.9999978542327881, 0.9998656511306763, 1.0, 0.9899875521659851, 1.0, 0.998982846736908, 0.06542608141899109, 0.06343347579240799, 0.5361071228981018, 1.0, 1.0, 0.9596670269966125, 1.0, 1.0, 1.0, 0.9845635890960693, 1.0, 0.9999510049819946, 0.987837553024292, 0.9966650605201721, 0.8610681891441345, 0.9990130662918091, 0.999990701675415, 0.999830961227417, 0.9999997615814209, 1.0, 0.8219539523124695, 1.0, 1.0, 1.0, 4.810346581507474e-05, 0.9999997615814209, 0.9999922513961792, 0.9997045397758484, 0.9999978542327881, 0.9999690055847168, 1.0, 1.0, 1.0, 0.9999994039535522, 0.9999946355819702, 0.9999769926071167, 0.0878731906414032, 0.0017266833456233144, 0.11466622352600098, 1.0, 0.9725052118301392, 0.9999997615814209, 0.9993066787719727, 0.523610532283783, 0.08682649582624435, 6.390136695699766e-05, 0.9999953508377075, 0.9997202754020691, 0.9970471262931824, 0.9829849600791931, 2.1631365143548464e-06, 0.9730200171470642, 0.9469166994094849, 0.10515039414167404, 0.9801472425460815, 0.9999988079071045, 1.0, 1.0, 0.9999998807907104, 0.9999725818634033, 0.02941068448126316, 0.18748149275779724, 0.0559183694422245, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9789361953735352, 0.9986873269081116, 0.8353451490402222, 0.3999749422073364, 0.7329229712486267, 0.3486204445362091, 0.996717631816864, 0.9999657869338989, 0.9999728202819824, 1.0, 0.9935615062713623, 0.999413013458252, 0.2904314398765564 ], "eval_math_runtime": 201.0823, "eval_math_samples_per_second": 3.73, "eval_math_score": -0.15471577644348145, "eval_math_steps_per_second": 0.119, "step": 175 }, { "epoch": 3.09, "learning_rate": 0.0002, "loss": 0.0035, "step": 176 }, { "epoch": 3.11, "learning_rate": 0.0002, "loss": 0.005, "step": 177 }, { "epoch": 3.12, "learning_rate": 0.0002, "loss": 0.0031, "step": 178 }, { "epoch": 3.14, "learning_rate": 0.0002, "loss": 0.0007, "step": 179 }, { "epoch": 3.16, "learning_rate": 0.0002, "loss": 0.0033, "step": 180 }, { "epoch": 3.18, "learning_rate": 0.0002, "loss": 0.0007, "step": 181 }, { "epoch": 3.19, "learning_rate": 0.0002, "loss": 0.0049, "step": 182 }, { "epoch": 3.21, "learning_rate": 0.0002, "loss": 0.0006, "step": 183 }, { "epoch": 3.23, "learning_rate": 0.0002, "loss": 0.0002, "step": 184 }, { "epoch": 3.25, "learning_rate": 0.0002, "loss": 0.0001, "step": 185 }, { "epoch": 3.26, "learning_rate": 0.0002, "loss": 0.0018, "step": 186 }, { "epoch": 3.28, "learning_rate": 0.0002, "loss": 0.0012, "step": 187 }, { "epoch": 3.3, "learning_rate": 0.0002, "loss": 0.0006, "step": 188 }, { "epoch": 3.32, "learning_rate": 0.0002, "loss": 0.0008, "step": 189 }, { "epoch": 3.33, "learning_rate": 0.0002, "loss": 0.0005, "step": 190 }, { "epoch": 3.35, "learning_rate": 0.0002, "loss": 0.0091, "step": 191 }, { "epoch": 3.37, "learning_rate": 0.0002, "loss": 0.0001, "step": 192 }, { "epoch": 3.39, "learning_rate": 0.0002, "loss": 0.0042, "step": 193 }, { "epoch": 3.4, "learning_rate": 0.0002, "loss": 0.0026, "step": 194 }, { "epoch": 3.42, "learning_rate": 0.0002, "loss": 0.0002, "step": 195 }, { "epoch": 3.44, "learning_rate": 0.0002, "loss": 0.0002, "step": 196 }, { "epoch": 3.46, "learning_rate": 0.0002, "loss": 0.0051, "step": 197 }, { "epoch": 3.47, "learning_rate": 0.0002, "loss": 0.0136, "step": 198 }, { "epoch": 3.49, "learning_rate": 0.0002, "loss": 0.0102, "step": 199 }, { "epoch": 3.51, "learning_rate": 0.0002, "loss": 0.0, "step": 200 }, { "epoch": 3.51, "eval_math_accuracy": 0.812, "eval_math_average_probability": 0.817578911781311, "eval_math_brier_score": 0.15400166809558868, "eval_math_loss": 1.1789568662643433, "eval_math_probabilities": [ 0.9989752769470215, 0.9973324537277222, 0.9781664609909058, 0.999998927116394, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 0.9455435276031494, 0.9538608193397522, 0.9958062171936035, 0.14330339431762695, 0.00010313162056263536, 0.9956098198890686, 0.9880791306495667, 0.9453150033950806, 0.9824998378753662, 1.0, 0.17790347337722778, 0.9239442348480225, 0.28049951791763306, 0.3071887195110321, 0.08757153898477554, 0.0005521251587197185, 0.9998822212219238, 0.9980151653289795, 0.8964991569519043, 0.2079169899225235, 0.014785338193178177, 0.2328769862651825, 0.1759934425354004, 0.0014180701691657305, 0.05975380167365074, 0.9999998807907104, 0.999525785446167, 1.0, 1.0, 1.0, 0.002930088434368372, 2.0323278704381664e-07, 0.00019066348613705486, 1.0, 1.0, 1.0, 0.04983333498239517, 0.0014338864712044597, 0.0003973495913669467, 1.0, 1.0, 0.9999998807907104, 0.9999936819076538, 0.9999395608901978, 0.9999991655349731, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999864101409912, 0.9999037981033325, 0.9999300241470337, 0.9969236254692078, 0.9999998807907104, 0.8056594729423523, 4.097121530932668e-10, 0.9999294281005859, 0.9999772310256958, 0.9999982118606567, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999730587005615, 0.9928679466247559, 0.9750414490699768, 0.9934279322624207, 0.9999994039535522, 0.9999858140945435, 1.0, 1.0, 1.0, 0.006611410528421402, 0.005841359030455351, 0.8911345601081848, 1.0, 1.0, 1.0, 0.007063216529786587, 0.9999258518218994, 0.015810109674930573, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 0.9999788999557495, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9924005270004272, 0.971751868724823, 0.5219942927360535, 0.05883925035595894, 0.001362619805149734, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0002443851553834975, 0.0006116696167737246, 0.9797990322113037, 1.0, 1.0, 1.0, 0.9999951124191284, 0.999821126461029, 0.999860405921936, 0.8105773329734802, 0.9885267019271851, 0.9991815686225891, 1.0, 1.0, 1.0, 0.989629328250885, 1.0, 1.0, 0.9999933242797852, 1.0, 0.9999997615814209, 1.0, 1.0, 1.0, 1.1250280294916593e-05, 0.720708966255188, 0.9991662502288818, 1.0, 1.0, 1.0, 0.014321298338472843, 0.01484810933470726, 0.37655776739120483, 0.9999806880950928, 0.9999815225601196, 0.9999804496765137, 0.9999991655349731, 0.10144103318452835, 0.9988210797309875, 1.0, 0.9999984502792358, 1.0, 0.9791492819786072, 1.6520802087471864e-11, 0.908384382724762, 0.2808012068271637, 0.26942282915115356, 0.012740486301481724, 1.0, 0.9999998807907104, 1.0, 0.20134292542934418, 0.9997625946998596, 0.999976634979248, 0.9836745262145996, 0.8890628814697266, 0.2904449999332428, 0.9986652135848999, 0.9997708201408386, 0.9999995231628418, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999951124191284, 0.985145092010498, 0.999998927116394, 0.9999698400497437, 0.9999964237213135, 0.9999973773956299, 1.0, 1.0, 0.9956191182136536, 1.0, 0.9999204874038696, 1.0, 0.6842242479324341, 0.5312840938568115, 0.8540053963661194, 1.0, 0.9888477325439453, 0.010059783235192299, 0.9999998807907104, 1.0, 0.9999994039535522, 1.0, 1.0, 1.0, 0.9999186992645264, 6.605974101070444e-10, 0.9999610185623169, 0.1936216801404953, 0.9984524250030518, 0.05747690796852112, 0.9384328126907349, 0.9987215399742126, 7.68278641771758e-06, 1.0, 1.0, 1.0, 1.0, 0.9993016719818115, 0.012396248988807201, 1.0, 0.6999374628067017, 0.9999423027038574, 1.0, 1.0, 1.0, 0.9813883304595947, 0.9999843835830688, 0.9911417961120605, 0.9986923336982727, 0.997849702835083, 0.11826018244028091, 1.0, 1.0, 1.0, 0.9999672174453735, 0.999988317489624, 0.8188163638114929, 1.0, 0.9999998807907104, 0.9999998807907104, 1.0, 1.0, 1.0, 0.387207955121994, 0.9909895062446594, 0.9999988079071045, 0.9989514350891113, 0.999470055103302, 0.9990677237510681, 0.9999994039535522, 1.0, 1.0, 0.9999617338180542, 0.9999947547912598, 0.999998927116394, 0.9999536275863647, 1.0, 0.9999998807907104, 0.9985466599464417, 0.3708987534046173, 0.9999309778213501, 0.9999990463256836, 0.018295221030712128, 0.9985673427581787, 0.8879684805870056, 0.998237133026123, 0.9082358479499817, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9998358488082886, 0.9999352693557739, 0.9999762773513794, 0.9999973773956299, 0.9999878406524658, 0.9998339414596558, 1.0, 1.0, 0.9999970197677612, 0.977920413017273, 0.8039851188659668, 0.09512217342853546, 1.0, 0.9999673366546631, 0.9999905824661255, 0.8206048011779785, 0.28189781308174133, 0.28185710310935974, 0.19695468246936798, 0.4376080334186554, 0.036542825400829315, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.491510787428543e-16, 1.941467386162854e-12, 1.971316339333118e-11, 1.0, 1.0, 0.9999997615814209, 0.10383754968643188, 0.9999996423721313, 0.8471006155014038, 0.01503017172217369, 0.9998810291290283, 0.14970161020755768, 1.0, 1.0, 0.9999995231628418, 0.9999996423721313, 1.0, 0.9999985694885254, 1.0, 1.0, 1.0, 0.9999774694442749, 0.9996809959411621, 0.9999650716781616, 0.9790534377098083, 0.9907841682434082, 0.9515441656112671, 0.9998539686203003, 0.8997371196746826, 0.9999363422393799, 0.9971963167190552, 2.5126857039481365e-08, 0.9955344200134277, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999963045120239, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9006873965263367, 2.735212547122501e-05, 0.15637394785881042, 0.3802877366542816, 9.166647032543551e-06, 8.591977823657615e-12, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.06190912425518036, 0.9828693270683289, 0.006239749025553465, 0.9958494901657104, 0.07459395378828049, 3.2882533105293987e-06, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999996423721313, 0.9999998807907104, 0.4309370815753937, 0.9999985694885254, 0.9995620846748352, 0.9999568462371826, 0.4266990125179291, 0.9343335032463074, 0.740191638469696, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.23730652034282684, 0.1985214352607727, 0.29451486468315125, 0.9999995231628418, 0.999995231628418, 0.9999110698699951, 2.9919547159806825e-06, 1.0, 0.9999997615814209, 1.0, 1.0, 1.0, 1.0, 0.9996718168258667, 1.0, 1.0, 0.9999970197677612, 1.0, 1.0, 0.9907419085502625, 1.0, 1.0, 1.0, 1.0, 0.032439056783914566, 0.9905992150306702, 0.06698240339756012, 0.9999997615814209, 1.0, 0.9999982118606567, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9999943971633911, 0.9990602135658264, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9993889331817627, 0.8533952236175537, 0.9982933402061462, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0024305556435137987, 0.5389343500137329, 0.9989866614341736, 1.2822486995800464e-11, 0.3037671148777008, 5.73039705964451e-11, 1.0, 1.0, 1.0, 1.0, 0.25766798853874207, 0.9999994039535522, 0.3321100175380707, 0.5594395399093628, 0.9460130333900452, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9751082062721252, 0.9245894551277161, 0.99993896484375, 0.3039478361606598, 0.9680384397506714, 0.16745427250862122, 0.9999985694885254, 1.0, 0.00810698326677084, 1.0, 1.0, 1.0, 0.9999821186065674, 0.9999998807907104, 1.0, 6.111010808496076e-09, 3.981035234801311e-08, 0.9803204536437988, 1.0, 1.0, 1.0, 0.7257767915725708, 0.7147145867347717, 0.9312700033187866, 0.0007203257409855723, 4.437765191672542e-14, 0.4373508095741272, 1.0, 1.0, 1.0, 1.2190730647176906e-09, 0.4293443262577057, 0.9973382353782654, 0.33416110277175903, 0.9039080142974854, 9.907986974269645e-14, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999634027481079, 0.9999997615814209, 0.9551252126693726, 4.1908506318577565e-06, 0.9878270030021667, 0.8717851638793945, 0.9995375871658325, 0.9987284541130066, 0.9999933242797852, 1.0, 0.9999995231628418, 0.997658371925354, 0.9999996423721313, 0.8339645862579346, 1.0, 1.0, 1.0, 0.9259528517723083, 0.9701093435287476, 0.13950304687023163, 0.9993630051612854, 0.006953650154173374, 0.911760151386261, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.750448046157544e-07, 0.0014124350855126977, 0.0010716755641624331, 0.0016481204656884074, 0.005328086670488119, 0.18805575370788574, 0.963187038898468, 0.46385833621025085, 0.008377807214856148, 1.0, 0.9999996423721313, 1.0, 0.39896565675735474, 1.0, 0.9999990463256836, 0.9302987456321716, 0.948409914970398, 0.9842395782470703, 0.9999904632568359, 0.9998809099197388, 0.9986080527305603, 0.9986492991447449, 0.9995759129524231, 0.9972543120384216, 0.9964600205421448, 0.9988264441490173, 0.9998624324798584, 1.0, 1.0, 1.0, 0.6788930892944336, 1.0, 1.0, 0.9999982118606567, 1.0, 1.0, 1.0, 1.0, 0.9998632669448853, 1.0, 1.0, 1.0, 0.9854147434234619, 0.04118681699037552, 4.174317291472107e-05, 1.0, 1.0, 0.9999998807907104, 0.21482643485069275, 0.9057621359825134, 0.18454979360103607, 0.9999979734420776, 0.9999998807907104, 0.9999997615814209, 1.0, 0.9986037611961365, 1.0, 0.9999946355819702, 0.999998927116394, 0.8125267028808594, 0.9992870688438416, 0.9992330074310303, 0.9984642267227173, 0.8697814345359802, 0.0004905774840153754, 0.12900853157043457, 1.0, 1.0, 1.0, 0.08434952795505524, 0.4270342290401459, 0.051315344870090485, 0.25851330161094666, 0.5043827295303345, 0.44651567935943604, 0.9984631538391113, 1.0, 0.9999111890792847, 0.9559395909309387, 0.6779343485832214, 0.17000412940979004, 0.9384064674377441, 0.9923171997070312, 0.9889487028121948, 0.5623910427093506, 0.6906800866127014, 9.901214070850983e-05, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.14219199120998383, 0.8972190618515015, 0.00020136097737122327, 1.0, 1.0, 0.5359618663787842, 1.0, 1.0, 1.0, 0.99908447265625, 0.9873766899108887, 1.0, 0.9995644688606262, 0.9975838661193848, 0.9996160268783569, 0.9966199398040771, 0.9999982118606567, 0.9931509494781494, 0.9995269775390625, 0.9917048215866089, 0.5464566349983215, 0.9999997615814209, 0.9999762773513794, 1.0, 0.9966385364532471, 1.0, 0.9991340041160583, 0.3836880028247833, 0.0823424682021141, 0.6615832448005676, 1.0, 1.0, 0.9997053742408752, 1.0, 1.0, 1.0, 0.9973020553588867, 1.0, 0.9999998807907104, 0.999201238155365, 0.9998823404312134, 0.9354981184005737, 0.9995704293251038, 0.9999821186065674, 0.9998503923416138, 1.0, 1.0, 0.760455846786499, 1.0, 1.0, 1.0, 0.003919582813978195, 0.9999997615814209, 0.9999973773956299, 0.9994673132896423, 0.9999932050704956, 0.9999206066131592, 1.0, 1.0, 1.0, 0.9999792575836182, 0.9999716281890869, 0.9998552799224854, 0.08288458734750748, 0.00022703816648572683, 0.051696427166461945, 0.9999998807907104, 0.7324085831642151, 0.9999978542327881, 0.9864097237586975, 0.2977037727832794, 0.23934032022953033, 0.009107098914682865, 0.9999998807907104, 0.9999793767929077, 0.9910548329353333, 0.9842772483825684, 2.272885879506248e-08, 0.968065083026886, 0.9387175440788269, 0.0445549301803112, 0.9246771335601807, 0.9999951124191284, 0.9999998807907104, 1.0, 1.0, 0.9999985694885254, 0.023405911400914192, 0.275566428899765, 0.1079031229019165, 1.0, 1.0, 1.0, 1.0, 1.0, 0.983066201210022, 0.9990818500518799, 0.9448419213294983, 0.21015606820583344, 0.7426583766937256, 0.3157001733779907, 0.9939349293708801, 1.0, 1.0, 1.0, 0.999123752117157, 0.9999667406082153, 0.2357679307460785 ], "eval_math_runtime": 200.9972, "eval_math_samples_per_second": 3.731, "eval_math_score": -0.15400166809558868, "eval_math_steps_per_second": 0.119, "step": 200 }, { "epoch": 3.53, "learning_rate": 0.0002, "loss": 0.0078, "step": 201 }, { "epoch": 3.54, "learning_rate": 0.0002, "loss": 0.1523, "step": 202 }, { "epoch": 3.56, "learning_rate": 0.0002, "loss": 0.0008, "step": 203 }, { "epoch": 3.58, "learning_rate": 0.0002, "loss": 0.0001, "step": 204 }, { "epoch": 3.6, "learning_rate": 0.0002, "loss": 0.0078, "step": 205 }, { "epoch": 3.61, "learning_rate": 0.0002, "loss": 0.0009, "step": 206 }, { "epoch": 3.63, "learning_rate": 0.0002, "loss": 0.0019, "step": 207 }, { "epoch": 3.65, "learning_rate": 0.0002, "loss": 0.0001, "step": 208 }, { "epoch": 3.67, "learning_rate": 0.0002, "loss": 0.0001, "step": 209 }, { "epoch": 3.68, "learning_rate": 0.0002, "loss": 0.0062, "step": 210 }, { "epoch": 3.7, "learning_rate": 0.0002, "loss": 0.0023, "step": 211 }, { "epoch": 3.72, "learning_rate": 0.0002, "loss": 0.0035, "step": 212 }, { "epoch": 3.74, "learning_rate": 0.0002, "loss": 0.0, "step": 213 }, { "epoch": 3.75, "learning_rate": 0.0002, "loss": 0.0002, "step": 214 }, { "epoch": 3.77, "learning_rate": 0.0002, "loss": 0.0001, "step": 215 }, { "epoch": 3.79, "learning_rate": 0.0002, "loss": 0.0036, "step": 216 }, { "epoch": 3.81, "learning_rate": 0.0002, "loss": 0.0001, "step": 217 }, { "epoch": 3.82, "learning_rate": 0.0002, "loss": 0.0001, "step": 218 }, { "epoch": 3.84, "learning_rate": 0.0002, "loss": 0.0002, "step": 219 }, { "epoch": 3.86, "learning_rate": 0.0002, "loss": 0.0823, "step": 220 }, { "epoch": 3.88, "learning_rate": 0.0002, "loss": 0.0, "step": 221 }, { "epoch": 3.89, "learning_rate": 0.0002, "loss": 0.0, "step": 222 }, { "epoch": 3.91, "learning_rate": 0.0002, "loss": 0.0001, "step": 223 }, { "epoch": 3.93, "learning_rate": 0.0002, "loss": 0.0066, "step": 224 }, { "epoch": 3.95, "learning_rate": 0.0002, "loss": 0.0043, "step": 225 }, { "epoch": 3.95, "eval_math_accuracy": 0.804, "eval_math_average_probability": 0.808824896812439, "eval_math_brier_score": 0.16282209753990173, "eval_math_loss": 1.2952638864517212, "eval_math_probabilities": [ 0.9706417322158813, 0.9846718907356262, 0.8952536582946777, 0.9999997615814209, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9991888403892517, 0.9526705145835876, 0.9987301230430603, 0.7891477346420288, 0.0007642070995643735, 0.999446451663971, 0.9277735948562622, 0.9072503447532654, 0.988109827041626, 1.0, 0.9318724870681763, 0.9903764128684998, 0.45719870924949646, 0.20697513222694397, 0.14454273879528046, 0.018254518508911133, 0.9999980926513672, 0.9999978542327881, 0.9559594392776489, 0.4603410065174103, 0.00014582766743842512, 0.13143222033977509, 0.0872623473405838, 5.221122410148382e-05, 0.9076762795448303, 0.9999998807907104, 0.9998292922973633, 1.0, 1.0, 1.0, 0.09970349818468094, 1.290838895329216e-06, 6.486649908765685e-06, 1.0, 1.0, 1.0, 0.005696411244571209, 0.0057044546119868755, 0.0024017433170229197, 1.0, 1.0, 0.9999998807907104, 0.9999963045120239, 0.9999750852584839, 0.9999996423721313, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999082088470459, 0.9999440908432007, 0.9999998807907104, 0.9999817609786987, 1.0, 0.0002286812523379922, 0.18104393780231476, 0.990439772605896, 0.9999996423721313, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999393105506897, 0.992260754108429, 0.9577414989471436, 0.9998912811279297, 1.0, 0.9999951124191284, 0.9992470741271973, 1.0, 1.0, 0.00026100088143721223, 0.00037966875243000686, 0.3427738845348358, 1.0, 1.0, 1.0, 0.0006787048187106848, 0.9999901056289673, 0.0026381751522421837, 1.0, 1.0, 1.0, 0.9997825026512146, 0.9999978542327881, 0.9990053772926331, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999986886978149, 0.47934556007385254, 0.8953709602355957, 0.8561629056930542, 0.21664723753929138, 0.07900407165288925, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0007909336709417403, 0.0012741503305733204, 0.9997157454490662, 1.0, 1.0, 0.9999997615814209, 0.9998856782913208, 0.9971067309379578, 0.9990335702896118, 0.07902522385120392, 0.8762469291687012, 0.9985880255699158, 1.0, 1.0, 1.0, 0.9434992074966431, 1.0, 1.0, 0.9999699592590332, 0.9999998807907104, 0.9999986886978149, 1.0, 1.0, 1.0, 1.579264790052548e-05, 0.26425257325172424, 0.9981809854507446, 1.0, 1.0, 1.0, 9.403418516740203e-05, 0.010393640026450157, 0.11236788332462311, 0.9992184638977051, 0.9983662962913513, 0.9975119829177856, 1.0, 0.07885700464248657, 0.9994779229164124, 1.0, 0.9999998807907104, 1.0, 0.9749891757965088, 7.413156595248438e-07, 0.8926994204521179, 0.9691872000694275, 0.8440073728561401, 0.7541455626487732, 1.0, 0.9999972581863403, 1.0, 0.7615059614181519, 0.9998371601104736, 0.9999964237213135, 0.9817590713500977, 0.8076852560043335, 0.16788966953754425, 0.9989317059516907, 0.9999905824661255, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999992847442627, 1.0, 0.9999678134918213, 0.9999998807907104, 1.0, 0.9999997615814209, 0.9999998807907104, 0.9467378854751587, 1.0, 0.9999921321868896, 1.0, 0.39714616537094116, 0.36284998059272766, 0.6953575015068054, 1.0, 0.9369472861289978, 0.030851390212774277, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 0.9999936819076538, 5.4083342547528446e-05, 0.9999996423721313, 0.24048249423503876, 0.9995935559272766, 0.04488503560423851, 0.9825201630592346, 0.9786176681518555, 0.012516157701611519, 1.0, 1.0, 1.0, 1.0, 0.9954144954681396, 0.002456173300743103, 1.0, 0.6604348421096802, 0.9999996423721313, 1.0, 1.0, 1.0, 0.7986140847206116, 0.9973446726799011, 0.9853296875953674, 0.9875493049621582, 0.9587642550468445, 0.1461123526096344, 1.0, 1.0, 1.0, 0.9999861717224121, 0.9999908208847046, 0.7831220030784607, 0.9999998807907104, 0.9999991655349731, 0.999954342842102, 1.0, 1.0, 1.0, 0.0052849119529128075, 0.9907429814338684, 0.999997615814209, 0.9997604489326477, 0.9993782043457031, 0.9997749924659729, 0.3625594973564148, 0.999995231628418, 0.999947190284729, 0.9997007846832275, 0.9999816417694092, 0.9999898672103882, 0.9999998807907104, 0.9999998807907104, 1.0, 0.9983997941017151, 0.4521876871585846, 0.9998948574066162, 0.9999995231628418, 6.763240190110764e-09, 0.9963536262512207, 0.8816318511962891, 0.9969484210014343, 0.9697087407112122, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999249279499054, 0.999468982219696, 0.999936580657959, 0.9987937211990356, 0.9896653294563293, 0.9569419026374817, 1.0, 1.0, 1.0, 0.9735385775566101, 0.7912425398826599, 0.059316325932741165, 1.0, 0.9999948740005493, 0.9999980926513672, 0.9253392815589905, 0.7945635914802551, 0.87114018201828, 0.7260909676551819, 0.23449820280075073, 0.006390088237822056, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 9.280467517499479e-17, 2.413783860559949e-14, 1.8848707317165037e-12, 0.999998927116394, 0.9999959468841553, 0.9999452829360962, 0.0054239737801253796, 0.999998927116394, 0.006428026594221592, 0.06054966524243355, 0.9999911785125732, 0.07841720432043076, 0.9999998807907104, 0.9999979734420776, 0.9999994039535522, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999706745147705, 0.9997573494911194, 0.9999289512634277, 0.04789188131690025, 0.01035921648144722, 0.14362643659114838, 0.9783550500869751, 0.4605717658996582, 0.997329592704773, 0.9988734126091003, 5.515474640560569e-06, 0.9992828965187073, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.6649224758148193, 1.2685531146416906e-05, 0.06486199796199799, 0.7254611849784851, 2.0710545811652992e-07, 1.1392920027525344e-12, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.05928812548518181, 0.9946936964988708, 0.06098834052681923, 0.9960618615150452, 0.2801995575428009, 2.9034583349130116e-05, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999995231628418, 0.9999985694885254, 0.09500633180141449, 0.9759634733200073, 0.15097065269947052, 0.9355214834213257, 0.24540452659130096, 0.9327775239944458, 0.7483738660812378, 0.9999994039535522, 0.9997846484184265, 0.9999998807907104, 0.9999997615814209, 1.0, 1.0, 0.22208625078201294, 0.23741979897022247, 0.268512487411499, 0.9999991655349731, 0.9999765157699585, 0.9999203681945801, 2.0177290949163762e-08, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 0.7135330438613892, 0.9999998807907104, 1.0, 0.9999949932098389, 1.0, 1.0, 0.949107825756073, 1.0, 1.0, 1.0, 1.0, 0.06842835247516632, 0.9930127263069153, 0.18104112148284912, 0.9999998807907104, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 0.9999998807907104, 0.999930739402771, 0.9999991655349731, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999065399169922, 0.9029042720794678, 0.9997671246528625, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.08998490869998932, 0.619822084903717, 0.9877819418907166, 2.1134902855601823e-11, 0.413900226354599, 1.376147351454804e-12, 1.0, 1.0, 1.0, 1.0, 0.38076797127723694, 0.9999803304672241, 0.2021111100912094, 0.5055441856384277, 0.9714845418930054, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9793798923492432, 0.7188885807991028, 0.9997914433479309, 0.926612377166748, 0.9886481165885925, 0.030588069930672646, 0.9999979734420776, 1.0, 2.128147207258735e-05, 1.0, 1.0, 1.0, 0.9880730509757996, 0.9999771118164062, 0.9999997615814209, 6.533409191433748e-07, 1.1517039411046426e-06, 0.9240750074386597, 1.0, 1.0, 1.0, 0.10456167161464691, 0.1881374567747116, 0.48613595962524414, 0.0003068427904509008, 2.905704288291844e-10, 0.4322112798690796, 1.0, 1.0, 1.0, 1.7076299485552227e-08, 0.7840625643730164, 0.998678982257843, 0.250895231962204, 0.9489893913269043, 3.622772451494262e-14, 1.0, 1.0, 1.0, 1.0, 0.9995811581611633, 1.0, 1.0, 1.0, 1.0, 0.9928398132324219, 0.00033953122328966856, 0.9992839694023132, 0.6495595574378967, 0.9997938275337219, 0.9992583394050598, 0.9998347759246826, 1.0, 0.9999985694885254, 0.9950990080833435, 0.9999995231628418, 0.9230369925498962, 1.0, 1.0, 1.0, 0.8615275025367737, 0.007838877849280834, 0.01490688230842352, 0.9998173117637634, 3.930665843654424e-05, 0.3263368606567383, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0002897108206525445, 0.0001205415537697263, 0.00020480959210544825, 6.903044891259924e-08, 9.8094083966771e-08, 2.2171840896589856e-07, 0.7433765530586243, 0.21118827164173126, 0.009009170345962048, 1.0, 0.9999998807907104, 1.0, 0.3603222072124481, 1.0, 1.0, 0.9999558925628662, 0.999671220779419, 0.9999359846115112, 0.9999998807907104, 0.9999947547912598, 1.0, 0.9903106093406677, 0.9990986585617065, 0.9991243481636047, 0.9999452829360962, 0.9999724626541138, 0.9999960660934448, 1.0, 1.0, 1.0, 0.9967784285545349, 1.0, 1.0, 0.9999760389328003, 1.0, 0.9999951124191284, 1.0, 1.0, 0.9888626337051392, 1.0, 1.0, 1.0, 0.9945936799049377, 0.1390402466058731, 4.475206316634228e-11, 1.0, 1.0, 1.0, 0.3523513078689575, 0.9831036329269409, 0.3083052337169647, 0.9999991655349731, 0.9999994039535522, 0.9999988079071045, 1.0, 0.9999498128890991, 1.0, 0.999993085861206, 0.9999994039535522, 0.7507104277610779, 0.999954104423523, 0.9999961853027344, 0.9999740123748779, 0.8699168562889099, 0.020094864070415497, 0.09618552774190903, 1.0, 1.0, 1.0, 0.023516027256846428, 0.8858917951583862, 0.024188851937651634, 0.2270546406507492, 0.6246189475059509, 0.24953116476535797, 0.9999407529830933, 1.0, 0.9999878406524658, 0.9876118302345276, 0.7903306484222412, 0.08687328547239304, 0.9953305721282959, 0.9995219707489014, 0.9980658888816833, 0.6849855184555054, 0.6899132132530212, 0.00014821632066741586, 0.9999990463256836, 0.9999998807907104, 0.9999978542327881, 1.0, 1.0, 1.0, 0.1155683845281601, 0.7466058731079102, 0.0011878986842930317, 1.0, 1.0, 0.4678317606449127, 0.9999998807907104, 0.9999897480010986, 1.0, 0.999809205532074, 0.9940348267555237, 1.0, 0.9997089505195618, 0.9987003803253174, 0.9998956918716431, 0.9559615850448608, 0.9999991655349731, 0.9939144253730774, 0.4112422466278076, 0.46821871399879456, 3.1665822461945936e-05, 0.9999949932098389, 0.9993744492530823, 1.0, 0.9983957409858704, 0.9999997615814209, 0.9678035974502563, 0.18310512602329254, 0.014947858639061451, 0.6058992147445679, 1.0, 1.0, 0.9999525547027588, 1.0, 0.9999994039535522, 1.0, 0.9970133304595947, 1.0, 0.9999996423721313, 0.9999462366104126, 0.9999961853027344, 0.9869771599769592, 0.9824628829956055, 0.9979039430618286, 0.9890301823616028, 1.0, 1.0, 0.983063280582428, 1.0, 1.0, 1.0, 0.013231697492301464, 1.0, 0.9999986886978149, 0.9994801878929138, 0.9999949932098389, 0.9999070167541504, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9999845027923584, 0.9999630451202393, 0.01615145616233349, 7.724278816567676e-08, 0.00016008615784812719, 0.9999997615814209, 0.029994608834385872, 0.9999936819076538, 0.9996126294136047, 0.7007139325141907, 0.8628748059272766, 3.819091034529265e-07, 0.999991774559021, 0.9959047436714172, 0.6361640691757202, 0.9926528930664062, 4.0034223047769046e-08, 0.6469495892524719, 0.9979839324951172, 0.9339000582695007, 0.9865078926086426, 0.9998464584350586, 0.9999988079071045, 1.0, 1.0, 1.0, 0.027308287099003792, 0.1933271288871765, 0.15404973924160004, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9996637105941772, 0.9992727637290955, 0.9965044260025024, 0.8586398363113403, 0.9394081830978394, 0.20759522914886475, 0.9953486323356628, 0.9999996423721313, 0.9999998807907104, 1.0, 0.996324360370636, 0.9988683462142944, 0.31930458545684814 ], "eval_math_runtime": 201.0151, "eval_math_samples_per_second": 3.731, "eval_math_score": -0.16282209753990173, "eval_math_steps_per_second": 0.119, "step": 225 }, { "epoch": 3.96, "learning_rate": 0.0002, "loss": 0.0001, "step": 226 }, { "epoch": 3.98, "learning_rate": 0.0002, "loss": 0.0021, "step": 227 }, { "epoch": 4.0, "learning_rate": 0.0002, "loss": 0.0, "step": 228 }, { "epoch": 4.02, "learning_rate": 0.0002, "loss": 0.0, "step": 229 }, { "epoch": 4.04, "learning_rate": 0.0002, "loss": 0.0001, "step": 230 }, { "epoch": 4.05, "learning_rate": 0.0002, "loss": 0.0001, "step": 231 }, { "epoch": 4.07, "learning_rate": 0.0002, "loss": 0.0003, "step": 232 }, { "epoch": 4.09, "learning_rate": 0.0002, "loss": 0.0, "step": 233 }, { "epoch": 4.11, "learning_rate": 0.0002, "loss": 0.0003, "step": 234 }, { "epoch": 4.12, "learning_rate": 0.0002, "loss": 0.0004, "step": 235 }, { "epoch": 4.14, "learning_rate": 0.0002, "loss": 0.0001, "step": 236 }, { "epoch": 4.16, "learning_rate": 0.0002, "loss": 0.0006, "step": 237 }, { "epoch": 4.18, "learning_rate": 0.0002, "loss": 0.0003, "step": 238 }, { "epoch": 4.19, "learning_rate": 0.0002, "loss": 0.0001, "step": 239 }, { "epoch": 4.21, "learning_rate": 0.0002, "loss": 0.0, "step": 240 }, { "epoch": 4.23, "learning_rate": 0.0002, "loss": 0.0001, "step": 241 }, { "epoch": 4.25, "learning_rate": 0.0002, "loss": 0.0043, "step": 242 }, { "epoch": 4.26, "learning_rate": 0.0002, "loss": 0.0002, "step": 243 }, { "epoch": 4.28, "learning_rate": 0.0002, "loss": 0.0, "step": 244 }, { "epoch": 4.3, "learning_rate": 0.0002, "loss": 0.0001, "step": 245 }, { "epoch": 4.32, "learning_rate": 0.0002, "loss": 0.0001, "step": 246 }, { "epoch": 4.33, "learning_rate": 0.0002, "loss": 0.0001, "step": 247 }, { "epoch": 4.35, "learning_rate": 0.0002, "loss": 0.0002, "step": 248 }, { "epoch": 4.37, "learning_rate": 0.0002, "loss": 0.0, "step": 249 }, { "epoch": 4.39, "learning_rate": 0.0002, "loss": 0.0004, "step": 250 }, { "epoch": 4.39, "eval_math_accuracy": 0.812, "eval_math_average_probability": 0.8123654723167419, "eval_math_brier_score": 0.1613004356622696, "eval_math_loss": 1.3319684267044067, "eval_math_probabilities": [ 0.9741411209106445, 0.9881205558776855, 0.9425725340843201, 0.9999994039535522, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999040365219116, 0.9048265218734741, 0.9989646673202515, 0.885695219039917, 0.004438477568328381, 0.9997897744178772, 0.8243713974952698, 0.8913780450820923, 0.9942822456359863, 1.0, 0.6356664896011353, 0.8980053067207336, 0.5816526412963867, 0.1231098622083664, 0.04076016694307327, 0.061139944940805435, 0.9999998807907104, 1.0, 0.978892982006073, 0.5748351216316223, 0.0008021540124900639, 0.09379920363426208, 0.0491364486515522, 8.934139259508811e-06, 0.8736464977264404, 1.0, 0.9997097849845886, 1.0, 1.0, 1.0, 0.14475835859775543, 0.06397636234760284, 0.0003403585869818926, 1.0, 1.0, 1.0, 0.14117911458015442, 0.010709831491112709, 0.0004302920133341104, 1.0, 1.0, 0.9999996423721313, 0.9999974966049194, 0.9998610019683838, 0.999998927116394, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9971213936805725, 0.9999879598617554, 0.9999997615814209, 0.9999873638153076, 1.0, 6.918422150192782e-05, 0.6608961224555969, 0.9872472286224365, 0.9999997615814209, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999929666519165, 0.9997953772544861, 0.9995731711387634, 0.9999479055404663, 0.9999998807907104, 0.9999502897262573, 0.9997664093971252, 1.0, 1.0, 1.74569522641832e-05, 0.0005521214916370809, 0.24506542086601257, 1.0, 1.0, 1.0, 0.0005008330917917192, 0.9999094009399414, 0.004186431877315044, 1.0, 1.0, 1.0, 0.9959837198257446, 0.9999756813049316, 0.9929238557815552, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9989527463912964, 0.12387906759977341, 0.49940013885498047, 0.8129159212112427, 0.1349012404680252, 0.017026375979185104, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 0.0006247059791348875, 0.0005426732823252678, 0.9998218417167664, 1.0, 1.0, 0.9999990463256836, 0.9999405145645142, 0.9976321458816528, 0.9994082450866699, 0.14649708569049835, 0.943533718585968, 0.9998915195465088, 1.0, 1.0, 1.0, 0.5915393829345703, 1.0, 1.0, 0.9999550580978394, 0.9999997615814209, 0.999992847442627, 1.0, 1.0, 1.0, 8.847656118859959e-08, 0.7661390900611877, 0.997654378414154, 1.0, 1.0, 1.0, 0.00044505970436148345, 0.02661844715476036, 0.01408118475228548, 0.9996157884597778, 0.9987187385559082, 0.9990633130073547, 1.0, 0.022006502375006676, 0.999581515789032, 1.0, 0.9999988079071045, 1.0, 0.9936020970344543, 2.3589992181882735e-09, 0.9318777918815613, 0.9938832521438599, 0.989939272403717, 0.9848682284355164, 1.0, 1.0, 1.0, 0.9801909923553467, 0.9997428059577942, 0.9999958276748657, 0.9594303965568542, 0.768364429473877, 0.1272604614496231, 0.9999939203262329, 0.9999997615814209, 0.9999997615814209, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999833106994629, 1.0, 0.9999643564224243, 0.9999998807907104, 1.0, 1.0, 1.0, 0.9998461008071899, 1.0, 0.999976634979248, 1.0, 0.23212166130542755, 0.14497193694114685, 0.7078603506088257, 1.0, 0.4899677634239197, 0.1985165774822235, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 0.9999094009399414, 3.104321513092145e-05, 0.9999990463256836, 0.32414352893829346, 0.9998193383216858, 0.041744016110897064, 0.9823594689369202, 0.9991675615310669, 0.01144142635166645, 1.0, 1.0, 1.0, 1.0, 0.9991076588630676, 0.009626530110836029, 1.0, 0.9929787516593933, 1.0, 1.0, 1.0, 1.0, 0.859512984752655, 0.995345413684845, 0.9880235195159912, 0.992313802242279, 0.9505258202552795, 0.23239129781723022, 1.0, 1.0, 1.0, 0.9999991655349731, 0.9999985694885254, 0.8359873294830322, 0.9999998807907104, 0.9999994039535522, 0.9999762773513794, 1.0, 1.0, 1.0, 0.0005230226088315248, 0.9985369443893433, 0.9999938011169434, 0.9999879598617554, 0.9999680519104004, 0.9999932050704956, 0.0006850910140201449, 0.9997329115867615, 0.9672356843948364, 0.9993072748184204, 0.999988317489624, 0.9999736547470093, 1.0, 0.9999998807907104, 1.0, 0.9999716281890869, 0.9856376051902771, 0.9999959468841553, 0.9998348951339722, 1.0437944952812472e-10, 0.9485979080200195, 0.8302844762802124, 0.9841005802154541, 0.8874624371528625, 0.9999644756317139, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999841570854187, 0.9998916387557983, 0.9999942779541016, 0.9986818432807922, 0.9924619793891907, 0.9308562278747559, 1.0, 1.0, 1.0, 0.9903333783149719, 0.8363292217254639, 0.045719653367996216, 1.0, 0.9999985694885254, 0.9999994039535522, 0.991084098815918, 0.4497230052947998, 0.5501145720481873, 0.862385094165802, 0.14162123203277588, 0.009293337352573872, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.5380951510729165e-17, 2.3830143299597524e-15, 3.0828234388012576e-13, 1.0, 0.9999997615814209, 0.9999957084655762, 0.001973476493731141, 0.9999964237213135, 0.0018946706550195813, 0.18821823596954346, 0.9999998807907104, 0.08549052476882935, 1.0, 0.9999955892562866, 0.9999997615814209, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999945163726807, 0.9999387264251709, 0.9999330043792725, 0.01647505722939968, 0.006083548069000244, 0.05134065821766853, 0.9365686774253845, 0.3662651479244232, 0.994441568851471, 0.9994832277297974, 1.4600455870095175e-05, 0.9997501969337463, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.5849418640136719, 1.3734671711063129e-06, 0.01081871334463358, 0.8283438086509705, 3.225946088036835e-08, 9.367904875759968e-15, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.08383513987064362, 0.9965433478355408, 0.20835945010185242, 0.9918138980865479, 0.1676061451435089, 1.8304428976989584e-06, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9999995231628418, 0.48147428035736084, 0.9866858720779419, 0.027203381061553955, 0.9459337592124939, 0.11230636388063431, 0.8144705295562744, 0.7917433381080627, 0.9999992847442627, 0.9999850988388062, 1.0, 0.9999998807907104, 1.0, 1.0, 0.18327580392360687, 0.19192561507225037, 0.16897690296173096, 0.9999996423721313, 0.9999926090240479, 0.9999758005142212, 1.6779736711214355e-07, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.8615950345993042, 1.0, 1.0, 0.9999827146530151, 1.0, 1.0, 0.9849662780761719, 1.0, 1.0, 1.0, 1.0, 0.9341269135475159, 0.9972115159034729, 0.9160809516906738, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999395608901978, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999920129776001, 0.9915720224380493, 0.9999881982803345, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.8531895875930786, 0.6042506694793701, 0.9937329888343811, 2.0052832283568023e-08, 0.045877791941165924, 1.091580927210789e-12, 1.0, 1.0, 1.0, 1.0, 0.5181328654289246, 0.9999738931655884, 0.27935269474983215, 0.6290788054466248, 0.9922479391098022, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9791086316108704, 0.6892402768135071, 0.9991676807403564, 0.9586399793624878, 0.9947065711021423, 0.1303037852048874, 0.9999997615814209, 1.0, 0.002620456274598837, 1.0, 1.0, 1.0, 0.8805500268936157, 0.9999896287918091, 1.0, 4.3760584844676487e-07, 9.313931741417036e-07, 0.8813202381134033, 1.0, 1.0, 1.0, 0.1709742546081543, 0.4545031189918518, 0.8428913354873657, 8.450386667391285e-05, 1.4805924498581535e-12, 0.4547331929206848, 1.0, 1.0, 1.0, 6.539921493242673e-09, 0.8675456643104553, 0.9996874332427979, 0.19884993135929108, 0.975166916847229, 5.052567115778131e-14, 1.0, 1.0, 1.0, 1.0, 0.02612978406250477, 1.0, 1.0, 1.0, 1.0, 0.959337592124939, 1.3698307839149493e-06, 0.992318868637085, 0.7397592663764954, 0.9999552965164185, 0.9998980760574341, 0.993587851524353, 1.0, 0.9999526739120483, 0.999995231628418, 0.9999995231628418, 0.9640495777130127, 1.0, 1.0, 1.0, 0.9646381139755249, 0.0013541507069021463, 0.010744565166532993, 0.9999831914901733, 0.00034956372110173106, 0.4249313175678253, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.1128406748175621, 0.00022558016644325107, 0.002447534818202257, 9.273719001612335e-07, 2.0397916955516848e-07, 4.408197418204196e-10, 0.8959543108940125, 0.323490709066391, 0.0032306495122611523, 1.0, 0.9999998807907104, 1.0, 0.17555712163448334, 1.0, 0.9999998807907104, 0.9999996423721313, 0.9995049238204956, 0.9999716281890869, 0.9999986886978149, 0.9999853372573853, 0.9999983310699463, 0.9999269247055054, 0.9999773502349854, 0.9999788999557495, 0.9999957084655762, 0.9999929666519165, 0.9999995231628418, 1.0, 1.0, 1.0, 0.9454662799835205, 1.0, 1.0, 0.9999970197677612, 1.0, 0.9999986886978149, 1.0, 1.0, 0.9995023012161255, 1.0, 1.0, 1.0, 0.9986119270324707, 0.0944746881723404, 9.965504810249826e-11, 0.9999998807907104, 1.0, 0.9999998807907104, 0.38539543747901917, 0.9847621917724609, 0.2926565110683441, 0.9999966621398926, 0.9999970197677612, 0.9999945163726807, 1.0, 0.999038815498352, 1.0, 0.9999767541885376, 0.9999938011169434, 0.6397589445114136, 0.9999979734420776, 1.0, 0.9999997615814209, 0.8607320189476013, 0.02910822443664074, 0.039598532021045685, 1.0, 1.0, 1.0, 0.01062098704278469, 0.8583924770355225, 0.0033170413225889206, 0.14073121547698975, 0.5791673064231873, 0.2202242612838745, 0.9968974590301514, 1.0, 0.9739721417427063, 0.9806737899780273, 0.7695471048355103, 0.0006811409257352352, 0.996001660823822, 0.9979707598686218, 0.9987491369247437, 0.9905125498771667, 0.9988096952438354, 0.00033601128961890936, 0.9999921321868896, 0.9999990463256836, 0.9999797344207764, 1.0, 1.0, 1.0, 0.12165839970111847, 0.6106840968132019, 0.001074924599379301, 1.0, 1.0, 0.32501405477523804, 1.0, 0.9999957084655762, 1.0, 0.9998810291290283, 0.9786832332611084, 1.0, 0.9997255206108093, 0.9985548853874207, 0.9998993873596191, 0.9606248140335083, 0.9999998807907104, 0.9986633062362671, 0.9793347120285034, 0.7565671801567078, 0.008260617963969707, 0.9999998807907104, 0.9999579191207886, 1.0, 0.9998979568481445, 0.9999997615814209, 0.833492636680603, 0.05980520695447922, 0.015350098721683025, 0.6243038177490234, 1.0, 1.0, 0.9999804496765137, 0.9999998807907104, 0.9999171495437622, 1.0, 0.9996699094772339, 1.0, 1.0, 0.9999884366989136, 0.9999971389770508, 0.9852525591850281, 0.9899809956550598, 0.9988253712654114, 0.993261992931366, 1.0, 1.0, 0.46587347984313965, 1.0, 1.0, 1.0, 0.0036667627282440662, 1.0, 0.9999979734420776, 0.9997081160545349, 0.9999983310699463, 0.9999740123748779, 1.0, 1.0, 1.0, 1.0, 0.9999992847442627, 0.9999990463256836, 0.0005246068467386067, 7.97366617177886e-09, 5.374192824092461e-06, 0.9999998807907104, 0.09196827560663223, 0.9999969005584717, 0.9998947381973267, 0.47912177443504333, 0.8789961934089661, 8.127476576191839e-06, 0.9999957084655762, 0.9989702701568604, 0.47202929854393005, 0.9992349147796631, 1.1004954103555065e-07, 0.9498332142829895, 0.9999696016311646, 0.9951153993606567, 0.9997947812080383, 0.9999713897705078, 0.9999998807907104, 1.0, 1.0, 1.0, 0.28129124641418457, 0.11767486482858658, 0.23468127846717834, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9998626708984375, 0.9995213747024536, 0.9997273087501526, 0.8469322919845581, 0.7674239277839661, 0.7058064937591553, 0.9940052628517151, 1.0, 1.0, 1.0, 0.9858877062797546, 0.9913544058799744, 0.3242725729942322 ], "eval_math_runtime": 201.0851, "eval_math_samples_per_second": 3.73, "eval_math_score": -0.1613004356622696, "eval_math_steps_per_second": 0.119, "step": 250 }, { "epoch": 4.4, "learning_rate": 0.0002, "loss": 0.0004, "step": 251 }, { "epoch": 4.42, "learning_rate": 0.0002, "loss": 0.0001, "step": 252 }, { "epoch": 4.44, "learning_rate": 0.0002, "loss": 0.001, "step": 253 }, { "epoch": 4.46, "learning_rate": 0.0002, "loss": 0.0, "step": 254 }, { "epoch": 4.47, "learning_rate": 0.0002, "loss": 0.0, "step": 255 }, { "epoch": 4.49, "learning_rate": 0.0002, "loss": 0.0001, "step": 256 }, { "epoch": 4.51, "learning_rate": 0.0002, "loss": 0.0001, "step": 257 }, { "epoch": 4.53, "learning_rate": 0.0002, "loss": 0.0, "step": 258 }, { "epoch": 4.54, "learning_rate": 0.0002, "loss": 0.0001, "step": 259 }, { "epoch": 4.56, "learning_rate": 0.0002, "loss": 0.0001, "step": 260 }, { "epoch": 4.58, "learning_rate": 0.0002, "loss": 0.0003, "step": 261 }, { "epoch": 4.6, "learning_rate": 0.0002, "loss": 0.0, "step": 262 }, { "epoch": 4.61, "learning_rate": 0.0002, "loss": 0.0001, "step": 263 }, { "epoch": 4.63, "learning_rate": 0.0002, "loss": 0.0, "step": 264 }, { "epoch": 4.65, "learning_rate": 0.0002, "loss": 0.0001, "step": 265 }, { "epoch": 4.67, "learning_rate": 0.0002, "loss": 0.0002, "step": 266 }, { "epoch": 4.68, "learning_rate": 0.0002, "loss": 0.0001, "step": 267 }, { "epoch": 4.7, "learning_rate": 0.0002, "loss": 0.0001, "step": 268 }, { "epoch": 4.72, "learning_rate": 0.0002, "loss": 0.0, "step": 269 }, { "epoch": 4.74, "learning_rate": 0.0002, "loss": 0.0001, "step": 270 }, { "epoch": 4.75, "learning_rate": 0.0002, "loss": 0.0004, "step": 271 }, { "epoch": 4.77, "learning_rate": 0.0002, "loss": 0.0, "step": 272 }, { "epoch": 4.79, "learning_rate": 0.0002, "loss": 0.0, "step": 273 }, { "epoch": 4.81, "learning_rate": 0.0002, "loss": 0.0043, "step": 274 }, { "epoch": 4.82, "learning_rate": 0.0002, "loss": 0.0015, "step": 275 }, { "epoch": 4.82, "eval_math_accuracy": 0.8106666666666666, "eval_math_average_probability": 0.8108142614364624, "eval_math_brier_score": 0.16225366294384003, "eval_math_loss": 1.4052680730819702, "eval_math_probabilities": [ 0.9936263561248779, 0.9981673955917358, 0.9919402003288269, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9998981952667236, 0.8883320093154907, 0.9991890788078308, 0.6083513498306274, 5.109177436679602e-05, 0.9998093247413635, 0.7663571238517761, 0.8539000153541565, 0.9905903339385986, 1.0, 0.41795018315315247, 0.6443413496017456, 0.7741377949714661, 0.10188275575637817, 0.0453404001891613, 0.060431014746427536, 1.0, 1.0, 0.9950094223022461, 0.5933858752250671, 0.0005595828988589346, 0.05632929876446724, 0.0229653213173151, 6.46454782327055e-06, 0.301479309797287, 1.0, 0.9998456239700317, 1.0, 1.0, 1.0, 0.01746947318315506, 0.0011782085057348013, 7.55835571908392e-05, 1.0, 1.0, 1.0, 0.3839975595474243, 0.010017422959208488, 9.917401257553138e-06, 1.0, 1.0, 0.9999984502792358, 0.9999971389770508, 0.9998356103897095, 0.9999988079071045, 0.9999997615814209, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9857336282730103, 0.9999940395355225, 0.9998986721038818, 0.9998331069946289, 1.0, 1.1395246524159575e-08, 0.414775013923645, 0.9950579404830933, 0.9999996423721313, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999942421913147, 0.9982965588569641, 0.9930978417396545, 0.9996166229248047, 0.9999986886978149, 0.9999653100967407, 0.9999885559082031, 1.0, 1.0, 1.948449835253996e-06, 0.00018388887110631913, 0.3106932044029236, 1.0, 1.0, 1.0, 0.00017555398517288268, 0.9936675429344177, 0.00029287789948284626, 1.0, 1.0, 1.0, 0.9993730187416077, 0.9999964237213135, 0.9896091222763062, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999345541000366, 0.07211864739656448, 0.4645310342311859, 0.9296751022338867, 0.16656631231307983, 0.020405108109116554, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0675061047077179, 0.39778512716293335, 0.9999998807907104, 1.0, 0.9999997615814209, 0.9999822378158569, 0.9999998807907104, 0.999995231628418, 0.9999984502792358, 0.11397288739681244, 0.9840831160545349, 0.9999821186065674, 1.0, 1.0, 1.0, 0.540530264377594, 1.0, 1.0, 0.9999574422836304, 1.0, 0.9999997615814209, 1.0, 1.0, 1.0, 1.956232517841272e-05, 0.9745551347732544, 0.9996660947799683, 1.0, 1.0, 1.0, 0.01191641390323639, 0.061539050191640854, 0.010902847163379192, 0.9995018243789673, 0.9989916682243347, 0.9988446235656738, 1.0, 0.007876602932810783, 0.9999446868896484, 1.0, 0.9999991655349731, 1.0, 0.9986683130264282, 5.674960149157013e-14, 0.9625539779663086, 0.9683951735496521, 0.9778417348861694, 0.8923529982566833, 1.0, 0.9999998807907104, 0.9999998807907104, 0.9526988863945007, 0.9988479614257812, 0.9999982118606567, 0.9452857971191406, 0.8393964171409607, 0.0779203549027443, 0.9999852180480957, 0.9999746084213257, 0.9999992847442627, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9998984336853027, 1.0, 0.9999949932098389, 1.0, 1.0, 1.0, 1.0, 0.9972996115684509, 1.0, 0.9991987347602844, 1.0, 0.3144204318523407, 0.18421493470668793, 0.6977302432060242, 1.0, 0.7301677465438843, 0.4337575137615204, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999981164932251, 7.002168331382563e-06, 0.9999996423721313, 0.3945668041706085, 0.9998878240585327, 0.03268681466579437, 0.9944654107093811, 0.9999551773071289, 0.0003254342882428318, 1.0, 1.0, 1.0, 1.0, 0.9997095465660095, 0.0023508272133767605, 1.0, 0.993719220161438, 0.9999995231628418, 1.0, 1.0, 1.0, 0.9780398607254028, 0.9997267127037048, 0.9994465708732605, 0.9984889030456543, 0.9600583910942078, 0.25945809483528137, 1.0, 1.0, 1.0, 0.9999892711639404, 0.9999978542327881, 0.8500493168830872, 0.9999998807907104, 0.9999996423721313, 0.9999891519546509, 1.0, 1.0, 1.0, 0.002896921243518591, 0.9995997548103333, 0.9999997615814209, 0.9999991655349731, 0.999997615814209, 0.9999992847442627, 0.039557017385959625, 0.9999997615814209, 0.9999456405639648, 0.9985879063606262, 0.9999756813049316, 0.9999183416366577, 0.9999940395355225, 0.9999986886978149, 1.0, 0.9999837875366211, 0.9932675361633301, 0.9999982118606567, 0.999998927116394, 1.788809456115814e-08, 0.9936966300010681, 0.8165881037712097, 0.9617595076560974, 0.7989182472229004, 0.9999542236328125, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999873638153076, 0.9999830722808838, 0.9999997615814209, 0.999803364276886, 0.9982853531837463, 0.9679627418518066, 1.0, 1.0, 0.9999998807907104, 0.9979560375213623, 0.7761082649230957, 0.012743604369461536, 1.0, 0.9999998807907104, 1.0, 0.9915776252746582, 0.5633413791656494, 0.38425305485725403, 0.8913801908493042, 0.14700686931610107, 0.02131519466638565, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.1013178628482067e-16, 3.3238195419474977e-15, 1.3269779934978795e-14, 1.0, 1.0, 0.9999998807907104, 0.013528049923479557, 0.9999998807907104, 0.032255321741104126, 0.22908753156661987, 1.0, 0.23955458402633667, 1.0, 0.9999995231628418, 1.0, 0.9999902248382568, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999974966049194, 0.9999547004699707, 0.9996452331542969, 0.011714885011315346, 0.0021353643387556076, 0.03900861740112305, 0.9147940874099731, 0.4455832242965698, 0.9922879934310913, 0.9999570846557617, 7.22440427125548e-06, 0.9999752044677734, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999980926513672, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 0.6427749991416931, 9.282296531409884e-08, 0.00426087761297822, 0.7236366868019104, 3.437618900647976e-08, 8.943726022368065e-15, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.15926440060138702, 0.9974989295005798, 0.149034321308136, 0.995281994342804, 0.162214457988739, 4.1823514607131074e-07, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.4586499035358429, 0.9770492911338806, 0.07569213956594467, 0.9578129053115845, 0.5148200392723083, 0.45488879084587097, 0.8328272700309753, 0.9999997615814209, 0.9999986886978149, 1.0, 0.9999998807907104, 1.0, 1.0, 0.2071569263935089, 0.21005047857761383, 0.14512944221496582, 0.9999997615814209, 0.9991530179977417, 0.999977707862854, 2.140918695658911e-05, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9985465407371521, 1.0, 1.0, 0.9999860525131226, 1.0, 1.0, 0.9857158064842224, 1.0, 1.0, 1.0, 0.9999998807907104, 0.6536422371864319, 0.998571515083313, 0.6849501729011536, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999567270278931, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999865293502808, 0.9371366500854492, 0.9999910593032837, 1.0, 1.0, 1.0, 0.9999988079071045, 1.0, 1.0, 0.20273743569850922, 0.7196005582809448, 0.9695685505867004, 2.8980937094580383e-10, 0.01995912566781044, 2.1415738106489446e-12, 1.0, 1.0, 1.0, 1.0, 0.6309905648231506, 0.9999520778656006, 0.18432411551475525, 0.7670667767524719, 0.9963690042495728, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9714695811271667, 0.5369090437889099, 0.9998069405555725, 0.9385316371917725, 0.9948337078094482, 0.06358972191810608, 1.0, 1.0, 0.002895098179578781, 1.0, 1.0, 1.0, 0.9814580082893372, 1.0, 1.0, 1.3894350558985025e-08, 5.528617066374863e-07, 0.9662343263626099, 1.0, 1.0, 1.0, 0.22204738855361938, 0.5652912855148315, 0.9234350919723511, 7.587748314108467e-06, 4.3728092445615506e-17, 0.41158565878868103, 1.0, 1.0, 1.0, 4.666353081717034e-09, 0.8818444609642029, 0.999951958656311, 0.2107389122247696, 0.9879719614982605, 1.1053115887837972e-13, 1.0, 1.0, 1.0, 1.0, 0.19389784336090088, 1.0, 1.0, 0.9999995231628418, 1.0, 0.9897744655609131, 2.4203179460613455e-09, 0.9955257773399353, 0.6872877478599548, 0.9999915361404419, 0.9999841451644897, 0.887287974357605, 1.0, 0.9995532631874084, 0.9996765851974487, 0.9999959468841553, 0.7316544055938721, 1.0, 1.0, 1.0, 0.971120297908783, 0.0017193435924127698, 0.0037167684640735388, 0.9999840259552002, 0.0002529937482904643, 0.17478230595588684, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0028506291564553976, 0.0019121953519061208, 0.01212325319647789, 1.4031097634870093e-06, 2.912632091067735e-08, 3.487991007133928e-09, 0.9145451784133911, 0.11456476151943207, 0.0001520001096650958, 1.0, 0.9999998807907104, 1.0, 0.10770975798368454, 1.0, 0.9999995231628418, 0.9999982118606567, 0.9990506768226624, 0.9999693632125854, 0.9999302625656128, 0.9988833069801331, 0.9996687173843384, 0.9999876022338867, 0.9999998807907104, 1.0, 0.999997615814209, 0.9999961853027344, 0.9999997615814209, 1.0, 1.0, 1.0, 0.9612770080566406, 1.0, 1.0, 0.9999998807907104, 1.0, 0.9999998807907104, 1.0, 1.0, 0.9990684390068054, 1.0, 1.0, 1.0, 0.9992473125457764, 0.09577919542789459, 1.7597393542345685e-09, 1.0, 1.0, 1.0, 0.35620737075805664, 0.9633349180221558, 0.18560156226158142, 0.9999922513961792, 0.9999973773956299, 0.9999977350234985, 1.0, 0.9987494945526123, 1.0, 0.9999978542327881, 0.9999240636825562, 0.7110603451728821, 0.9999982118606567, 1.0, 0.9999997615814209, 0.9603965878486633, 0.03618870675563812, 0.11756718903779984, 1.0, 1.0, 1.0, 0.03724487125873566, 0.5215311050415039, 0.011557026766240597, 0.0683039054274559, 0.628030002117157, 0.20027771592140198, 0.9915581941604614, 1.0, 0.947625994682312, 0.9854022264480591, 0.8108946084976196, 8.974855154519901e-05, 0.9946466088294983, 0.9954397082328796, 0.9992893934249878, 0.9951352477073669, 0.9943332672119141, 0.00012630029232241213, 0.9999980926513672, 1.0, 0.9999985694885254, 1.0, 1.0, 1.0, 0.26604264974594116, 0.7312895655632019, 0.0005410716403275728, 1.0, 1.0, 0.6740425229072571, 1.0, 0.9999998807907104, 1.0, 0.9973351359367371, 0.9605960845947266, 0.9999996423721313, 0.9999607801437378, 0.999829888343811, 0.9999896287918091, 0.9299302697181702, 0.9999995231628418, 0.9981154203414917, 0.8821696043014526, 0.5874342322349548, 0.007038792595267296, 1.0, 0.9999691247940063, 1.0, 0.9999303817749023, 1.0, 0.9694157242774963, 0.06519167870283127, 0.01994115486741066, 0.7251455187797546, 1.0, 1.0, 0.9999953508377075, 1.0, 0.9999890327453613, 1.0, 0.9894272685050964, 1.0, 0.9999991655349731, 0.9998937845230103, 0.9999659061431885, 0.9595885276794434, 0.9986648559570312, 0.9999104738235474, 0.9992471933364868, 1.0, 1.0, 0.45780420303344727, 1.0, 1.0, 1.0, 0.0007804742781445384, 1.0, 0.9999997615814209, 0.9999927282333374, 1.0, 0.9999986886978149, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9999998807907104, 0.00010441784252179787, 2.236520524334651e-09, 1.1583446024587829e-07, 1.0, 0.33567678928375244, 0.9999998807907104, 0.9999610185623169, 0.22342462837696075, 0.8763703107833862, 2.4427752578048967e-05, 0.9999997615814209, 0.9994716048240662, 0.3637305200099945, 0.9986251592636108, 2.5755400656635175e-07, 0.9788755178451538, 0.9999257326126099, 0.9798598885536194, 0.9999924898147583, 0.9999992847442627, 1.0, 1.0, 1.0, 1.0, 0.1447569876909256, 0.14068090915679932, 0.0696801170706749, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9972243309020996, 0.9998975992202759, 0.9999325275421143, 0.9507718682289124, 0.903347909450531, 0.5526163578033447, 0.9830610156059265, 1.0, 1.0, 1.0, 0.9862635135650635, 0.9926725029945374, 0.2595725953578949 ], "eval_math_runtime": 200.904, "eval_math_samples_per_second": 3.733, "eval_math_score": -0.16225366294384003, "eval_math_steps_per_second": 0.119, "step": 275 }, { "epoch": 4.84, "learning_rate": 0.0002, "loss": 0.0088, "step": 276 }, { "epoch": 4.86, "learning_rate": 0.0002, "loss": 0.0002, "step": 277 }, { "epoch": 4.88, "learning_rate": 0.0002, "loss": 0.0095, "step": 278 }, { "epoch": 4.89, "learning_rate": 0.0002, "loss": 0.0002, "step": 279 }, { "epoch": 4.91, "learning_rate": 0.0002, "loss": 0.0001, "step": 280 }, { "epoch": 4.93, "learning_rate": 0.0002, "loss": 0.0003, "step": 281 }, { "epoch": 4.95, "learning_rate": 0.0002, "loss": 0.0002, "step": 282 }, { "epoch": 4.96, "learning_rate": 0.0002, "loss": 0.0001, "step": 283 }, { "epoch": 4.98, "learning_rate": 0.0002, "loss": 0.0001, "step": 284 }, { "epoch": 5.0, "learning_rate": 0.0002, "loss": 0.0003, "step": 285 }, { "epoch": 5.02, "learning_rate": 0.0002, "loss": 0.0001, "step": 286 }, { "epoch": 5.04, "learning_rate": 0.0002, "loss": 0.0, "step": 287 }, { "epoch": 5.05, "learning_rate": 0.0002, "loss": 0.0002, "step": 288 }, { "epoch": 5.07, "learning_rate": 0.0002, "loss": 0.0022, "step": 289 }, { "epoch": 5.09, "learning_rate": 0.0002, "loss": 0.0, "step": 290 }, { "epoch": 5.11, "learning_rate": 0.0002, "loss": 0.0001, "step": 291 }, { "epoch": 5.12, "learning_rate": 0.0002, "loss": 0.0, "step": 292 }, { "epoch": 5.14, "learning_rate": 0.0002, "loss": 0.0, "step": 293 }, { "epoch": 5.16, "learning_rate": 0.0002, "loss": 0.0001, "step": 294 }, { "epoch": 5.18, "learning_rate": 0.0002, "loss": 0.0, "step": 295 }, { "epoch": 5.19, "learning_rate": 0.0002, "loss": 0.0001, "step": 296 }, { "epoch": 5.21, "learning_rate": 0.0002, "loss": 0.0001, "step": 297 }, { "epoch": 5.23, "learning_rate": 0.0002, "loss": 0.0002, "step": 298 }, { "epoch": 5.25, "learning_rate": 0.0002, "loss": 0.0001, "step": 299 }, { "epoch": 5.26, "learning_rate": 0.0002, "loss": 0.0002, "step": 300 }, { "epoch": 5.26, "eval_math_accuracy": 0.8186666666666667, "eval_math_average_probability": 0.8161761164665222, "eval_math_brier_score": 0.1567799150943756, "eval_math_loss": 1.2768502235412598, "eval_math_probabilities": [ 0.9877586960792542, 0.9925284385681152, 0.929697573184967, 0.9999945163726807, 1.0, 0.9999995231628418, 1.0, 1.0, 1.0, 0.9996824264526367, 0.9241553544998169, 0.9990249872207642, 0.7100338339805603, 0.0011562026338651776, 0.9998502731323242, 0.7224334478378296, 0.9749334454536438, 0.9959152340888977, 1.0, 0.18840447068214417, 0.2870553135871887, 0.5828121900558472, 0.18493974208831787, 0.0752544179558754, 0.011886000633239746, 0.9999996423721313, 0.9999994039535522, 0.998974084854126, 0.9891642928123474, 0.9860323667526245, 0.14151889085769653, 0.10889016091823578, 0.00010228317842120305, 0.7378221154212952, 1.0, 0.9998981952667236, 1.0, 1.0, 1.0, 0.07432517409324646, 0.15615923702716827, 0.003068906255066395, 1.0, 1.0, 1.0, 0.10192613303661346, 0.11525429040193558, 2.750095973169664e-07, 1.0, 1.0, 0.9999970197677612, 0.999997615814209, 0.9985389709472656, 0.9999974966049194, 0.999937891960144, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9897247552871704, 0.9999994039535522, 0.9999709129333496, 0.9995377063751221, 1.0, 0.06446918845176697, 1.4131438774711569e-06, 0.9993452429771423, 0.9999938011169434, 0.9999997615814209, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999992847442627, 0.9999997615814209, 0.9997304081916809, 0.9999997615814209, 0.9999994039535522, 0.9996370077133179, 1.0, 1.0, 0.0002389924629824236, 0.009059568867087364, 0.7207091450691223, 1.0, 1.0, 1.0, 2.1253972590784542e-05, 0.9988653659820557, 3.995129372924566e-05, 1.0, 1.0, 1.0, 0.9562018513679504, 0.99981290102005, 0.9832030534744263, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9854971766471863, 0.25157254934310913, 0.7549772262573242, 0.937997043132782, 0.18398594856262207, 0.010978744365274906, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 0.9999998807907104, 0.02487720362842083, 0.07799428701400757, 0.9999561309814453, 1.0, 0.9999998807907104, 0.9999988079071045, 0.9999880790710449, 0.9996495246887207, 0.9997939467430115, 0.22911451756954193, 0.9874833822250366, 0.999897837638855, 1.0, 1.0, 1.0, 0.9331264495849609, 1.0, 1.0, 0.9999420642852783, 0.9999998807907104, 0.999992847442627, 1.0, 1.0, 1.0, 0.001985696144402027, 0.7548614144325256, 0.9998376369476318, 0.9999927282333374, 1.0, 1.0, 0.06471580266952515, 0.30182167887687683, 0.6198533177375793, 0.9993723034858704, 0.9971588850021362, 0.9981772899627686, 0.9999998807907104, 0.017715783789753914, 0.9996618032455444, 1.0, 0.9999988079071045, 1.0, 0.9948770403862, 2.0915287279876793e-09, 0.9267825484275818, 0.9999849796295166, 0.9999129772186279, 0.999971866607666, 1.0, 1.0, 1.0, 0.981415867805481, 0.9999591112136841, 0.9999995231628418, 0.8152642846107483, 0.5677120685577393, 0.2730613648891449, 0.9999992847442627, 0.9999971389770508, 0.9999985694885254, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999951124191284, 1.0, 0.9994568228721619, 0.9999996423721313, 1.0, 1.0, 1.0, 0.9999555349349976, 1.0, 0.9999632835388184, 1.0, 0.04826132953166962, 0.2740296721458435, 0.721886157989502, 1.0, 0.853259801864624, 0.05119231343269348, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 0.9998987913131714, 0.002044376917183399, 0.9999988079071045, 0.44410327076911926, 0.9997723698616028, 0.06331109255552292, 0.9994914531707764, 0.9999779462814331, 0.002763479482382536, 1.0, 1.0, 1.0, 1.0, 0.9999799728393555, 0.2076149880886078, 1.0, 0.9998911619186401, 0.999998927116394, 1.0, 1.0, 1.0, 0.9783481955528259, 0.9987006187438965, 0.9988252520561218, 0.9991220831871033, 0.9976176619529724, 0.05809808149933815, 1.0, 1.0, 1.0, 0.9999992847442627, 0.999998927116394, 0.8754785656929016, 0.9999995231628418, 0.9999982118606567, 0.9999042749404907, 1.0, 1.0, 1.0, 0.006527874618768692, 0.9736537337303162, 0.9999780654907227, 0.9999762773513794, 0.9999401569366455, 0.9999934434890747, 0.45552048087120056, 0.9999723434448242, 0.9987892508506775, 0.9997085928916931, 0.9999923706054688, 0.9999948740005493, 0.9999995231628418, 0.9999996423721313, 1.0, 0.9999988079071045, 0.9986571073532104, 0.9999998807907104, 0.01214002724736929, 3.8343496271409094e-05, 0.9913581609725952, 0.9298328757286072, 0.9969677329063416, 0.9617770910263062, 0.9999920129776001, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9973781108856201, 0.9967141151428223, 0.9999432563781738, 0.9976546764373779, 0.9946079254150391, 0.7608224749565125, 1.0, 1.0, 1.0, 0.9811656475067139, 0.7915966510772705, 0.0825800821185112, 1.0, 0.9999994039535522, 0.9999997615814209, 0.9542137980461121, 0.06237487122416496, 0.09186627715826035, 0.7910452485084534, 0.35967203974723816, 0.03883012384176254, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.475174947360057e-18, 1.0733140933441424e-15, 1.1470262885460007e-15, 1.0, 0.9999997615814209, 0.9999806880950928, 0.009697443805634975, 0.9999984502792358, 0.0061595244333148, 0.3320156931877136, 0.9999998807907104, 0.23311050236225128, 1.0, 0.9999979734420776, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999966621398926, 0.9999420642852783, 0.9999396800994873, 0.03455766290426254, 0.018067166209220886, 0.7331455945968628, 0.9917362332344055, 0.20238344371318817, 0.9996705055236816, 0.9595771431922913, 8.6017017508766e-08, 0.9906576871871948, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 0.9998624324798584, 1.0, 1.0, 0.6615864634513855, 3.57571821041347e-07, 0.0017105141887441278, 0.6270858645439148, 4.808204678852235e-08, 1.5632363618492537e-15, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.6655816435813904, 0.9993425011634827, 0.7576255798339844, 0.9899194240570068, 0.11866028606891632, 9.746260730025824e-06, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9776846766471863, 0.9806151986122131, 0.002238599583506584, 0.8036607503890991, 0.5674469470977783, 0.8205904960632324, 0.7365446090698242, 0.9999994039535522, 1.0, 1.0, 0.9999978542327881, 1.0, 1.0, 0.25400614738464355, 0.3193072974681854, 0.20975883305072784, 0.9999994039535522, 0.9999927282333374, 0.9999797344207764, 4.0412919588561635e-07, 1.0, 0.9999991655349731, 1.0, 1.0, 1.0, 1.0, 0.05369454249739647, 0.9999998807907104, 1.0, 0.9999315738677979, 1.0, 1.0, 0.8916724324226379, 1.0, 1.0, 1.0, 1.0, 0.9822354316711426, 0.999969482421875, 0.9952125549316406, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9994634985923767, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999990463256836, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999629259109497, 0.9655250310897827, 0.9999146461486816, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.3267459571361542, 0.6236868500709534, 0.993952214717865, 6.760144888318109e-09, 0.006184133235365152, 8.83583397420784e-12, 1.0, 1.0, 1.0, 1.0, 0.5290638208389282, 0.999982476234436, 0.2387019693851471, 0.6719508767127991, 0.9981787204742432, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9652037620544434, 0.9661141633987427, 0.9999243021011353, 0.961000919342041, 0.9982160925865173, 0.007639353163540363, 1.0, 1.0, 0.10847258567810059, 1.0, 1.0, 1.0, 0.999135434627533, 0.9999998807907104, 1.0, 8.935504780538395e-08, 5.825122784131054e-08, 0.9707785248756409, 1.0, 1.0, 1.0, 0.5769251585006714, 0.7767069935798645, 0.9568352103233337, 7.286630534508731e-06, 1.1114932352328591e-13, 0.6834945678710938, 1.0, 1.0, 1.0, 2.0653693866279355e-08, 0.8760920763015747, 0.9999383687973022, 0.1618209183216095, 0.9646095037460327, 2.8324051190266797e-15, 1.0, 1.0, 1.0, 1.0, 4.793224434251897e-06, 1.0, 1.0, 1.0, 1.0, 0.814918577671051, 2.186871128628809e-09, 0.9094677567481995, 0.844931960105896, 0.999969482421875, 0.999946117401123, 0.8870434165000916, 1.0, 0.9994781613349915, 0.9997089505195618, 0.9999972581863403, 0.7378177046775818, 1.0, 1.0, 1.0, 0.9960601925849915, 0.00010187191219301894, 0.005649200174957514, 0.9998476505279541, 0.00018434283265378326, 0.008805871941149235, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.09655693918466568, 2.923619467765093e-05, 0.05787983909249306, 1.0961464624870132e-07, 9.875413525151089e-06, 3.602735034746729e-07, 0.8773807883262634, 0.3197910785675049, 0.0004901019274257123, 1.0, 0.9999998807907104, 1.0, 0.10598523169755936, 1.0, 0.9999995231628418, 0.9999865293502808, 0.9999806880950928, 0.9999945163726807, 0.9999805688858032, 0.9999878406524658, 0.9999792575836182, 0.9997398257255554, 0.9999866485595703, 0.999991774559021, 0.9999539852142334, 0.9999682903289795, 0.9999957084655762, 1.0, 1.0, 1.0, 0.9537066221237183, 1.0, 0.9999997615814209, 0.9999996423721313, 1.0, 1.0, 1.0, 1.0, 0.9999716281890869, 1.0, 1.0, 1.0, 0.998964786529541, 0.15002521872520447, 4.3515499537072344e-10, 0.9999994039535522, 1.0, 0.9999996423721313, 0.3975577652454376, 0.9077551364898682, 0.18864169716835022, 0.9999892711639404, 0.9999982118606567, 0.9999995231628418, 1.0, 0.9983457326889038, 1.0, 0.9999996423721313, 0.9999057054519653, 0.7239072322845459, 0.9999778270721436, 0.9999992847442627, 0.9999986886978149, 0.890518844127655, 0.013416680507361889, 0.05747589096426964, 1.0, 1.0, 1.0, 0.025316495448350906, 0.18119920790195465, 0.012487836182117462, 0.08863041549921036, 0.4432298541069031, 0.2753593325614929, 0.976235032081604, 0.999998927116394, 0.9945849776268005, 0.9876952171325684, 0.8897667527198792, 0.004150957800447941, 0.9987803101539612, 0.9989814162254333, 0.9994215965270996, 0.997739315032959, 0.9990656971931458, 2.7372734621167183e-05, 0.9999825954437256, 0.9999994039535522, 0.9999972581863403, 1.0, 1.0, 1.0, 0.24140827357769012, 0.8161184191703796, 0.020366031676530838, 1.0, 1.0, 0.723243772983551, 0.9999932050704956, 0.9993358254432678, 0.9999959468841553, 0.999998927116394, 0.9805527329444885, 1.0, 0.9987381100654602, 0.9938898086547852, 0.9976999163627625, 0.9723736047744751, 1.0, 0.9992853999137878, 0.9996559619903564, 0.5199150443077087, 0.04012829810380936, 1.0, 0.9999901056289673, 1.0, 0.9999387264251709, 1.0, 0.7914350032806396, 0.07761424779891968, 0.016203517094254494, 0.20961548388004303, 1.0, 1.0, 0.9999814033508301, 1.0, 0.9999963045120239, 1.0, 0.9997143149375916, 1.0, 1.0, 0.9999467134475708, 0.9999755620956421, 0.9640953540802002, 0.9884908199310303, 0.9992508292198181, 0.9936684966087341, 1.0, 1.0, 0.9999297857284546, 1.0, 1.0, 1.0, 0.008803162723779678, 1.0, 0.9999939203262329, 0.999968409538269, 0.9999996423721313, 0.9999980926513672, 1.0, 1.0, 1.0, 1.0, 0.9999592304229736, 0.9999737739562988, 0.0023570097982883453, 3.442167508183047e-05, 1.4315588714453042e-06, 0.9999998807907104, 0.14274664223194122, 0.9999933242797852, 0.9975982308387756, 0.05932007357478142, 0.30672505497932434, 0.25425589084625244, 0.9991433620452881, 0.8155273199081421, 0.7911255955696106, 0.9951916933059692, 2.9272470669639006e-07, 0.9954161643981934, 0.9999825954437256, 0.9890534281730652, 0.9999459981918335, 0.9999736547470093, 1.0, 1.0, 1.0, 1.0, 0.42209479212760925, 0.1392708718776703, 0.35605666041374207, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999939203262329, 0.9996603727340698, 0.9999575614929199, 0.6660751104354858, 0.7415533065795898, 0.8242797255516052, 0.9316858649253845, 1.0, 1.0, 1.0, 0.9575637578964233, 0.9893016219139099, 0.14899201691150665 ], "eval_math_runtime": 201.1851, "eval_math_samples_per_second": 3.728, "eval_math_score": -0.1567799150943756, "eval_math_steps_per_second": 0.119, "step": 300 }, { "epoch": 5.28, "learning_rate": 0.0002, "loss": 0.0, "step": 301 }, { "epoch": 5.3, "learning_rate": 0.0002, "loss": 0.001, "step": 302 }, { "epoch": 5.32, "learning_rate": 0.0002, "loss": 0.0, "step": 303 }, { "epoch": 5.33, "learning_rate": 0.0002, "loss": 0.0, "step": 304 }, { "epoch": 5.35, "learning_rate": 0.0002, "loss": 0.0002, "step": 305 }, { "epoch": 5.37, "learning_rate": 0.0002, "loss": 0.0, "step": 306 }, { "epoch": 5.39, "learning_rate": 0.0002, "loss": 0.0, "step": 307 }, { "epoch": 5.4, "learning_rate": 0.0002, "loss": 0.0, "step": 308 }, { "epoch": 5.42, "learning_rate": 0.0002, "loss": 0.0, "step": 309 }, { "epoch": 5.44, "learning_rate": 0.0002, "loss": 0.0, "step": 310 }, { "epoch": 5.46, "learning_rate": 0.0002, "loss": 0.0, "step": 311 }, { "epoch": 5.47, "learning_rate": 0.0002, "loss": 0.0001, "step": 312 }, { "epoch": 5.49, "learning_rate": 0.0002, "loss": 0.0004, "step": 313 }, { "epoch": 5.51, "learning_rate": 0.0002, "loss": 0.0, "step": 314 }, { "epoch": 5.53, "learning_rate": 0.0002, "loss": 0.0, "step": 315 }, { "epoch": 5.54, "learning_rate": 0.0002, "loss": 0.0087, "step": 316 }, { "epoch": 5.56, "learning_rate": 0.0002, "loss": 0.0344, "step": 317 }, { "epoch": 5.58, "learning_rate": 0.0002, "loss": 0.0009, "step": 318 }, { "epoch": 5.6, "learning_rate": 0.0002, "loss": 0.0004, "step": 319 }, { "epoch": 5.61, "learning_rate": 0.0002, "loss": 0.0, "step": 320 }, { "epoch": 5.63, "learning_rate": 0.0002, "loss": 0.0, "step": 321 }, { "epoch": 5.65, "learning_rate": 0.0002, "loss": 0.0, "step": 322 }, { "epoch": 5.67, "learning_rate": 0.0002, "loss": 0.0, "step": 323 }, { "epoch": 5.68, "learning_rate": 0.0002, "loss": 0.0, "step": 324 }, { "epoch": 5.7, "learning_rate": 0.0002, "loss": 0.0002, "step": 325 }, { "epoch": 5.7, "eval_math_accuracy": 0.816, "eval_math_average_probability": 0.8163599371910095, "eval_math_brier_score": 0.15924298763275146, "eval_math_loss": 1.5116074085235596, "eval_math_probabilities": [ 0.9967918992042542, 0.997322142124176, 0.9827213883399963, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999526739120483, 0.8628817200660706, 0.9984012246131897, 0.7690772414207458, 0.005476095248013735, 0.9999130964279175, 0.3699347972869873, 0.8266818523406982, 0.9938656687736511, 1.0, 0.4050202965736389, 0.548800528049469, 0.8977255821228027, 0.38511568307876587, 0.42544642090797424, 0.420399010181427, 1.0, 1.0, 0.9995238780975342, 0.9816282391548157, 0.17419616878032684, 0.31027379631996155, 0.21682079136371613, 0.004179095383733511, 0.1720467060804367, 1.0, 0.9989655017852783, 1.0, 1.0, 1.0, 0.011677601374685764, 0.5032681822776794, 0.000575416546780616, 1.0, 1.0, 1.0, 0.03545253351330757, 0.003051656298339367, 2.004012316092485e-07, 1.0, 1.0, 1.0, 0.9999055862426758, 0.9933459758758545, 0.9999313354492188, 0.9999912977218628, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9928387999534607, 0.9995158910751343, 0.9999991655349731, 0.9999876022338867, 1.0, 0.0003550653636921197, 0.08022478222846985, 0.9913560152053833, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9999110698699951, 0.9999998807907104, 0.9997580647468567, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 0.9999877214431763, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 2.5069779439945705e-05, 0.9990873336791992, 1.1603357961575966e-05, 1.0, 1.0, 1.0, 0.9996651411056519, 0.9999998807907104, 0.999944806098938, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999827146530151, 0.5396710634231567, 0.9065953493118286, 0.8508569598197937, 0.018689917400479317, 0.029769863933324814, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.006819482892751694, 0.04008922725915909, 0.9999922513961792, 1.0, 1.0, 1.0, 0.9999957084655762, 0.9997294545173645, 0.9999123811721802, 0.40606433153152466, 0.9910498857498169, 0.9998757839202881, 1.0, 1.0, 1.0, 0.7859936952590942, 1.0, 1.0, 0.9999594688415527, 1.0, 0.9999982118606567, 1.0, 1.0, 1.0, 0.015322706662118435, 0.9999150037765503, 0.999992847442627, 1.0, 1.0, 1.0, 0.010006444528698921, 0.13892842829227448, 0.5784686803817749, 0.9997760653495789, 0.9993890523910522, 0.9999295473098755, 1.0, 0.47505563497543335, 0.9994331002235413, 1.0, 0.9999984502792358, 1.0, 0.9855426549911499, 6.270343673540207e-14, 0.9453749656677246, 0.9996993541717529, 0.9945585131645203, 0.9998348951339722, 1.0, 1.0, 1.0, 0.9817941188812256, 0.9999560117721558, 0.9999967813491821, 0.9433128833770752, 0.6730114221572876, 0.14030437171459198, 0.9999892711639404, 0.9999961853027344, 0.9999994039535522, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999992847442627, 1.0, 0.9999862909317017, 1.0, 1.0, 1.0, 1.0, 0.9999985694885254, 1.0, 0.999883770942688, 1.0, 0.0821303129196167, 0.36735421419143677, 0.5823050737380981, 1.0, 0.9683111310005188, 0.40149298310279846, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999654293060303, 3.002138873853255e-05, 0.9999985694885254, 0.658505916595459, 0.9999730587005615, 0.04920458793640137, 0.9999504089355469, 0.9999997615814209, 0.002541993511840701, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9993739724159241, 1.0, 0.9845120906829834, 0.9999911785125732, 1.0, 1.0, 1.0, 0.9670127034187317, 0.999483585357666, 0.9989612102508545, 0.9966631531715393, 0.998854398727417, 0.009822655469179153, 1.0, 1.0, 1.0, 0.9999986886978149, 0.9999990463256836, 0.8082265853881836, 1.0, 1.0, 0.9999897480010986, 1.0, 1.0, 1.0, 4.27886625402607e-05, 0.19216839969158173, 0.9998117089271545, 0.9997172951698303, 0.9991762042045593, 0.9997140765190125, 3.2019765967561398e-06, 0.9998927116394043, 0.9853877425193787, 0.99986732006073, 0.9999420642852783, 0.9999997615814209, 0.9999970197677612, 0.9999933242797852, 1.0, 0.9999980926513672, 0.9949316382408142, 0.9999996423721313, 1.0, 6.600717370019993e-06, 0.9999998807907104, 0.7488139867782593, 0.9444406628608704, 0.7295747399330139, 0.9999995231628418, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999643087387085, 0.9998360872268677, 0.9999978542327881, 0.9965265393257141, 0.987602174282074, 0.6890073418617249, 1.0, 1.0, 1.0, 0.9591568112373352, 0.8345623016357422, 0.023093651980161667, 1.0, 0.9999998807907104, 0.9999998807907104, 0.9931012392044067, 0.002820385852828622, 0.20378394424915314, 0.9660822153091431, 0.17791002988815308, 0.028210552409291267, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.2346773119014106e-19, 1.550530016880547e-11, 5.2244289083124575e-18, 1.0, 0.9999998807907104, 0.9999887943267822, 3.0937351880311326e-07, 0.9999783039093018, 3.678280336316675e-06, 0.3492027521133423, 1.0, 0.18989621102809906, 1.0, 0.9999972581863403, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999978542327881, 0.9999452829360962, 0.999990701675415, 0.009111160412430763, 4.838895256398246e-05, 0.15563084185123444, 0.94840008020401, 0.39230045676231384, 0.9992285966873169, 0.9989711046218872, 2.5423624094855768e-08, 0.9993270635604858, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999935626983643, 1.0, 1.0, 1.0, 0.999998927116394, 1.0, 1.0, 0.8752558827400208, 8.402539464213987e-08, 0.0032239488791674376, 0.9767484664916992, 1.4196200659455371e-08, 3.8116452133257414e-14, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.11897922307252884, 0.9943925738334656, 0.7251303195953369, 0.9950252175331116, 0.18201595544815063, 1.5975919609445555e-07, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9873571395874023, 0.9991971850395203, 0.49299073219299316, 0.9963144659996033, 0.526333749294281, 0.8009034395217896, 0.7397754192352295, 0.9999997615814209, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 0.2896145284175873, 0.2996552884578705, 0.2837032973766327, 0.999963641166687, 0.9995237588882446, 0.9998564720153809, 6.6665097619988956e-06, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.5490215420722961, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 0.9225790500640869, 1.0, 1.0, 1.0, 1.0, 0.8280363082885742, 0.9998681545257568, 0.9146966338157654, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999516010284424, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999997615814209, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999927282333374, 0.9783440828323364, 0.9999992847442627, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.17768271267414093, 0.791248619556427, 0.999440610408783, 3.97329591450557e-09, 0.13455867767333984, 2.363310068476121e-12, 1.0, 1.0, 1.0, 1.0, 0.6345317959785461, 0.999998927116394, 0.2513349652290344, 0.6890951991081238, 0.9995872378349304, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9958881735801697, 0.9998266100883484, 0.999996542930603, 0.9228377342224121, 0.9996629953384399, 0.0006600613705813885, 0.9999997615814209, 1.0, 0.00472307438030839, 1.0, 1.0, 1.0, 0.6686476469039917, 0.9999980926513672, 1.0, 1.074439870407673e-09, 0.00024883553851395845, 0.9979689717292786, 1.0, 1.0, 1.0, 0.48947155475616455, 0.6410654187202454, 0.9727888107299805, 1.0786372968141222e-06, 3.6801645438578093e-19, 0.035597264766693115, 1.0, 1.0, 1.0, 6.252291129271725e-09, 0.8212328553199768, 0.9999477863311768, 0.045573655515909195, 0.7480166554450989, 4.3801238372822345e-16, 1.0, 1.0, 1.0, 1.0, 6.429734639823437e-05, 1.0, 1.0, 1.0, 1.0, 0.33966097235679626, 1.6316656115122896e-07, 0.9912994503974915, 0.9354026913642883, 0.999967098236084, 0.9999058246612549, 0.04553777351975441, 1.0, 0.9996187686920166, 0.9997318387031555, 0.999998927116394, 0.913993239402771, 1.0, 1.0, 1.0, 0.9912393689155579, 1.9657154552987777e-05, 0.004094246309250593, 0.9999703168869019, 7.3945689109677915e-06, 0.0001537688513053581, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.00853020790964365, 2.2098970475781243e-07, 0.001807573949918151, 1.2093577250738008e-09, 8.290735564742135e-08, 1.692392572749668e-07, 0.9176836013793945, 0.6643961668014526, 0.0003922870382666588, 1.0, 0.9999983310699463, 0.9999998807907104, 0.0071135032922029495, 1.0, 0.9999998807907104, 0.9999990463256836, 0.9999943971633911, 0.9999991655349731, 0.9998483657836914, 0.9999452829360962, 0.9994007349014282, 0.9882892370223999, 0.9998513460159302, 0.9997541308403015, 0.9999817609786987, 0.9999920129776001, 0.9999994039535522, 1.0, 1.0, 1.0, 0.9818834066390991, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999182224273682, 1.0, 1.0, 1.0, 0.9999306201934814, 0.04436107352375984, 2.50114773336918e-08, 1.0, 1.0, 1.0, 0.47471821308135986, 0.9808228611946106, 0.18968066573143005, 0.9999854564666748, 0.999998927116394, 1.0, 1.0, 0.9998414516448975, 1.0, 0.9999979734420776, 0.9999938011169434, 0.4627395570278168, 1.0, 1.0, 1.0, 0.01917457766830921, 0.00016562685777898878, 0.0008777675684541464, 1.0, 1.0, 1.0, 0.0050041647627949715, 0.38472944498062134, 0.005143103655427694, 0.018521549180150032, 0.37356990575790405, 0.13656093180179596, 0.9303887486457825, 1.0, 0.9999997615814209, 0.9977959394454956, 0.9657303690910339, 0.014469603076577187, 0.999765932559967, 0.9990122318267822, 0.9991660118103027, 0.9870762228965759, 0.9993756413459778, 6.144186045276001e-06, 0.9999998807907104, 0.9999998807907104, 0.9999994039535522, 1.0, 1.0, 1.0, 0.10096580535173416, 0.7896511554718018, 0.0059195589274168015, 1.0, 1.0, 0.6093747615814209, 0.9999978542327881, 0.9998146891593933, 0.9999994039535522, 0.9995428323745728, 0.8693402409553528, 1.0, 0.9996778964996338, 0.9978775978088379, 0.9996509552001953, 0.971581220626831, 1.0, 0.9994716048240662, 0.00024229865812230855, 0.0004502419615164399, 1.0202366063083446e-08, 1.0, 0.9999377727508545, 1.0, 0.9999997615814209, 1.0, 0.99130779504776, 0.11951948702335358, 0.04179293289780617, 0.7348314523696899, 1.0, 1.0, 0.9999960660934448, 0.9999998807907104, 0.9999909400939941, 1.0, 0.9690640568733215, 1.0, 0.9999998807907104, 0.9998764991760254, 0.9999246597290039, 0.9690626859664917, 0.9951514005661011, 0.9997856020927429, 0.9968319535255432, 1.0, 1.0, 0.9974687099456787, 1.0, 1.0, 1.0, 2.5719475161167793e-05, 1.0, 0.9999997615814209, 0.99979168176651, 0.9999966621398926, 0.999964714050293, 1.0, 1.0, 1.0, 0.9999825954437256, 0.9675818085670471, 0.9701055884361267, 0.00010311726509826258, 7.247735940053845e-13, 1.250469450209124e-10, 1.0, 0.001458710408769548, 0.9999971389770508, 0.9988293051719666, 0.0217861607670784, 0.291797399520874, 0.00028184644179418683, 0.981374204158783, 0.06263919919729233, 0.9862158298492432, 0.9966481328010559, 4.808333073924587e-07, 0.9991720914840698, 1.0, 0.9997479319572449, 0.9999971389770508, 0.9999995231628418, 1.0, 1.0, 1.0, 1.0, 0.6142569780349731, 0.2606169581413269, 0.581856369972229, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999967813491821, 0.9999868869781494, 0.9448823928833008, 0.9974206686019897, 0.9901518225669861, 0.934175968170166, 1.0, 1.0, 1.0, 0.9740556478500366, 0.9963061809539795, 0.08349531143903732 ], "eval_math_runtime": 201.0753, "eval_math_samples_per_second": 3.73, "eval_math_score": -0.15924298763275146, "eval_math_steps_per_second": 0.119, "step": 325 }, { "epoch": 5.72, "learning_rate": 0.0002, "loss": 0.0, "step": 326 }, { "epoch": 5.74, "learning_rate": 0.0002, "loss": 0.0, "step": 327 }, { "epoch": 5.75, "learning_rate": 0.0002, "loss": 0.0001, "step": 328 }, { "epoch": 5.77, "learning_rate": 0.0002, "loss": 0.0003, "step": 329 }, { "epoch": 5.79, "learning_rate": 0.0002, "loss": 0.0, "step": 330 }, { "epoch": 5.81, "learning_rate": 0.0002, "loss": 0.0, "step": 331 }, { "epoch": 5.82, "learning_rate": 0.0002, "loss": 0.0, "step": 332 }, { "epoch": 5.84, "learning_rate": 0.0002, "loss": 0.0, "step": 333 }, { "epoch": 5.86, "learning_rate": 0.0002, "loss": 0.0, "step": 334 }, { "epoch": 5.88, "learning_rate": 0.0002, "loss": 0.0068, "step": 335 }, { "epoch": 5.89, "learning_rate": 0.0002, "loss": 0.0022, "step": 336 }, { "epoch": 5.91, "learning_rate": 0.0002, "loss": 0.0001, "step": 337 }, { "epoch": 5.93, "learning_rate": 0.0002, "loss": 0.0022, "step": 338 }, { "epoch": 5.95, "learning_rate": 0.0002, "loss": 0.0003, "step": 339 }, { "epoch": 5.96, "learning_rate": 0.0002, "loss": 0.0, "step": 340 }, { "epoch": 5.98, "learning_rate": 0.0002, "loss": 0.0008, "step": 341 }, { "epoch": 6.0, "learning_rate": 0.0002, "loss": 0.0399, "step": 342 }, { "epoch": 6.02, "learning_rate": 0.0002, "loss": 0.0, "step": 343 }, { "epoch": 6.04, "learning_rate": 0.0002, "loss": 0.0007, "step": 344 }, { "epoch": 6.05, "learning_rate": 0.0002, "loss": 0.0, "step": 345 }, { "epoch": 6.07, "learning_rate": 0.0002, "loss": 0.0002, "step": 346 }, { "epoch": 6.09, "learning_rate": 0.0002, "loss": 0.0001, "step": 347 }, { "epoch": 6.11, "learning_rate": 0.0002, "loss": 0.0002, "step": 348 }, { "epoch": 6.12, "learning_rate": 0.0002, "loss": 0.0407, "step": 349 }, { "epoch": 6.14, "learning_rate": 0.0002, "loss": 0.0001, "step": 350 }, { "epoch": 6.14, "eval_math_accuracy": 0.8133333333333334, "eval_math_average_probability": 0.8207166194915771, "eval_math_brier_score": 0.1538645476102829, "eval_math_loss": 1.2788736820220947, "eval_math_probabilities": [ 0.9874653220176697, 0.9697968363761902, 0.9355596899986267, 0.9999500513076782, 0.9999997615814209, 0.9999983310699463, 1.0, 1.0, 1.0, 0.998988926410675, 0.9382328987121582, 0.9992632269859314, 0.9591829180717468, 0.07792803645133972, 0.999873161315918, 0.9109772443771362, 0.7990008592605591, 0.9965587258338928, 0.9999998807907104, 0.28622740507125854, 0.7653065323829651, 0.8271327018737793, 0.46570494771003723, 0.2684669494628906, 0.04538764804601669, 0.9999997615814209, 0.999998927116394, 0.9989007711410522, 0.835698664188385, 0.0023121237754821777, 0.2201753854751587, 0.2174089103937149, 0.009031658060848713, 0.9837626218795776, 1.0, 0.9999898672103882, 1.0, 1.0, 1.0, 0.022719990462064743, 0.8537585735321045, 0.14600162208080292, 1.0, 1.0, 1.0, 0.0753956288099289, 0.013958623632788658, 4.2292294892831706e-06, 1.0, 1.0, 0.9999998807907104, 0.9999778270721436, 0.9954309463500977, 0.9999188184738159, 0.9936776757240295, 0.9999994039535522, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9966727495193481, 0.9994459748268127, 0.9915407299995422, 0.8932110071182251, 0.9999998807907104, 2.8584878464243957e-08, 0.007454311475157738, 0.9980680346488953, 0.9999936819076538, 0.9999995231628418, 1.0, 0.9999994039535522, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999921321868896, 0.9999996423721313, 0.9999773502349854, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9995755553245544, 0.999976634979248, 0.9999977350234985, 1.0, 1.0, 1.0, 8.797389341452799e-07, 0.924997091293335, 4.300428827264113e-06, 1.0, 1.0, 1.0, 0.9998301267623901, 0.9999990463256836, 0.9995415210723877, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999891519546509, 0.2710215747356415, 0.938694417476654, 0.7720885276794434, 0.05641738325357437, 0.008365345187485218, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999930739402771, 0.9999979734420776, 0.9999810457229614, 0.007881082594394684, 0.14444701373577118, 0.9985421895980835, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9999998807907104, 0.2757909595966339, 0.9893797039985657, 0.9998555183410645, 1.0, 1.0, 1.0, 0.996523916721344, 1.0, 1.0, 0.9993391633033752, 0.9999992847442627, 0.9999762773513794, 1.0, 1.0, 1.0, 0.000920500373467803, 0.5345484614372253, 0.9817014932632446, 1.0, 1.0, 1.0, 0.00034649629378691316, 0.037403278052806854, 0.16514307260513306, 0.9994741082191467, 0.9985525012016296, 0.9997329115867615, 0.9999998807907104, 0.8101465106010437, 0.9980199337005615, 1.0, 0.9999991655349731, 1.0, 0.9125588536262512, 1.3955363774298402e-11, 0.7946147322654724, 1.0, 0.9999994039535522, 1.0, 1.0, 1.0, 1.0, 0.9990010857582092, 0.9999265670776367, 0.9999994039535522, 0.9583072066307068, 0.821938157081604, 0.4715195894241333, 0.999990701675415, 0.9999719858169556, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999979734420776, 1.0, 0.9999899864196777, 1.0, 1.0, 1.0, 1.0, 0.9999997615814209, 1.0, 0.9999873638153076, 1.0, 0.20286200940608978, 0.39564600586891174, 0.8829712867736816, 1.0, 0.7829235792160034, 0.0038424746599048376, 0.9999996423721313, 1.0, 0.9999997615814209, 1.0, 1.0, 1.0, 0.9999994039535522, 0.0022788881324231625, 0.9999998807907104, 0.39627954363822937, 0.999626874923706, 0.05990465730428696, 0.9996391534805298, 0.9999914169311523, 0.004306362476199865, 1.0, 1.0, 1.0, 1.0, 0.9999946355819702, 0.14726009964942932, 1.0, 0.9970664381980896, 0.9993315935134888, 1.0, 1.0, 1.0, 0.9931715726852417, 0.9999645948410034, 0.9996660947799683, 0.9994062185287476, 0.9979037046432495, 0.0032947687432169914, 1.0, 1.0, 1.0, 0.9999607801437378, 0.9999886751174927, 0.7672923803329468, 0.9999996423721313, 0.9999979734420776, 0.9998476505279541, 1.0, 1.0, 1.0, 0.020925622433423996, 0.24488797783851624, 0.9979167580604553, 0.998330295085907, 0.9980329871177673, 0.9933977127075195, 7.774846017127857e-05, 0.998060405254364, 0.9415258169174194, 0.9999583959579468, 0.9999936819076538, 1.0, 0.9999995231628418, 1.0, 1.0, 0.9999997615814209, 0.9975612163543701, 1.0, 1.0, 1.7464209349782323e-06, 0.9999984502792358, 0.9427355527877808, 0.9995843768119812, 0.9499015212059021, 0.9999936819076538, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9998617172241211, 0.9999568462371826, 0.9999971389770508, 0.9848317503929138, 0.9498348236083984, 0.5627726316452026, 1.0, 1.0, 0.9999990463256836, 0.9223659038543701, 0.7664235830307007, 0.13197939097881317, 1.0, 1.0, 1.0, 0.9700117111206055, 0.2024139165878296, 0.9263306856155396, 0.9506583213806152, 0.39984047412872314, 0.13743475079536438, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 3.6919561266782716e-22, 2.18405224461371e-10, 2.504795435641597e-19, 0.9999889135360718, 0.9999593496322632, 0.9979922771453857, 3.5204247978981584e-05, 0.9999904632568359, 0.01156576257199049, 0.18318508565425873, 0.9999959468841553, 0.14253339171409607, 1.0, 0.9999978542327881, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999959468841553, 0.9998289346694946, 0.9999074935913086, 0.0033169786911457777, 0.0005897394148632884, 0.30069342255592346, 0.9917837381362915, 0.5164625644683838, 0.9999063014984131, 0.9986639022827148, 0.00011092022032244131, 0.9985526204109192, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999990463256836, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.8141371011734009, 8.270633770735003e-06, 0.017115028575062752, 0.9607935547828674, 8.630914817331359e-05, 2.2970165041931217e-16, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999996423721313, 0.48407259583473206, 0.9982215762138367, 0.6181492209434509, 0.9855250716209412, 0.121112160384655, 2.827066600730177e-05, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999997615814209, 0.9999998807907104, 0.03828705474734306, 0.999963641166687, 0.9308427572250366, 0.9998847246170044, 0.4460064172744751, 0.7213147878646851, 0.8431221842765808, 1.0, 1.0, 1.0, 0.9999992847442627, 1.0, 1.0, 0.3611292541027069, 0.2640273869037628, 0.32834309339523315, 0.9991315007209778, 0.9996795654296875, 0.9881278872489929, 4.720181436823623e-07, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 0.9982432126998901, 1.0, 1.0, 0.9999994039535522, 1.0, 1.0, 0.9828981161117554, 1.0, 1.0, 1.0, 1.0, 0.9400075078010559, 0.9987474679946899, 0.9965115189552307, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9998782873153687, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999850988388062, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999548196792603, 0.9945774078369141, 0.9999788999557495, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.02877829596400261, 0.8653485774993896, 0.9985803365707397, 1.8987939256476238e-06, 0.21626876294612885, 2.5814976822857716e-08, 1.0, 1.0, 1.0, 1.0, 0.9088648557662964, 0.9999998807907104, 0.344644159078598, 0.5996646285057068, 0.9953547716140747, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9968583583831787, 0.9997112154960632, 0.9999959468841553, 0.9651449918746948, 0.9996559619903564, 0.0003758615057449788, 1.0, 1.0, 0.04946964606642723, 1.0, 1.0, 1.0, 0.4679255187511444, 0.9999908208847046, 0.9999998807907104, 5.230487545304641e-07, 0.004413491580635309, 0.9809346795082092, 1.0, 1.0, 1.0, 0.38160017132759094, 0.4314754903316498, 0.9787337779998779, 2.0823221348109655e-05, 2.686202997165851e-15, 0.06203649565577507, 1.0, 1.0, 1.0, 2.39686226422009e-08, 0.5946574807167053, 0.9980558156967163, 0.1208154484629631, 0.8496062159538269, 7.111944720264752e-17, 1.0, 1.0, 1.0, 1.0, 3.3138010621769354e-05, 1.0, 1.0, 0.9999998807907104, 1.0, 0.2575377821922302, 1.38334462462808e-06, 0.95395827293396, 0.8448800444602966, 0.997546374797821, 0.9976513981819153, 0.23598860204219818, 1.0, 0.9999628067016602, 0.9998576641082764, 0.9999984502792358, 0.9965047836303711, 1.0, 1.0, 1.0, 0.9619806408882141, 8.919207175495103e-06, 0.13084955513477325, 0.9981191754341125, 0.0007581717218272388, 1.570074527990073e-05, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.022367175668478012, 0.00028838225989602506, 0.0033873484935611486, 3.0952811869155994e-08, 6.806322403463128e-07, 4.4720549340127036e-05, 0.8329719305038452, 0.40361320972442627, 0.0016771466471254826, 1.0, 1.0, 1.0, 0.01437581516802311, 1.0, 0.9999982118606567, 0.9999898672103882, 0.9998867511749268, 0.9999881982803345, 0.9999994039535522, 0.9999998807907104, 0.9999352693557739, 0.9994431138038635, 0.9999504089355469, 0.9999698400497437, 0.9999922513961792, 0.9999819993972778, 0.9999986886978149, 1.0, 1.0, 1.0, 0.9966232776641846, 1.0, 1.0, 0.9999997615814209, 1.0, 0.9999998807907104, 1.0, 1.0, 0.9956915974617004, 1.0, 1.0, 1.0, 0.9981017708778381, 0.007000940851867199, 1.7958740050616484e-10, 0.9999997615814209, 1.0, 1.0, 0.361677885055542, 0.9866130948066711, 0.3100588321685791, 0.9999964237213135, 0.9999998807907104, 1.0, 1.0, 0.9993226528167725, 1.0, 0.9999998807907104, 0.9999520778656006, 0.9652385115623474, 0.9999985694885254, 0.9999995231628418, 0.9999984502792358, 0.1526603251695633, 0.0042071775533258915, 0.019661352038383484, 1.0, 1.0, 1.0, 0.04273446649312973, 0.4688328802585602, 0.0164013784378767, 0.10342691093683243, 0.2796163856983185, 0.2554151117801666, 0.3205971419811249, 0.9999998807907104, 0.9999998807907104, 0.9856356382369995, 0.9330728054046631, 0.14814814925193787, 0.999901294708252, 0.9998260140419006, 0.9999620914459229, 0.9825577139854431, 0.9997480511665344, 0.0002658652374520898, 0.9999914169311523, 0.9999674558639526, 0.9997313618659973, 1.0, 1.0, 1.0, 0.1860208362340927, 0.7684915065765381, 0.011546393856406212, 1.0, 1.0, 0.07633616775274277, 1.0, 0.9999998807907104, 1.0, 0.9917313456535339, 0.6794828176498413, 1.0, 0.999757707118988, 0.9973275661468506, 0.9991989731788635, 0.9872015714645386, 0.9999997615814209, 0.9997329115867615, 0.02737763710319996, 0.10311122238636017, 0.00014836012269370258, 1.0, 0.9999449253082275, 1.0, 1.0, 1.0, 0.9991437196731567, 0.11565019190311432, 0.12604080140590668, 0.7433779835700989, 1.0, 1.0, 0.9999995231628418, 1.0, 1.0, 1.0, 0.9997424483299255, 1.0, 1.0, 0.9996664524078369, 0.999812662601471, 0.9248570799827576, 0.9961568713188171, 0.9996734857559204, 0.998099148273468, 1.0, 1.0, 0.9999960660934448, 1.0, 1.0, 1.0, 0.004563316702842712, 0.9999998807907104, 0.9999970197677612, 0.9998672008514404, 0.9999915361404419, 0.9999481439590454, 1.0, 1.0, 1.0, 0.9993877410888672, 0.9223402738571167, 0.9712051749229431, 0.002365675987675786, 1.6630327670519307e-10, 2.3206568755540502e-07, 1.0, 0.7565206289291382, 1.0, 0.9462104439735413, 0.011894762516021729, 0.30827176570892334, 0.9295287132263184, 0.9999960660934448, 0.9996552467346191, 0.9931640028953552, 0.9984480142593384, 1.1262916359555675e-06, 0.9964653253555298, 0.999993085861206, 0.9973347783088684, 0.9998528957366943, 0.9999964237213135, 1.0, 1.0, 1.0, 1.0, 0.8404258489608765, 0.38777613639831543, 0.47810930013656616, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999874830245972, 0.9999909400939941, 0.9999834299087524, 0.9646490216255188, 0.9596350193023682, 0.877169132232666, 0.7902054786682129, 1.0, 1.0, 1.0, 0.9057473540306091, 0.9484086632728577, 0.04522613063454628 ], "eval_math_runtime": 200.9795, "eval_math_samples_per_second": 3.732, "eval_math_score": -0.1538645476102829, "eval_math_steps_per_second": 0.119, "step": 350 }, { "epoch": 6.16, "learning_rate": 0.0002, "loss": 0.0, "step": 351 }, { "epoch": 6.18, "learning_rate": 0.0002, "loss": 0.0002, "step": 352 }, { "epoch": 6.19, "learning_rate": 0.0002, "loss": 0.0009, "step": 353 }, { "epoch": 6.21, "learning_rate": 0.0002, "loss": 0.0002, "step": 354 }, { "epoch": 6.23, "learning_rate": 0.0002, "loss": 0.0, "step": 355 }, { "epoch": 6.25, "learning_rate": 0.0002, "loss": 0.0039, "step": 356 }, { "epoch": 6.26, "learning_rate": 0.0002, "loss": 0.0001, "step": 357 }, { "epoch": 6.28, "learning_rate": 0.0002, "loss": 0.0, "step": 358 }, { "epoch": 6.3, "learning_rate": 0.0002, "loss": 0.0044, "step": 359 }, { "epoch": 6.32, "learning_rate": 0.0002, "loss": 0.0009, "step": 360 }, { "epoch": 6.33, "learning_rate": 0.0002, "loss": 0.0002, "step": 361 }, { "epoch": 6.35, "learning_rate": 0.0002, "loss": 0.0312, "step": 362 }, { "epoch": 6.37, "learning_rate": 0.0002, "loss": 0.013, "step": 363 }, { "epoch": 6.39, "learning_rate": 0.0002, "loss": 0.0003, "step": 364 }, { "epoch": 6.4, "learning_rate": 0.0002, "loss": 0.0002, "step": 365 }, { "epoch": 6.42, "learning_rate": 0.0002, "loss": 0.0007, "step": 366 }, { "epoch": 6.44, "learning_rate": 0.0002, "loss": 0.0, "step": 367 }, { "epoch": 6.46, "learning_rate": 0.0002, "loss": 0.0001, "step": 368 }, { "epoch": 6.47, "learning_rate": 0.0002, "loss": 0.0, "step": 369 }, { "epoch": 6.49, "learning_rate": 0.0002, "loss": 0.0, "step": 370 }, { "epoch": 6.51, "learning_rate": 0.0002, "loss": 0.0, "step": 371 }, { "epoch": 6.53, "learning_rate": 0.0002, "loss": 0.0001, "step": 372 }, { "epoch": 6.54, "learning_rate": 0.0002, "loss": 0.0005, "step": 373 }, { "epoch": 6.56, "learning_rate": 0.0002, "loss": 0.0, "step": 374 }, { "epoch": 6.58, "learning_rate": 0.0002, "loss": 0.0012, "step": 375 }, { "epoch": 6.58, "eval_math_accuracy": 0.824, "eval_math_average_probability": 0.8216871023178101, "eval_math_brier_score": 0.15792816877365112, "eval_math_loss": 1.5404590368270874, "eval_math_probabilities": [ 0.9877732396125793, 0.9241480231285095, 0.9650260806083679, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9998007416725159, 0.9149071574211121, 0.99928879737854, 0.38800889253616333, 0.0010985133703798056, 0.9993308782577515, 0.994014322757721, 0.9375015497207642, 0.9957096576690674, 0.9999998807907104, 0.06941904127597809, 0.6159905791282654, 0.2587335407733917, 0.22804684937000275, 0.1470353752374649, 0.31334570050239563, 0.9999998807907104, 0.9999992847442627, 0.950481653213501, 0.3011614978313446, 0.00018400813860353082, 0.1878913938999176, 0.11511655151844025, 0.008915352635085583, 0.9907863140106201, 1.0, 0.9999984502792358, 1.0, 1.0, 1.0, 0.004131305031478405, 0.0033770506270229816, 0.0004676016396842897, 1.0, 1.0, 1.0, 0.0018777943914756179, 7.45750658097677e-05, 0.002192085376009345, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9991636276245117, 0.9999997615814209, 0.9999455213546753, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999955415725708, 0.9968221187591553, 0.9999992847442627, 0.9999182224273682, 1.0, 3.985628154623555e-06, 0.8453868627548218, 0.989267885684967, 1.0, 1.0, 1.0, 0.9999991655349731, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.999868631362915, 0.9999871253967285, 0.9999678134918213, 0.999998927116394, 0.9999996423721313, 1.0, 1.0, 1.0, 4.754136284645938e-07, 0.0018470840295776725, 0.7510156035423279, 1.0, 1.0, 1.0, 0.0016988905845209956, 0.9972885847091675, 0.0063718282617628574, 0.9999970197677612, 1.0, 1.0, 0.9999991655349731, 1.0, 0.9999767541885376, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9998859167098999, 0.007886041887104511, 0.9578870534896851, 0.5380457043647766, 0.00035884161479771137, 5.431423346635711e-07, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0008792010485194623, 0.3732890784740448, 0.9999984502792358, 1.0, 1.0, 0.9999995231628418, 1.0, 1.0, 1.0, 0.7190867066383362, 0.9978951215744019, 0.9999575614929199, 1.0, 1.0, 1.0, 2.8348692922008922e-06, 1.0, 0.9999949932098389, 0.9999986886978149, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0008022086112760007, 0.0043654837645590305, 0.9974234104156494, 1.0, 1.0, 1.0, 5.628812687064055e-06, 0.00017008163558784872, 0.029708093032240868, 0.9999994039535522, 0.9999986886978149, 0.9999992847442627, 1.0, 0.9850441217422485, 1.0, 1.0, 0.9999948740005493, 1.0, 0.9767394065856934, 9.526038846630058e-10, 0.6295535564422607, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9737791419029236, 0.9995415210723877, 0.9996685981750488, 0.9680151343345642, 0.9070956110954285, 0.0040984791703522205, 0.9996790885925293, 0.9999419450759888, 0.9999947547912598, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999988079071045, 0.9772865176200867, 0.9999986886978149, 0.9999992847442627, 1.0, 1.0, 1.0, 1.0, 0.9999977350234985, 1.0, 0.9999943971633911, 1.0, 0.5212855339050293, 0.011772983707487583, 0.8619459271430969, 1.0, 0.9999370574951172, 0.8208949565887451, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999915361404419, 2.339049842703389e-07, 0.9999977350234985, 0.5248288512229919, 0.9998946189880371, 0.06955759972333908, 0.9572703838348389, 0.9997641444206238, 0.046442996710538864, 1.0, 1.0, 1.0, 1.0, 0.9999979734420776, 0.997359573841095, 1.0, 0.998900294303894, 0.9999020099639893, 1.0, 1.0, 1.0, 0.9999914169311523, 1.0, 1.0, 0.999943733215332, 0.999601423740387, 0.0012097049038857222, 1.0, 1.0, 1.0, 1.0, 0.9999969005584717, 0.961689829826355, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 0.16882991790771484, 0.9934955835342407, 0.9999980926513672, 0.9998853206634521, 0.9999921321868896, 0.9999642372131348, 0.18380087614059448, 0.9999961853027344, 0.9958594441413879, 0.9998364448547363, 0.9999978542327881, 0.9999991655349731, 0.9999986886978149, 1.0, 1.0, 1.0, 0.9999991655349731, 1.0, 0.9999992847442627, 9.62435375839732e-09, 0.997639536857605, 0.7150160670280457, 0.998430073261261, 0.8045229315757751, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9995312690734863, 0.9956509470939636, 0.9171652793884277, 1.0, 1.0, 0.9999967813491821, 0.9657946228981018, 0.8120583891868591, 0.048077162355184555, 1.0, 1.0, 1.0, 0.9970212578773499, 0.9165068864822388, 0.7060384750366211, 0.9656080603599548, 0.04489322751760483, 0.1875849813222885, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0490546841224032e-23, 1.104641226395261e-17, 5.1967073567542654e-23, 1.0, 1.0, 1.0, 2.3770953703206033e-06, 0.9999970197677612, 0.0027118113357573748, 0.0033802471589297056, 0.9999994039535522, 0.030846839770674706, 1.0, 1.0, 1.0, 0.9999747276306152, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999996423721313, 0.9999856948852539, 0.9995124340057373, 0.0010694446973502636, 0.0007705047610215843, 0.3346032500267029, 0.9992683529853821, 0.5359874963760376, 0.9998857975006104, 1.0, 0.015115329995751381, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.8883326649665833, 2.1731258570412137e-08, 0.014990649186074734, 0.8753084540367126, 0.0043227337300777435, 5.022229027820268e-20, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.5621696710586548, 0.9997236132621765, 0.18042996525764465, 0.9941421151161194, 0.07321517914533615, 8.482312097157774e-08, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0006102697225287557, 1.0, 0.9999988079071045, 0.9999995231628418, 0.3743577301502228, 0.2893775999546051, 0.9585502743721008, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.17571288347244263, 0.24871911108493805, 0.20304901897907257, 0.9999921321868896, 0.9978525638580322, 0.9999915361404419, 3.5249391657998785e-05, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999920129776001, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999334812164307, 1.0, 1.0, 1.0, 1.0, 0.8378989100456238, 0.8783680200576782, 0.8770092725753784, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999905824661255, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999991774559021, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999911785125732, 0.9975211024284363, 0.9999992847442627, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.13856510818004608, 0.6486384868621826, 0.9998559951782227, 2.912016808243045e-11, 0.03253040090203285, 6.643339307485507e-13, 1.0, 1.0, 1.0, 1.0, 0.7834408283233643, 1.0, 0.7925596237182617, 0.8930891752243042, 0.9974995255470276, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.99992835521698, 0.9995181560516357, 1.0, 0.9722399711608887, 0.9999942779541016, 0.032181516289711, 1.0, 1.0, 0.0014206924242898822, 1.0, 1.0, 1.0, 0.9698819518089294, 0.9999991655349731, 1.0, 3.5674846410316263e-10, 0.019396144896745682, 0.9998049139976501, 1.0, 1.0, 1.0, 0.12995079159736633, 0.6077058911323547, 0.8105568289756775, 1.865980630100239e-05, 4.7361102783172906e-18, 0.10931368172168732, 1.0, 1.0, 1.0, 9.796283576002374e-12, 0.003301493125036359, 0.9259292483329773, 0.4694834351539612, 0.9029518961906433, 3.624341071147538e-18, 1.0, 1.0, 1.0, 1.0, 0.999797523021698, 1.0, 1.0, 0.9999223947525024, 1.0, 0.9769302606582642, 1.9187687030353118e-06, 0.9952759742736816, 0.1838865578174591, 0.9993859529495239, 0.9992520213127136, 0.7565932869911194, 1.0, 0.9999920129776001, 0.9992984533309937, 0.9999926090240479, 0.9562022089958191, 1.0, 1.0, 1.0, 0.12814800441265106, 0.00012442654406186193, 0.022375088185071945, 1.0, 0.9741103649139404, 0.814415454864502, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.09007087349891663, 0.0009241750813089311, 2.2463937909833476e-07, 2.0787978005643026e-09, 4.2215103235321294e-07, 3.0797401961990545e-08, 0.9531071782112122, 0.15116871893405914, 0.0026261750608682632, 1.0, 0.9999984502792358, 1.0, 0.014852293767035007, 1.0, 1.0, 0.9999986886978149, 0.9999114274978638, 0.9999969005584717, 0.9992345571517944, 0.999987006187439, 0.9965529441833496, 0.9999825954437256, 0.9999996423721313, 0.9999995231628418, 0.9999864101409912, 0.9999836683273315, 0.9999994039535522, 1.0, 1.0, 1.0, 0.9996077418327332, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9935935139656067, 1.0, 1.0, 1.0, 0.9972941279411316, 0.0005712650599889457, 1.569513616295204e-11, 1.0, 1.0, 1.0, 0.3629363775253296, 0.995797872543335, 0.28246575593948364, 0.999998927116394, 0.9999996423721313, 1.0, 1.0, 0.9994576573371887, 1.0, 0.999950647354126, 0.99935382604599, 0.8944816589355469, 1.0, 1.0, 1.0, 0.042494114488363266, 0.0002341300278203562, 0.00258771819062531, 1.0, 1.0, 1.0, 0.00042101985309273005, 0.6451740264892578, 1.3888065950595774e-06, 0.10158953815698624, 0.4682444632053375, 0.19366049766540527, 0.9909391403198242, 1.0, 0.9999985694885254, 0.9812344908714294, 0.9745727777481079, 0.0325494147837162, 0.9917852878570557, 0.9999053478240967, 0.9993407130241394, 0.9921931624412537, 0.9950557947158813, 5.190096635487862e-05, 0.9999997615814209, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 0.05174354836344719, 0.7751174569129944, 0.0002122758305631578, 1.0, 1.0, 0.9612815380096436, 1.0, 1.0, 1.0, 0.9999977350234985, 0.9996716976165771, 1.0, 0.9999796152114868, 0.9999204874038696, 0.9999860525131226, 0.803035318851471, 0.9999996423721313, 0.998177170753479, 0.9266850352287292, 0.846955418586731, 0.017510361969470978, 0.9999959468841553, 0.9953110814094543, 1.0, 1.0, 1.0, 0.9999998807907104, 0.11392541229724884, 0.4153691232204437, 0.28247156739234924, 1.0, 1.0, 0.9998486042022705, 1.0, 1.0, 1.0, 0.9970439076423645, 1.0, 0.9999998807907104, 0.9999014139175415, 0.9998836517333984, 0.9763361811637878, 0.9999929666519165, 0.9999978542327881, 0.9999985694885254, 1.0, 1.0, 0.9993883371353149, 1.0, 1.0, 1.0, 1.364134641335113e-05, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999898672103882, 0.9961608648300171, 0.9970912933349609, 0.00034535888698883355, 3.2738777509290495e-13, 1.866181719378801e-06, 1.0, 0.9999231100082397, 1.0, 0.9984984397888184, 0.010748691856861115, 0.09710182249546051, 0.910886824131012, 1.0, 0.9999854564666748, 0.9999785423278809, 0.9999881982803345, 1.9941788309552066e-07, 0.9301260709762573, 0.999984622001648, 0.9950101375579834, 0.99994957447052, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9361687898635864, 0.5448992848396301, 0.07177828997373581, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9993798732757568, 0.9998452663421631, 0.9919106364250183, 0.6389628648757935, 0.9931942224502563, 0.30201834440231323, 0.9997193217277527, 1.0, 1.0, 1.0, 0.9999436140060425, 0.9999949932098389, 0.018147477880120277 ], "eval_math_runtime": 201.145, "eval_math_samples_per_second": 3.729, "eval_math_score": -0.15792816877365112, "eval_math_steps_per_second": 0.119, "step": 375 }, { "epoch": 6.6, "learning_rate": 0.0002, "loss": 0.0004, "step": 376 }, { "epoch": 6.61, "learning_rate": 0.0002, "loss": 0.0001, "step": 377 }, { "epoch": 6.63, "learning_rate": 0.0002, "loss": 0.0002, "step": 378 }, { "epoch": 6.65, "learning_rate": 0.0002, "loss": 0.0001, "step": 379 }, { "epoch": 6.67, "learning_rate": 0.0002, "loss": 0.0, "step": 380 }, { "epoch": 6.68, "learning_rate": 0.0002, "loss": 0.0003, "step": 381 }, { "epoch": 6.7, "learning_rate": 0.0002, "loss": 0.0053, "step": 382 }, { "epoch": 6.72, "learning_rate": 0.0002, "loss": 0.0, "step": 383 }, { "epoch": 6.74, "learning_rate": 0.0002, "loss": 0.0003, "step": 384 }, { "epoch": 6.75, "learning_rate": 0.0002, "loss": 0.0001, "step": 385 }, { "epoch": 6.77, "learning_rate": 0.0002, "loss": 0.0005, "step": 386 }, { "epoch": 6.79, "learning_rate": 0.0002, "loss": 0.0, "step": 387 }, { "epoch": 6.81, "learning_rate": 0.0002, "loss": 0.0, "step": 388 }, { "epoch": 6.82, "learning_rate": 0.0002, "loss": 0.0004, "step": 389 }, { "epoch": 6.84, "learning_rate": 0.0002, "loss": 0.0, "step": 390 }, { "epoch": 6.86, "learning_rate": 0.0002, "loss": 0.0, "step": 391 }, { "epoch": 6.88, "learning_rate": 0.0002, "loss": 0.0, "step": 392 }, { "epoch": 6.89, "learning_rate": 0.0002, "loss": 0.0, "step": 393 }, { "epoch": 6.91, "learning_rate": 0.0002, "loss": 0.0, "step": 394 }, { "epoch": 6.93, "learning_rate": 0.0002, "loss": 0.2038, "step": 395 }, { "epoch": 6.95, "learning_rate": 0.0002, "loss": 0.0001, "step": 396 }, { "epoch": 6.96, "learning_rate": 0.0002, "loss": 0.0003, "step": 397 }, { "epoch": 6.98, "learning_rate": 0.0002, "loss": 0.0005, "step": 398 }, { "epoch": 7.0, "learning_rate": 0.0002, "loss": 0.0063, "step": 399 }, { "epoch": 7.02, "learning_rate": 0.0002, "loss": 0.0043, "step": 400 }, { "epoch": 7.02, "eval_math_accuracy": 0.8093333333333333, "eval_math_average_probability": 0.8106809258460999, "eval_math_brier_score": 0.16440215706825256, "eval_math_loss": 1.7561619281768799, "eval_math_probabilities": [ 0.9429445266723633, 0.8724210858345032, 0.8490995764732361, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9899095296859741, 0.9693266153335571, 0.9994932413101196, 0.1540966033935547, 0.005755316466093063, 0.994525671005249, 0.9953575730323792, 0.9925064444541931, 0.9987565279006958, 0.9999998807907104, 0.0020007838029414415, 0.09554987400770187, 0.5030917525291443, 0.15423214435577393, 0.03718015179038048, 0.48827338218688965, 0.9999939203262329, 0.999927282333374, 0.8449088335037231, 0.33582374453544617, 0.41516557335853577, 0.14540712535381317, 0.0644523873925209, 0.08605457097291946, 0.00010748876229627058, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 0.011167841963469982, 0.0052567110396921635, 1.5548939700238407e-05, 1.0, 1.0, 1.0, 0.021364936605095863, 0.0016843716148287058, 0.026243720203638077, 1.0, 1.0, 1.0, 0.9999997615814209, 0.9998874664306641, 0.9999995231628418, 0.9999995231628418, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9998636245727539, 0.9881244897842407, 0.9908066391944885, 0.9895488023757935, 1.0, 1.7052114928417517e-12, 4.816772536386793e-10, 0.9999673366546631, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999995231628418, 0.9882610440254211, 0.9932377338409424, 0.9999988079071045, 0.9999997615814209, 0.9999998807907104, 1.0, 1.0, 1.0, 3.432960227200965e-08, 0.0001759952720021829, 0.9409040808677673, 1.0, 1.0, 1.0, 9.734980267239735e-05, 0.9988088607788086, 8.268444071291015e-05, 0.9999998807907104, 1.0, 1.0, 0.999799907207489, 0.9999997615814209, 0.9790757894515991, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 0.9902393817901611, 0.0006625067326240242, 0.9074945449829102, 0.14370644092559814, 0.00016802594473119825, 1.8757101827304723e-07, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999995231628418, 1.0, 0.999997615814209, 0.0017336549935862422, 0.32700955867767334, 0.9998745918273926, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.5616581439971924, 0.9598290920257568, 0.9993513226509094, 1.0, 1.0, 1.0, 6.520157677658567e-12, 0.9999970197677612, 0.9966642260551453, 0.9999960660934448, 1.0, 0.9999991655349731, 1.0, 1.0, 1.0, 1.9542581242149026e-07, 0.2530691623687744, 0.07126456499099731, 1.0, 1.0, 1.0, 6.321365162875736e-06, 0.0008076921803876758, 0.010065910406410694, 0.9999934434890747, 0.9999922513961792, 0.9999958276748657, 1.0, 0.9844878315925598, 1.0, 1.0, 0.9999955892562866, 1.0, 0.9686028361320496, 6.236921786320626e-14, 0.8670212030410767, 0.9999998807907104, 0.999998927116394, 0.9999995231628418, 1.0, 1.0, 1.0, 0.990247905254364, 0.9999659061431885, 0.9999996423721313, 0.8021555542945862, 0.8563480973243713, 0.0006261634407564998, 0.9999957084655762, 0.9999864101409912, 0.9999951124191284, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9997081160545349, 1.0, 0.9999957084655762, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 0.9999954700469971, 0.9999969005584717, 1.0, 0.8026497960090637, 0.05274922028183937, 0.8504056334495544, 1.0, 0.9974738955497742, 0.41513270139694214, 1.0, 1.0, 1.0, 0.9999966621398926, 1.0, 0.9999978542327881, 0.9999910593032837, 2.514564911848538e-08, 0.9999891519546509, 0.3468046188354492, 0.9997547268867493, 0.038331568241119385, 0.8830848336219788, 0.9947787523269653, 0.018700364977121353, 1.0, 1.0, 1.0, 1.0, 0.9999977350234985, 0.9868263006210327, 1.0, 0.9985817670822144, 0.9997316002845764, 1.0, 1.0, 1.0, 0.9999947547912598, 1.0, 0.9999998807907104, 0.9999885559082031, 0.9996936321258545, 0.0017212132224813104, 1.0, 1.0, 1.0, 0.9999996423721313, 0.9999996423721313, 0.9978083968162537, 1.0, 1.0, 0.9999971389770508, 1.0, 1.0, 1.0, 0.9291380643844604, 0.9983667731285095, 0.9999802112579346, 0.9992691874504089, 0.9998340606689453, 0.9997863173484802, 0.884669303894043, 0.9999997615814209, 0.9995676875114441, 0.9999938011169434, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 0.9978849291801453, 1.6802859104103618e-09, 0.9558794498443604, 0.3498164117336273, 0.9996509552001953, 0.927638828754425, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 0.9974060654640198, 0.9896605014801025, 0.9066641330718994, 1.0, 1.0, 0.9999958276748657, 0.8847867846488953, 0.519504189491272, 0.10185941308736801, 1.0, 1.0, 1.0, 0.9999748468399048, 0.9979269504547119, 0.9995018243789673, 0.8821101188659668, 0.049049943685531616, 0.43697068095207214, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.8043647502541337e-26, 2.8783989005291085e-18, 6.572881753457834e-25, 0.9999986886978149, 0.9999945163726807, 0.9999841451644897, 0.0009983201744034886, 1.0, 0.9997727274894714, 0.014282813295722008, 0.9999706745147705, 0.028251420706510544, 1.0, 1.0, 1.0, 0.9999984502792358, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 0.9999990463256836, 0.999976396560669, 0.999914288520813, 0.014132875017821789, 0.006447387393563986, 0.4385555386543274, 0.9999990463256836, 0.5394912958145142, 0.9999995231628418, 0.9999998807907104, 1.2606681593752e-05, 0.9999997615814209, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9282931089401245, 9.040562872542068e-06, 0.06675966829061508, 0.5506824254989624, 0.018575508147478104, 7.345549000902559e-23, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.7554729580879211, 0.985030472278595, 0.010319489985704422, 0.9897186756134033, 0.10936680436134338, 1.5263080399563478e-07, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999998927116394, 1.0, 3.468256792871216e-08, 1.0, 0.9999946355819702, 0.9999942779541016, 0.24336980283260345, 0.49475401639938354, 0.9165603518486023, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.17127996683120728, 0.5157628059387207, 0.3021223843097687, 1.0, 0.9648051261901855, 1.0, 2.014230631175451e-07, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999198913574219, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9988535642623901, 1.0, 1.0, 1.0, 1.0, 0.22893619537353516, 0.23127885162830353, 0.9909466505050659, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999446868896484, 0.9969052672386169, 0.9999719858169556, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.007344381941948e-07, 0.84297114610672, 0.9999321699142456, 1.632534710714617e-14, 0.027175182476639748, 9.946513929062328e-15, 1.0, 1.0, 1.0, 1.0, 0.2757425606250763, 1.0, 0.8600448369979858, 0.8530101180076599, 0.9905396699905396, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999990463256836, 0.12310183793306351, 1.0, 0.9873880743980408, 0.9999992847442627, 0.0008063202840276062, 1.0, 1.0, 0.2140050083398819, 1.0, 1.0, 1.0, 0.9998337030410767, 0.9999489784240723, 1.0, 7.035184185834624e-15, 1.2124497239529575e-10, 0.9985673427581787, 1.0, 1.0, 1.0, 0.1205366924405098, 0.060260966420173645, 0.2923891246318817, 8.375053766940255e-06, 7.169244808596129e-20, 0.2607194483280182, 1.0, 1.0, 1.0, 1.2293239343152962e-12, 0.0032404144294559956, 0.926364541053772, 0.564024806022644, 0.9646813869476318, 2.8173559698524156e-19, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 0.6393957138061523, 5.716961348767313e-10, 0.9703797698020935, 0.3078276216983795, 0.9969255328178406, 0.9963794350624084, 0.9983073472976685, 1.0, 0.9999997615814209, 0.9989375472068787, 0.9996956586837769, 0.9172918200492859, 1.0, 1.0, 1.0, 0.01267787255346775, 0.001501175807788968, 0.00248376140370965, 0.9999366998672485, 0.3615514039993286, 0.0941779613494873, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.6848422884941101, 0.054026417434215546, 1.8933859280423349e-07, 6.226411642273888e-05, 2.199511300204904e-06, 2.356008725785952e-13, 0.8441120982170105, 0.030882347375154495, 0.0025695087388157845, 1.0, 1.0, 1.0, 0.0989774540066719, 1.0, 1.0, 0.9020742774009705, 0.715294361114502, 0.295801043510437, 0.9999673366546631, 1.0, 0.9999921321868896, 0.9990228414535522, 0.9999966621398926, 0.9999836683273315, 0.9978446960449219, 0.9989917874336243, 0.9999135732650757, 1.0, 1.0, 1.0, 0.9999738931655884, 1.0, 1.0, 0.971897542476654, 1.0, 1.0, 1.0, 1.0, 0.2337254285812378, 1.0, 1.0, 1.0, 0.9852169156074524, 0.001685154507867992, 1.821150164005303e-07, 1.0, 1.0, 1.0, 0.32693204283714294, 0.9989995360374451, 0.4273659884929657, 1.0, 1.0, 1.0, 1.0, 0.9998735189437866, 1.0, 0.9999943971633911, 0.9966045618057251, 0.9908301830291748, 0.9999994039535522, 0.9999996423721313, 0.9999502897262573, 0.6384978890419006, 0.0038190558552742004, 0.4664112627506256, 1.0, 1.0, 1.0, 0.0004898545448668301, 0.6740902662277222, 7.47627709642984e-05, 0.15106521546840668, 0.5828249454498291, 0.16426728665828705, 0.9562847018241882, 1.0, 0.9991681575775146, 0.9831827878952026, 0.94121915102005, 0.25536397099494934, 0.9911600947380066, 0.9992233514785767, 0.9995433688163757, 0.9749346971511841, 0.9192919731140137, 4.154409180046059e-05, 0.9999998807907104, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 0.06691467016935349, 0.8029363751411438, 0.00022816139971837401, 1.0, 1.0, 0.747048020362854, 1.0, 1.0, 1.0, 0.9988957643508911, 0.9976676106452942, 0.9999998807907104, 0.9999996423721313, 0.9999980926513672, 0.9999995231628418, 0.270152747631073, 0.9999250173568726, 0.9888633489608765, 0.9999988079071045, 0.9998989105224609, 0.9884421229362488, 0.9999998807907104, 0.9998478889465332, 1.0, 1.0, 1.0, 0.9999527931213379, 0.2380104809999466, 0.48993152379989624, 0.17761269211769104, 1.0, 1.0, 0.9997345805168152, 1.0, 1.0, 1.0, 0.9999974966049194, 1.0, 1.0, 0.9984108209609985, 0.9972279667854309, 0.9407644271850586, 0.999921441078186, 0.9999796152114868, 0.9999707937240601, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.844810312462869e-08, 1.0, 0.9999997615814209, 0.9999996423721313, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 0.8938726782798767, 0.7016579508781433, 0.641927182674408, 0.0005656119901686907, 2.602796450590361e-12, 0.0011387430131435394, 1.0, 0.9999996423721313, 1.0, 0.9918357729911804, 0.030102424323558807, 0.6802172064781189, 0.000780188653152436, 0.918916642665863, 0.9455056190490723, 0.9991400241851807, 0.9999947547912598, 1.0810331474431223e-07, 0.8203614950180054, 0.9935170412063599, 0.7445070147514343, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.6579119563102722, 0.5036973357200623, 0.012988785281777382, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9997912049293518, 0.9997108578681946, 0.3292750120162964, 0.9638171792030334, 0.44749802350997925, 4.056671241414733e-05, 0.8420439958572388, 0.9997792840003967, 0.9997594952583313, 0.9999996423721313, 0.9999083280563354, 0.9999890327453613, 0.0010850777616724372 ], "eval_math_runtime": 201.3021, "eval_math_samples_per_second": 3.726, "eval_math_score": -0.16440215706825256, "eval_math_steps_per_second": 0.119, "step": 400 }, { "epoch": 7.04, "learning_rate": 0.0002, "loss": 0.0001, "step": 401 }, { "epoch": 7.05, "learning_rate": 0.0002, "loss": 0.0004, "step": 402 }, { "epoch": 7.07, "learning_rate": 0.0002, "loss": 0.0003, "step": 403 }, { "epoch": 7.09, "learning_rate": 0.0002, "loss": 0.0, "step": 404 }, { "epoch": 7.11, "learning_rate": 0.0002, "loss": 0.0, "step": 405 }, { "epoch": 7.12, "learning_rate": 0.0002, "loss": 0.0128, "step": 406 }, { "epoch": 7.14, "learning_rate": 0.0002, "loss": 0.0001, "step": 407 }, { "epoch": 7.16, "learning_rate": 0.0002, "loss": 0.0005, "step": 408 }, { "epoch": 7.18, "learning_rate": 0.0002, "loss": 0.0001, "step": 409 }, { "epoch": 7.19, "learning_rate": 0.0002, "loss": 0.0001, "step": 410 }, { "epoch": 7.21, "learning_rate": 0.0002, "loss": 0.0004, "step": 411 }, { "epoch": 7.23, "learning_rate": 0.0002, "loss": 0.0004, "step": 412 }, { "epoch": 7.25, "learning_rate": 0.0002, "loss": 0.0, "step": 413 }, { "epoch": 7.26, "learning_rate": 0.0002, "loss": 0.0001, "step": 414 }, { "epoch": 7.28, "learning_rate": 0.0002, "loss": 0.0002, "step": 415 }, { "epoch": 7.3, "learning_rate": 0.0002, "loss": 0.0, "step": 416 }, { "epoch": 7.32, "learning_rate": 0.0002, "loss": 0.0, "step": 417 }, { "epoch": 7.33, "learning_rate": 0.0002, "loss": 0.0014, "step": 418 }, { "epoch": 7.35, "learning_rate": 0.0002, "loss": 0.0004, "step": 419 }, { "epoch": 7.37, "learning_rate": 0.0002, "loss": 0.0168, "step": 420 }, { "epoch": 7.39, "learning_rate": 0.0002, "loss": 0.0003, "step": 421 }, { "epoch": 7.4, "learning_rate": 0.0002, "loss": 0.0001, "step": 422 }, { "epoch": 7.42, "learning_rate": 0.0002, "loss": 0.0001, "step": 423 }, { "epoch": 7.44, "learning_rate": 0.0002, "loss": 0.0001, "step": 424 }, { "epoch": 7.46, "learning_rate": 0.0002, "loss": 0.0, "step": 425 }, { "epoch": 7.46, "eval_math_accuracy": 0.812, "eval_math_average_probability": 0.8120921850204468, "eval_math_brier_score": 0.16692234575748444, "eval_math_loss": 1.671823263168335, "eval_math_probabilities": [ 0.9574011564254761, 0.9846744537353516, 0.9479662179946899, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9961726069450378, 0.8446101546287537, 0.9979799389839172, 0.2927791178226471, 0.002319630701094866, 0.9987313151359558, 0.9978190660476685, 0.9962032437324524, 0.9999152421951294, 0.9999998807907104, 0.0014741395134478807, 0.050097666680812836, 0.21892936527729034, 0.1404525488615036, 0.01888142339885235, 0.9884351491928101, 1.0, 0.9999998807907104, 0.9985700845718384, 0.9892066717147827, 0.056873615831136703, 0.00730718020349741, 0.0011694623390212655, 1.2624796319471443e-08, 0.2684471011161804, 1.0, 0.998979389667511, 1.0, 1.0, 1.0, 0.019847843796014786, 0.03956097736954689, 0.0003408365591894835, 1.0, 1.0, 1.0, 0.002191278152167797, 0.006551794707775116, 0.0013990307925269008, 1.0, 1.0, 1.0, 1.0, 0.9999657869338989, 1.0, 0.8796809911727905, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999382495880127, 0.9959166646003723, 0.9984307885169983, 0.999860405921936, 1.0, 4.554276335395901e-13, 9.5287278067957e-10, 0.9997966885566711, 0.9999994039535522, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999997615814209, 0.9999376535415649, 0.9983335137367249, 0.9993627667427063, 0.9999994039535522, 0.9999996423721313, 0.9999963045120239, 1.0, 1.0, 3.244136621560756e-07, 2.102418193317135e-06, 0.0144179817289114, 1.0, 1.0, 1.0, 0.0031949833501130342, 0.9995699524879456, 0.13783545792102814, 1.0, 1.0, 1.0, 0.9999747276306152, 1.0, 0.9995249509811401, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999926090240479, 0.010470201261341572, 0.05121993273496628, 0.1146698147058487, 0.00045805503032170236, 3.935120673759229e-07, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0002417368086753413, 0.0018852036446332932, 0.9999985694885254, 1.0, 0.9999997615814209, 0.9999946355819702, 1.0, 1.0, 0.9999998807907104, 0.22261546552181244, 0.998688280582428, 0.9999983310699463, 1.0, 1.0, 1.0, 0.11644219607114792, 1.0, 1.0, 0.99835604429245, 0.9999997615814209, 0.999995231628418, 1.0, 1.0, 1.0, 0.026607079431414604, 0.6749407649040222, 0.999619722366333, 0.9999979734420776, 1.0, 1.0, 2.2617025024374016e-05, 9.719248919282109e-05, 0.0005927791353315115, 0.9999990463256836, 0.9994829893112183, 0.9574447274208069, 1.0, 0.6468821167945862, 1.0, 1.0, 0.9999552965164185, 1.0, 0.9807908535003662, 2.0622623075373936e-13, 0.9182945489883423, 0.9996250867843628, 0.9977980852127075, 0.9940586090087891, 1.0, 1.0, 1.0, 0.9917317032814026, 0.999723494052887, 0.9997736811637878, 0.1569167524576187, 0.21578769385814667, 0.0009808368049561977, 0.999942421913147, 0.9999676942825317, 0.9999966621398926, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9984286427497864, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999995231628418, 1.0, 1.0, 0.055450569838285446, 0.004720720928162336, 0.5151379108428955, 1.0, 0.99626225233078, 0.7218323945999146, 1.0, 1.0, 0.9999997615814209, 1.0, 1.0, 1.0, 0.9999994039535522, 2.183796254939807e-08, 0.9999998807907104, 0.5874932408332825, 0.9995428323745728, 0.021272335201501846, 0.9989941716194153, 0.9998495578765869, 0.7510195374488831, 1.0, 1.0, 1.0, 1.0, 0.9991150498390198, 0.2169639766216278, 1.0, 0.9971312284469604, 0.9999995231628418, 1.0, 1.0, 1.0, 0.9999862909317017, 1.0, 1.0, 0.9999991655349731, 0.8336784839630127, 1.5732430256321095e-05, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9999998807907104, 0.9846424460411072, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9901317358016968, 0.9998890161514282, 0.9999995231628418, 1.0, 1.0, 1.0, 0.0563710555434227, 0.9999991655349731, 0.9998185038566589, 0.9998916387557983, 1.0, 0.9999997615814209, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 0.06990262120962143, 0.007379468996077776, 0.9977182149887085, 0.8363181352615356, 0.9999158382415771, 0.9881265163421631, 0.9999817609786987, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999992847442627, 0.9999922513961792, 1.0, 0.9997103810310364, 0.9983556866645813, 0.9646293520927429, 1.0, 1.0, 1.0, 0.9651395678520203, 0.7619080543518066, 0.19460275769233704, 1.0, 0.9999998807907104, 1.0, 0.9669091701507568, 0.962605357170105, 0.7340160012245178, 0.8752768635749817, 0.1789446920156479, 0.16496670246124268, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0620342857325064e-24, 6.088170881322109e-21, 1.180983150822841e-23, 1.0, 1.0, 1.0, 0.00010435185686219484, 0.9999998807907104, 0.0032087014988064766, 0.0023902682587504387, 0.999995231628418, 0.05875006690621376, 1.0, 1.0, 1.0, 0.9999995231628418, 1.0, 0.9999964237213135, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9999960660934448, 0.9999305009841919, 0.0012216647155582905, 0.0010643379064276814, 0.13366946578025818, 0.999930739402771, 0.007435685954988003, 0.9999104738235474, 1.0, 4.0953349525807425e-05, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999815225601196, 1.0, 1.0, 0.8409857153892517, 7.097426119040406e-11, 0.004800115246325731, 0.9977512955665588, 9.032396497410389e-10, 1.6307099341946622e-19, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.8530381321907043, 0.993071973323822, 0.007897533476352692, 0.9978089928627014, 0.18295353651046753, 5.015596826751789e-08, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9463525414466858, 1.0, 0.9978724718093872, 0.999834418296814, 0.11192909628152847, 0.2000609040260315, 0.924461305141449, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0576368011534214, 0.12071438133716583, 0.11938026547431946, 0.9998233914375305, 0.9995531439781189, 0.9999972581863403, 8.032269960267513e-08, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999934434890747, 1.0, 1.0, 0.999995231628418, 1.0, 1.0, 0.998900294303894, 1.0, 1.0, 1.0, 1.0, 0.36604249477386475, 0.44349732995033264, 0.9247777462005615, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9998809099197388, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999988079071045, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999139308929443, 0.9899723529815674, 0.9999699592590332, 1.0, 1.0, 1.0, 0.9999992847442627, 1.0, 1.0, 0.6514559984207153, 0.6455770134925842, 0.9992250204086304, 3.245292923281795e-12, 0.001053312444128096, 1.196616807377926e-12, 1.0, 1.0, 1.0, 1.0, 0.04822896793484688, 1.0, 0.24687150120735168, 0.82968670129776, 0.998563826084137, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9997263550758362, 0.047536421567201614, 0.9996215105056763, 0.944694995880127, 0.9996625185012817, 0.004437606316059828, 0.9999985694885254, 1.0, 0.0014463759725913405, 1.0, 1.0, 1.0, 0.22832714021205902, 0.9974303841590881, 1.0, 4.2181735881996474e-10, 1.4124933387098422e-14, 0.9919811487197876, 1.0, 1.0, 1.0, 0.7390985488891602, 0.8080968260765076, 0.9495129585266113, 8.72446980793029e-06, 6.367394922091918e-19, 0.4959274232387543, 1.0, 1.0, 1.0, 3.120997860150965e-08, 0.9374096393585205, 0.9997925162315369, 0.18288327753543854, 0.9924758076667786, 1.8145732884580822e-18, 1.0, 1.0, 1.0, 1.0, 0.9683384895324707, 1.0, 1.0, 0.9999980926513672, 1.0, 0.018260309472680092, 1.3441892741756573e-16, 0.9476416110992432, 0.44495171308517456, 0.9997991919517517, 0.9986826777458191, 0.8299558758735657, 1.0, 0.9999905824661255, 0.9990981817245483, 0.9999996423721313, 0.7432786822319031, 1.0, 1.0, 1.0, 0.04284186661243439, 0.00012644358503166586, 0.0012601334601640701, 0.9999045133590698, 4.095253098057583e-05, 0.05033750459551811, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999231100082397, 0.9170622825622559, 0.18232697248458862, 3.756769956453354e-06, 0.0008382505038753152, 0.001783907413482666, 0.8928860425949097, 0.15009157359600067, 0.0005657888250425458, 1.0, 1.0, 1.0, 0.17314068973064423, 1.0, 1.0, 0.8565224409103394, 0.9213998913764954, 0.714292585849762, 0.9996654987335205, 0.9998977184295654, 0.9985538125038147, 0.9999996423721313, 1.0, 1.0, 0.9999371767044067, 0.9998791217803955, 0.9999970197677612, 1.0, 1.0, 1.0, 0.9561275243759155, 1.0, 1.0, 0.985784113407135, 1.0, 1.0, 1.0, 1.0, 0.9322072863578796, 1.0, 1.0, 1.0, 0.9991593360900879, 0.0036249819677323103, 9.726933147824468e-11, 1.0, 1.0, 1.0, 0.402014821767807, 0.9588399529457092, 0.2821159362792969, 0.9999998807907104, 0.9999971389770508, 0.9999994039535522, 1.0, 0.9127115607261658, 1.0, 0.9999947547912598, 0.9754000306129456, 0.9979546070098877, 1.0, 1.0, 1.0, 0.954058051109314, 0.03224389627575874, 0.06501447409391403, 1.0, 1.0, 1.0, 0.0031073996797204018, 0.8269851207733154, 0.0004920486244373024, 0.045037347823381424, 0.49919962882995605, 0.09731287509202957, 0.9036116003990173, 1.0, 0.9901642203330994, 0.9870404601097107, 0.9245648384094238, 2.299841435160488e-05, 0.9164133667945862, 0.9991269707679749, 0.9894953370094299, 0.9999722242355347, 0.9937399625778198, 0.0005087232566438615, 0.9999991655349731, 1.0, 1.0, 1.0, 1.0, 1.0, 0.29392164945602417, 0.8249218463897705, 0.00014030154852662235, 1.0, 1.0, 0.7371322512626648, 1.0, 1.0, 1.0, 1.0, 0.9854080080986023, 1.0, 0.9999998807907104, 0.9999945163726807, 0.9999994039535522, 0.485139399766922, 0.9997624754905701, 0.9709700345993042, 0.9963377714157104, 0.9097855091094971, 0.9918638467788696, 1.0, 0.9999845027923584, 1.0, 1.0, 1.0, 0.9988272786140442, 0.0568101704120636, 0.009536257945001125, 0.3273925185203552, 1.0, 1.0, 0.9993365406990051, 1.0, 1.0, 1.0, 0.9928966164588928, 1.0, 1.0, 0.9999974966049194, 0.9999994039535522, 0.9935064315795898, 0.9999957084655762, 0.9999920129776001, 0.9999996423721313, 1.0, 1.0, 0.9997485280036926, 1.0, 1.0, 1.0, 6.882417835640808e-08, 1.0, 1.0, 0.9999914169311523, 0.9999998807907104, 0.9999995231628418, 1.0, 1.0, 1.0, 0.9999998807907104, 0.999971866607666, 0.9997250437736511, 7.105042459443212e-05, 4.019464904558845e-05, 8.526481906301342e-06, 1.0, 0.9684842824935913, 1.0, 0.9994413256645203, 0.23811262845993042, 0.6160371899604797, 0.7871929407119751, 0.9997957348823547, 0.9999926090240479, 0.8046416640281677, 0.9993742108345032, 8.110196603183795e-08, 0.9896196722984314, 0.9999467134475708, 0.9906230568885803, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 0.8006301522254944, 0.23806864023208618, 0.13057906925678253, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9974685907363892, 0.9999090433120728, 0.9564679861068726, 0.9329842925071716, 0.6307148933410645, 0.5699298977851868, 0.9999957084655762, 0.9999998807907104, 0.999998927116394, 1.0, 0.999983549118042, 0.9999915361404419, 0.010316227562725544 ], "eval_math_runtime": 201.1907, "eval_math_samples_per_second": 3.728, "eval_math_score": -0.16692234575748444, "eval_math_steps_per_second": 0.119, "step": 425 }, { "epoch": 7.47, "learning_rate": 0.0002, "loss": 0.0001, "step": 426 }, { "epoch": 7.49, "learning_rate": 0.0002, "loss": 0.0001, "step": 427 }, { "epoch": 7.51, "learning_rate": 0.0002, "loss": 0.0002, "step": 428 }, { "epoch": 7.53, "learning_rate": 0.0002, "loss": 0.0002, "step": 429 }, { "epoch": 7.54, "learning_rate": 0.0002, "loss": 0.0002, "step": 430 }, { "epoch": 7.56, "learning_rate": 0.0002, "loss": 0.0001, "step": 431 }, { "epoch": 7.58, "learning_rate": 0.0002, "loss": 0.0047, "step": 432 }, { "epoch": 7.6, "learning_rate": 0.0002, "loss": 0.0009, "step": 433 }, { "epoch": 7.61, "learning_rate": 0.0002, "loss": 0.0002, "step": 434 }, { "epoch": 7.63, "learning_rate": 0.0002, "loss": 0.0028, "step": 435 }, { "epoch": 7.65, "learning_rate": 0.0002, "loss": 0.0002, "step": 436 }, { "epoch": 7.67, "learning_rate": 0.0002, "loss": 0.0, "step": 437 }, { "epoch": 7.68, "learning_rate": 0.0002, "loss": 0.0014, "step": 438 }, { "epoch": 7.7, "learning_rate": 0.0002, "loss": 0.0, "step": 439 }, { "epoch": 7.72, "learning_rate": 0.0002, "loss": 0.0, "step": 440 }, { "epoch": 7.74, "learning_rate": 0.0002, "loss": 0.0, "step": 441 }, { "epoch": 7.75, "learning_rate": 0.0002, "loss": 0.0012, "step": 442 }, { "epoch": 7.77, "learning_rate": 0.0002, "loss": 0.0, "step": 443 }, { "epoch": 7.79, "learning_rate": 0.0002, "loss": 0.0029, "step": 444 }, { "epoch": 7.81, "learning_rate": 0.0002, "loss": 0.001, "step": 445 }, { "epoch": 7.82, "learning_rate": 0.0002, "loss": 0.0002, "step": 446 }, { "epoch": 7.84, "learning_rate": 0.0002, "loss": 0.0001, "step": 447 }, { "epoch": 7.86, "learning_rate": 0.0002, "loss": 0.0, "step": 448 }, { "epoch": 7.88, "learning_rate": 0.0002, "loss": 0.0023, "step": 449 }, { "epoch": 7.89, "learning_rate": 0.0002, "loss": 0.0007, "step": 450 }, { "epoch": 7.89, "eval_math_accuracy": 0.8226666666666667, "eval_math_average_probability": 0.8231486678123474, "eval_math_brier_score": 0.15087273716926575, "eval_math_loss": 1.4901773929595947, "eval_math_probabilities": [ 0.9239053726196289, 0.9914353489875793, 0.921599805355072, 0.9999994039535522, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 0.9913091659545898, 0.9596307277679443, 0.9996600151062012, 0.44431233406066895, 0.0030062461737543344, 0.995681881904602, 0.5948647856712341, 0.8882448077201843, 0.9956990480422974, 0.9999998807907104, 0.0027931039221584797, 0.058440908789634705, 0.784626841545105, 0.3819577097892761, 0.06096562370657921, 0.9999974966049194, 1.0, 1.0, 0.9435833692550659, 0.8093113303184509, 0.00023006211267784238, 0.00941490102559328, 0.0009112543193623424, 6.099693905525783e-08, 0.8883617520332336, 1.0, 0.9999996423721313, 1.0, 1.0, 1.0, 0.01351217646151781, 0.5524713397026062, 0.00025684060528874397, 1.0, 1.0, 1.0, 0.2181817591190338, 0.7950264811515808, 0.9649515151977539, 1.0, 1.0, 0.9999971389770508, 1.0, 0.999998927116394, 1.0, 0.4840643107891083, 0.9999996423721313, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999185800552368, 0.9986773133277893, 0.7882561087608337, 0.976597011089325, 1.0, 2.6140506648175688e-08, 0.036801569163799286, 0.9917424917221069, 0.9999079704284668, 0.9999979734420776, 1.0, 0.9999997615814209, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 0.9999924898147583, 1.0, 0.9999988079071045, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 1.8731946056504967e-06, 0.002899725688621402, 0.02183137834072113, 1.0, 1.0, 1.0, 1.3679346011485904e-05, 0.9998447895050049, 0.007827834226191044, 1.0, 1.0, 1.0, 0.9999973773956299, 1.0, 0.9996342658996582, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9997289776802063, 0.0770987793803215, 0.43676233291625977, 0.03264642506837845, 0.008658229373395443, 7.702442239576612e-09, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999992847442627, 1.0, 1.0, 2.8098320399294607e-05, 0.0009188771364279091, 0.9850959181785583, 1.0, 1.0, 1.0, 0.9999982118606567, 0.9999587535858154, 0.9999582767486572, 0.4582568407058716, 0.9582631587982178, 0.9994751811027527, 1.0, 1.0, 1.0, 0.04642268270254135, 1.0, 1.0, 0.9999995231628418, 1.0, 0.9999997615814209, 1.0, 1.0, 1.0, 1.1851168437715387e-06, 0.9574934840202332, 0.9921191930770874, 1.0, 1.0, 1.0, 1.3126104931870941e-06, 0.00022904806246515363, 0.32020890712738037, 0.9999997615814209, 0.9888445734977722, 0.9945164322853088, 1.0, 0.9712098836898804, 0.9999996423721313, 1.0, 0.9999264478683472, 1.0, 0.9195393323898315, 3.0430180944507335e-12, 0.9092803001403809, 0.999991774559021, 0.9996827840805054, 0.9999270439147949, 1.0, 1.0, 1.0, 0.9993854761123657, 0.9996569156646729, 0.9999822378158569, 0.0732436552643776, 0.3402455747127533, 0.0005144833703525364, 0.9998973608016968, 0.9999876022338867, 0.9999921321868896, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999974250793457, 1.0, 0.9995405673980713, 0.9999878406524658, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9999977350234985, 1.0, 0.10239828377962112, 0.04974702373147011, 0.1481255143880844, 1.0, 0.985121488571167, 0.04474596306681633, 0.9999998807907104, 1.0, 0.999998927116394, 1.0, 1.0, 1.0, 0.9999998807907104, 3.14048447762616e-05, 1.0, 0.588689923286438, 0.9988573789596558, 0.03614448755979538, 0.9992820620536804, 0.995924711227417, 0.9808118343353271, 1.0, 1.0, 1.0, 1.0, 0.9991642236709595, 0.3002437353134155, 1.0, 0.9999678134918213, 0.9999997615814209, 1.0, 1.0, 1.0, 0.9990770816802979, 1.0, 0.9999994039535522, 0.9999696016311646, 0.005247556138783693, 1.6901117305678781e-06, 1.0, 1.0, 1.0, 0.9999994039535522, 0.9999995231628418, 0.9446089267730713, 1.0, 1.0, 0.9999994039535522, 1.0, 1.0, 1.0, 0.18130998313426971, 0.9241143465042114, 0.9995156526565552, 0.9999991655349731, 0.9999964237213135, 0.9999991655349731, 0.00029783774516545236, 0.9999966621398926, 0.9992720484733582, 0.9999902248382568, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999994039535522, 1.0, 0.9577848315238953, 4.943424869452429e-07, 0.9480537176132202, 0.3113512098789215, 0.9999508857727051, 0.9394336342811584, 0.9999984502792358, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.99998939037323, 0.9999973773956299, 0.9999997615814209, 0.9997233748435974, 0.9980523586273193, 0.9656923413276672, 1.0, 1.0, 0.9999998807907104, 0.9160833358764648, 0.5492163896560669, 0.08401793241500854, 1.0, 0.9999992847442627, 1.0, 0.3519839942455292, 0.7853103280067444, 0.5517084002494812, 0.8601536750793457, 0.38083046674728394, 0.729615330696106, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0213258264082417e-25, 4.821225244289976e-16, 4.896013080325593e-22, 1.0, 1.0, 0.9999998807907104, 5.73167471884517e-06, 0.9999983310699463, 0.11611205339431763, 0.01825742982327938, 0.9999973773956299, 0.30883508920669556, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999998927116394, 0.9999730587005615, 0.9999656677246094, 0.37369856238365173, 0.27871283888816833, 0.6080510020256042, 0.9999688863754272, 0.8688474297523499, 0.9999549388885498, 0.9999886751174927, 2.73392771532599e-07, 0.9999935626983643, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9994915723800659, 1.0, 1.0, 0.84340500831604, 3.61705296825221e-08, 0.0027160155586898327, 0.9997060894966125, 1.8469190621317466e-09, 1.6744067840285416e-19, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9237469434738159, 0.9548180103302002, 0.0005167446797713637, 0.9930068254470825, 0.09534699469804764, 1.1124318177735404e-07, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.49935436248779297, 0.9999961853027344, 0.9928207993507385, 0.9986525774002075, 0.010878274217247963, 0.7615596055984497, 0.8041813373565674, 1.0, 0.9999998807907104, 1.0, 0.9999992847442627, 0.9999998807907104, 0.9999986886978149, 0.25856664776802063, 0.2049965262413025, 0.4124404191970825, 0.999995231628418, 0.9999736547470093, 0.9999970197677612, 9.8270591664118e-10, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999970197677612, 1.0, 1.0, 0.9995539784431458, 1.0, 1.0, 1.0, 1.0, 0.999925971031189, 0.999817430973053, 0.999998927116394, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999997615814209, 0.9987339377403259, 0.9999996423721313, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999997615814209, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999595880508423, 0.9996155500411987, 0.9999510049819946, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.5243324637413025, 0.8197103142738342, 0.9999879598617554, 1.1736015492758156e-09, 0.27829185128211975, 5.975554252801718e-13, 1.0, 1.0, 1.0, 1.0, 0.059172868728637695, 0.9999998807907104, 0.6861754059791565, 0.7072870135307312, 0.9892241358757019, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9977534413337708, 0.8695911765098572, 0.9997572302818298, 0.9989548921585083, 0.9999650716781616, 8.790813444647938e-05, 1.0, 1.0, 0.002240023110061884, 1.0, 1.0, 1.0, 0.982358992099762, 0.99094557762146, 0.9999955892562866, 5.570710072788643e-06, 3.384095575379581e-13, 0.9898569583892822, 1.0, 1.0, 1.0, 0.9680998921394348, 0.9929165840148926, 0.7218322157859802, 0.007455885410308838, 3.7163031847827974e-14, 0.7168830037117004, 1.0, 1.0, 1.0, 2.626086847978826e-10, 0.2648669481277466, 0.9866816997528076, 0.196028470993042, 0.9984558820724487, 3.594160972908234e-18, 1.0, 1.0, 1.0, 1.0, 0.9993607401847839, 1.0, 1.0, 1.0, 1.0, 0.48612046241760254, 2.6694876864574724e-10, 0.9898063540458679, 0.7095587849617004, 0.9993749260902405, 0.997785210609436, 0.23270659148693085, 1.0, 0.9999325275421143, 0.9999686479568481, 1.0, 0.7869887948036194, 1.0, 1.0, 1.0, 0.3207952678203583, 0.004731073975563049, 0.0005691531114280224, 0.9999923706054688, 1.0497638868400827e-05, 0.06314487755298615, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9992094039916992, 0.5074410438537598, 0.050677862018346786, 9.450040576453045e-12, 0.1405748575925827, 3.778605517368305e-08, 0.7739189267158508, 0.267483651638031, 0.0006217024056240916, 1.0, 1.0, 1.0, 0.71587735414505, 1.0, 0.9999998807907104, 0.9999972581863403, 0.9999758005142212, 0.9998742341995239, 1.0, 0.9999997615814209, 0.9999986886978149, 0.9716106057167053, 0.9999899864196777, 0.9999732971191406, 0.9999827146530151, 0.9999700784683228, 0.9999990463256836, 1.0, 1.0, 1.0, 0.7871241569519043, 1.0, 1.0, 0.9997413754463196, 1.0, 0.9999961853027344, 1.0, 1.0, 0.9154285192489624, 1.0, 1.0, 1.0, 0.9874365329742432, 0.03577687218785286, 2.2873113181276494e-08, 0.9999995231628418, 1.0, 1.0, 0.29337573051452637, 0.9707481861114502, 0.3059193789958954, 1.0, 0.9999998807907104, 1.0, 1.0, 0.8543777465820312, 1.0, 0.9999767541885376, 0.5028933882713318, 0.9814267754554749, 0.9999998807907104, 1.0, 1.0, 0.4589194059371948, 0.0031717868987470865, 0.1995445340871811, 1.0, 1.0, 1.0, 0.017423370853066444, 0.932735800743103, 0.00034494130522944033, 0.1460781991481781, 0.5285971164703369, 0.3104550838470459, 0.9691990613937378, 1.0, 0.9999990463256836, 0.9960052371025085, 0.947685718536377, 0.08451879024505615, 0.9986949563026428, 0.9998329877853394, 0.9995916485786438, 0.9997366070747375, 0.9999561309814453, 0.2768760025501251, 0.9999997615814209, 1.0, 1.0, 1.0, 1.0, 1.0, 0.13963018357753754, 0.7366341948509216, 0.0003211094008293003, 1.0, 1.0, 0.7871561050415039, 1.0, 1.0, 1.0, 1.0, 0.9931434392929077, 1.0, 0.9999877214431763, 0.999872088432312, 0.9999040365219116, 0.8578472137451172, 0.9999938011169434, 0.9966552257537842, 0.9999580383300781, 0.9935801029205322, 0.9762104749679565, 1.0, 0.9999942779541016, 1.0, 0.9999997615814209, 1.0, 0.9991713762283325, 0.5521931052207947, 0.886752724647522, 0.4335101842880249, 1.0, 1.0, 0.9999598264694214, 0.9999998807907104, 0.9999991655349731, 1.0, 1.0, 1.0, 1.0, 0.991171658039093, 0.9869080781936646, 0.7598368525505066, 0.9999867677688599, 0.9999927282333374, 0.9999973773956299, 1.0, 1.0, 0.9999912977218628, 1.0, 1.0, 1.0, 3.261148231104016e-05, 1.0, 0.9999998807907104, 0.9994763731956482, 0.9997290968894958, 0.9996564388275146, 1.0, 1.0, 1.0, 0.9999809265136719, 0.9999111890792847, 0.99977046251297, 0.003256274852901697, 1.0568313882686198e-05, 0.0021818047389388084, 1.0, 0.9988057613372803, 1.0, 0.9631175994873047, 0.05034251511096954, 0.40571507811546326, 0.009977717883884907, 0.9992716908454895, 0.998954176902771, 0.9883847236633301, 0.9935011267662048, 2.1372079217485407e-08, 0.9975237250328064, 0.9998492002487183, 0.8964678049087524, 0.9999979734420776, 1.0, 1.0, 1.0, 1.0, 1.0, 0.21022698283195496, 0.054552774876356125, 0.11311953514814377, 1.0, 1.0, 1.0, 0.9999997615814209, 1.0, 0.9999662637710571, 0.996638298034668, 0.9127888679504395, 0.8756287097930908, 0.9517530798912048, 0.6561786532402039, 0.9998680353164673, 0.9999420642852783, 0.99873286485672, 1.0, 0.9999878406524658, 0.9999885559082031, 0.016727229580283165 ], "eval_math_runtime": 201.1466, "eval_math_samples_per_second": 3.729, "eval_math_score": -0.15087273716926575, "eval_math_steps_per_second": 0.119, "step": 450 }, { "train_runtime": 4.0665, "train_samples_per_second": 786.918, "train_steps_per_second": 24.591, "total_flos": 0.0, "train_loss": 0.0, "epoch": 7.89, "step": 450 } ]