[ { "loss": 0.7082, "learning_rate": 7.2e-05, "epoch": 0.02, "step": 1 }, { "loss": 0.7006, "learning_rate": 7.2e-05, "epoch": 0.04, "step": 2 }, { "loss": 0.6979, "learning_rate": 7.2e-05, "epoch": 0.05, "step": 3 }, { "loss": 0.6887, "learning_rate": 7.2e-05, "epoch": 0.07, "step": 4 }, { "loss": 0.6946, "learning_rate": 7.2e-05, "epoch": 0.09, "step": 5 }, { "loss": 0.6997, "learning_rate": 7.2e-05, "epoch": 0.11, "step": 6 }, { "loss": 0.6956, "learning_rate": 7.2e-05, "epoch": 0.12, "step": 7 }, { "loss": 0.6916, "learning_rate": 7.2e-05, "epoch": 0.14, "step": 8 }, { "loss": 0.6935, "learning_rate": 7.2e-05, "epoch": 0.16, "step": 9 }, { "loss": 0.6894, "learning_rate": 7.2e-05, "epoch": 0.18, "step": 10 }, { "loss": 0.6924, "learning_rate": 7.2e-05, "epoch": 0.19, "step": 11 }, { "loss": 0.6834, "learning_rate": 7.2e-05, "epoch": 0.21, "step": 12 }, { "loss": 0.6911, "learning_rate": 7.2e-05, "epoch": 0.23, "step": 13 }, { "loss": 0.6945, "learning_rate": 7.2e-05, "epoch": 0.25, "step": 14 }, { "loss": 0.6819, "learning_rate": 7.2e-05, "epoch": 0.26, "step": 15 }, { "loss": 0.6824, "learning_rate": 7.2e-05, "epoch": 0.28, "step": 16 }, { "loss": 0.692, "learning_rate": 7.2e-05, "epoch": 0.3, "step": 17 }, { "loss": 0.6878, "learning_rate": 7.2e-05, "epoch": 0.32, "step": 18 }, { "loss": 0.6739, "learning_rate": 7.2e-05, "epoch": 0.33, "step": 19 }, { "loss": 0.6814, "learning_rate": 7.2e-05, "epoch": 0.35, "step": 20 }, { "loss": 0.6755, "learning_rate": 7.2e-05, "epoch": 0.37, "step": 21 }, { "loss": 0.6525, "learning_rate": 7.2e-05, "epoch": 0.39, "step": 22 }, { "loss": 0.6933, "learning_rate": 7.2e-05, "epoch": 0.4, "step": 23 }, { "loss": 0.6912, "learning_rate": 7.2e-05, "epoch": 0.42, "step": 24 }, { "loss": 0.6837, "learning_rate": 7.2e-05, "epoch": 0.44, "step": 25 }, { "eval_math_hard_loss": 0.6894748210906982, "eval_math_hard_score": -0.24721547961235046, "eval_math_hard_brier_score": 0.24721547961235046, "eval_math_hard_average_probability": 0.503162682056427, "eval_math_hard_accuracy": 0.67, "eval_math_hard_probabilities": [ 0.4227713644504547, 0.4243110716342926, 0.4217226803302765, 0.5080846548080444, 0.5003512501716614, 0.5066218972206116, 0.5015118718147278, 0.500447154045105, 0.5005831122398376, 0.5008090734481812, 0.4988376200199127, 0.5015636682510376, 0.49952030181884766, 0.5036075115203857, 0.5045143961906433, 0.4983898401260376, 0.5007873773574829, 0.5014252662658691, 0.5002598166465759, 0.5008907318115234, 0.5009533166885376, 0.5221489071846008, 0.5234034657478333, 0.5247792601585388, 0.5126287937164307, 0.5133108496665955, 0.5110536813735962, 0.5020310282707214, 0.4892224371433258, 0.5109142065048218, 0.5004593729972839, 0.5045181512832642, 0.49915167689323425, 0.49843019247055054, 0.4997433125972748, 0.49867600202560425, 0.502083957195282, 0.501447856426239, 0.5003753304481506, 0.5011199712753296, 0.49873456358909607, 0.49848291277885437, 0.48643049597740173, 0.49849626421928406, 0.48845013976097107, 0.5013667345046997, 0.500347375869751, 0.5004876255989075, 0.5421925783157349, 0.557721734046936, 0.5099676847457886, 0.49849411845207214, 0.4995008707046509, 0.49974963068962097, 0.5455760955810547, 0.5438253283500671, 0.5432474613189697, 0.5029205679893494, 0.4974336326122284, 0.5029483437538147, 0.5062002539634705, 0.509421169757843, 0.5076862573623657, 0.4995964765548706, 0.502112090587616, 0.5017081499099731, 0.49831974506378174, 0.4960530996322632, 0.4953078627586365, 0.5019406676292419, 0.4999215304851532, 0.498506635427475, 0.5036457777023315, 0.5040311217308044, 0.5019571185112, 0.5034784078598022, 0.5008260011672974, 0.5031225681304932, 0.5478922128677368, 0.5407694578170776, 0.5346946120262146, 0.5009269714355469, 0.501581072807312, 0.5043609142303467, 0.5141059756278992, 0.5151600241661072, 0.4976750612258911, 0.5016065239906311, 0.501369833946228, 0.5012784600257874, 0.49994927644729614, 0.5037755370140076, 0.5020310878753662, 0.4963326156139374, 0.49563106894493103, 0.49556463956832886, 0.49954840540885925, 0.49477893114089966, 0.5013437867164612, 0.502220630645752 ], "eval_math_hard_runtime": 19.1857, "eval_math_hard_samples_per_second": 5.212, "eval_math_hard_steps_per_second": 0.104, "epoch": 0.44, "step": 25 }, { "loss": 0.6608, "learning_rate": 7.2e-05, "epoch": 0.46, "step": 26 }, { "loss": 0.6878, "learning_rate": 7.2e-05, "epoch": 0.47, "step": 27 }, { "loss": 0.6559, "learning_rate": 7.2e-05, "epoch": 0.49, "step": 28 }, { "loss": 0.6863, "learning_rate": 7.2e-05, "epoch": 0.51, "step": 29 }, { "loss": 0.6592, "learning_rate": 7.2e-05, "epoch": 0.53, "step": 30 }, { "loss": 0.6823, "learning_rate": 7.2e-05, "epoch": 0.54, "step": 31 }, { "loss": 0.6765, "learning_rate": 7.2e-05, "epoch": 0.56, "step": 32 }, { "loss": 0.6858, "learning_rate": 7.2e-05, "epoch": 0.58, "step": 33 }, { "loss": 0.6909, "learning_rate": 7.2e-05, "epoch": 0.6, "step": 34 }, { "loss": 0.6811, "learning_rate": 7.2e-05, "epoch": 0.61, "step": 35 }, { "loss": 0.6753, "learning_rate": 7.2e-05, "epoch": 0.63, "step": 36 }, { "loss": 0.6758, "learning_rate": 7.2e-05, "epoch": 0.65, "step": 37 }, { "loss": 0.6865, "learning_rate": 7.2e-05, "epoch": 0.67, "step": 38 }, { "loss": 0.6402, "learning_rate": 7.2e-05, "epoch": 0.68, "step": 39 }, { "loss": 0.6536, "learning_rate": 7.2e-05, "epoch": 0.7, "step": 40 }, { "loss": 0.645, "learning_rate": 7.2e-05, "epoch": 0.72, "step": 41 }, { "loss": 0.6855, "learning_rate": 7.2e-05, "epoch": 0.74, "step": 42 }, { "loss": 0.6286, "learning_rate": 7.2e-05, "epoch": 0.75, "step": 43 }, { "loss": 0.6574, "learning_rate": 7.2e-05, "epoch": 0.77, "step": 44 }, { "loss": 0.668, "learning_rate": 7.2e-05, "epoch": 0.79, "step": 45 }, { "loss": 0.6643, "learning_rate": 7.2e-05, "epoch": 0.81, "step": 46 }, { "loss": 0.6755, "learning_rate": 7.2e-05, "epoch": 0.82, "step": 47 }, { "loss": 0.6663, "learning_rate": 7.2e-05, "epoch": 0.84, "step": 48 }, { "loss": 0.6525, "learning_rate": 7.2e-05, "epoch": 0.86, "step": 49 }, { "loss": 0.676, "learning_rate": 7.2e-05, "epoch": 0.88, "step": 50 }, { "eval_math_hard_loss": 0.6725212931632996, "eval_math_hard_score": -0.24000222980976105, "eval_math_hard_brier_score": 0.24000222980976105, "eval_math_hard_average_probability": 0.5112404823303223, "eval_math_hard_accuracy": 0.71, "eval_math_hard_probabilities": [ 0.45277896523475647, 0.45469722151756287, 0.45128071308135986, 0.5148431658744812, 0.5021870732307434, 0.5043631792068481, 0.5066627860069275, 0.5054929256439209, 0.5019177794456482, 0.5219594240188599, 0.5049334764480591, 0.5112125277519226, 0.5003976821899414, 0.5065910220146179, 0.5072922110557556, 0.4964824318885803, 0.5019433498382568, 0.5026321411132812, 0.5000293850898743, 0.49963968992233276, 0.5028585195541382, 0.5398517847061157, 0.5473343729972839, 0.5544767379760742, 0.5060956478118896, 0.5239856839179993, 0.5277472734451294, 0.4985102713108063, 0.47175613045692444, 0.5033620595932007, 0.49817827343940735, 0.5102205872535706, 0.49686363339424133, 0.4992176294326782, 0.503284752368927, 0.5037179589271545, 0.5031449794769287, 0.5042518973350525, 0.5031511783599854, 0.49838143587112427, 0.4941232204437256, 0.4982997477054596, 0.4887068271636963, 0.4955118000507355, 0.4895956814289093, 0.5002733469009399, 0.5003429055213928, 0.49709463119506836, 0.5760056972503662, 0.571745753288269, 0.5338752865791321, 0.4955299496650696, 0.5003539323806763, 0.49888306856155396, 0.6243072748184204, 0.6245272755622864, 0.6229971647262573, 0.5035498738288879, 0.49556151032447815, 0.5018459558486938, 0.5172255039215088, 0.5213637948036194, 0.5222153067588806, 0.5011674165725708, 0.5060593485832214, 0.504572868347168, 0.4984975755214691, 0.5009143352508545, 0.4929470717906952, 0.4994816482067108, 0.49936628341674805, 0.4988759160041809, 0.5091677904129028, 0.5084511637687683, 0.5050278902053833, 0.5068730115890503, 0.5035209059715271, 0.5078574419021606, 0.6247063279151917, 0.6266769170761108, 0.6112779974937439, 0.5065394639968872, 0.5045663118362427, 0.5105231404304504, 0.5081201791763306, 0.5091950297355652, 0.5013695955276489, 0.5074512362480164, 0.50473552942276, 0.5031643509864807, 0.5013434290885925, 0.5119460225105286, 0.5085548162460327, 0.5006793737411499, 0.503533661365509, 0.4990837275981903, 0.47225868701934814, 0.4665180742740631, 0.47514545917510986, 0.5062111020088196 ], "eval_math_hard_runtime": 19.1606, "eval_math_hard_samples_per_second": 5.219, "eval_math_hard_steps_per_second": 0.104, "epoch": 0.88, "step": 50 }, { "loss": 0.6385, "learning_rate": 7.2e-05, "epoch": 0.89, "step": 51 }, { "loss": 0.6424, "learning_rate": 7.2e-05, "epoch": 0.91, "step": 52 }, { "loss": 0.6859, "learning_rate": 7.2e-05, "epoch": 0.93, "step": 53 }, { "loss": 0.6738, "learning_rate": 7.2e-05, "epoch": 0.95, "step": 54 }, { "loss": 0.6795, "learning_rate": 7.2e-05, "epoch": 0.96, "step": 55 }, { "loss": 0.6794, "learning_rate": 7.2e-05, "epoch": 0.98, "step": 56 }, { "loss": 0.6308, "learning_rate": 7.2e-05, "epoch": 1.0, "step": 57 }, { "loss": 0.5867, "learning_rate": 7.2e-05, "epoch": 1.02, "step": 58 }, { "loss": 0.651, "learning_rate": 7.2e-05, "epoch": 1.04, "step": 59 }, { "loss": 0.6177, "learning_rate": 7.2e-05, "epoch": 1.05, "step": 60 }, { "loss": 0.6132, "learning_rate": 7.2e-05, "epoch": 1.07, "step": 61 }, { "loss": 0.6702, "learning_rate": 7.2e-05, "epoch": 1.09, "step": 62 }, { "loss": 0.6141, "learning_rate": 7.2e-05, "epoch": 1.11, "step": 63 }, { "loss": 0.6563, "learning_rate": 7.2e-05, "epoch": 1.12, "step": 64 }, { "loss": 0.6674, "learning_rate": 7.2e-05, "epoch": 1.14, "step": 65 }, { "loss": 0.6499, "learning_rate": 7.2e-05, "epoch": 1.16, "step": 66 }, { "loss": 0.6782, "learning_rate": 7.2e-05, "epoch": 1.18, "step": 67 }, { "loss": 0.6058, "learning_rate": 7.2e-05, "epoch": 1.19, "step": 68 }, { "loss": 0.5962, "learning_rate": 7.2e-05, "epoch": 1.21, "step": 69 }, { "loss": 0.6426, "learning_rate": 7.2e-05, "epoch": 1.23, "step": 70 }, { "loss": 0.626, "learning_rate": 7.2e-05, "epoch": 1.25, "step": 71 }, { "loss": 0.6095, "learning_rate": 7.2e-05, "epoch": 1.26, "step": 72 }, { "loss": 0.6375, "learning_rate": 7.2e-05, "epoch": 1.28, "step": 73 }, { "loss": 0.5938, "learning_rate": 7.2e-05, "epoch": 1.3, "step": 74 }, { "loss": 0.5915, "learning_rate": 7.2e-05, "epoch": 1.32, "step": 75 }, { "eval_math_hard_loss": 0.6123586893081665, "eval_math_hard_score": -0.2185293436050415, "eval_math_hard_brier_score": 0.2185293436050415, "eval_math_hard_average_probability": 0.5461798310279846, "eval_math_hard_accuracy": 0.7, "eval_math_hard_probabilities": [ 0.6981080174446106, 0.6993874907493591, 0.6964402198791504, 0.496179461479187, 0.5118089318275452, 0.4348101019859314, 0.5450701713562012, 0.5478569865226746, 0.5073054432868958, 0.6003513336181641, 0.48766252398490906, 0.5207421183586121, 0.5321508646011353, 0.5228312611579895, 0.5217955112457275, 0.4980320930480957, 0.5108472108840942, 0.5094117522239685, 0.5452646613121033, 0.5308429002761841, 0.5391503572463989, 0.685689389705658, 0.7256925106048584, 0.7535527348518372, 0.492637038230896, 0.5849336385726929, 0.6581502556800842, 0.507750391960144, 0.4166055917739868, 0.537865400314331, 0.480641633272171, 0.5339422821998596, 0.4952820837497711, 0.5112771987915039, 0.5374191403388977, 0.5484182834625244, 0.5139420032501221, 0.5436358451843262, 0.535308301448822, 0.4862540364265442, 0.46842843294143677, 0.5044496655464172, 0.47761040925979614, 0.47824832797050476, 0.49812138080596924, 0.49636951088905334, 0.5025320053100586, 0.45967310667037964, 0.47252291440963745, 0.43059277534484863, 0.34971874952316284, 0.47613152861595154, 0.50247722864151, 0.5095160603523254, 0.948936939239502, 0.9514877200126648, 0.9500554800033569, 0.5087370276451111, 0.4877012372016907, 0.49044281244277954, 0.5669111609458923, 0.5985153317451477, 0.6142491698265076, 0.5062389969825745, 0.5240121483802795, 0.5009501576423645, 0.5466399788856506, 0.5929512977600098, 0.4971684515476227, 0.4791565537452698, 0.49307700991630554, 0.4976717531681061, 0.5357528328895569, 0.534887969493866, 0.5193175673484802, 0.5436345338821411, 0.5458875298500061, 0.5654334425926208, 0.8299615979194641, 0.8604872822761536, 0.8265635967254639, 0.5350908637046814, 0.5183643102645874, 0.5320155620574951, 0.4727846086025238, 0.46650999784469604, 0.5301773548126221, 0.5392518043518066, 0.532899022102356, 0.5097134113311768, 0.5105643272399902, 0.5698909163475037, 0.5556212663650513, 0.5259840488433838, 0.5478115081787109, 0.5297166705131531, 0.3596650958061218, 0.3327234983444214, 0.3539780080318451, 0.5469507575035095 ], "eval_math_hard_runtime": 19.1569, "eval_math_hard_samples_per_second": 5.22, "eval_math_hard_steps_per_second": 0.104, "epoch": 1.32, "step": 75 }, { "loss": 0.6574, "learning_rate": 7.2e-05, "epoch": 1.33, "step": 76 }, { "loss": 0.5659, "learning_rate": 7.2e-05, "epoch": 1.35, "step": 77 }, { "loss": 0.6504, "learning_rate": 7.2e-05, "epoch": 1.37, "step": 78 }, { "loss": 0.6161, "learning_rate": 7.2e-05, "epoch": 1.39, "step": 79 }, { "loss": 0.5772, "learning_rate": 7.2e-05, "epoch": 1.4, "step": 80 }, { "loss": 0.5762, "learning_rate": 7.2e-05, "epoch": 1.42, "step": 81 }, { "loss": 0.5572, "learning_rate": 7.2e-05, "epoch": 1.44, "step": 82 }, { "loss": 0.5432, "learning_rate": 7.2e-05, "epoch": 1.46, "step": 83 }, { "loss": 0.5356, "learning_rate": 7.2e-05, "epoch": 1.47, "step": 84 }, { "loss": 0.4974, "learning_rate": 7.2e-05, "epoch": 1.49, "step": 85 }, { "loss": 0.5639, "learning_rate": 7.2e-05, "epoch": 1.51, "step": 86 }, { "loss": 0.585, "learning_rate": 7.2e-05, "epoch": 1.53, "step": 87 }, { "loss": 0.5924, "learning_rate": 7.2e-05, "epoch": 1.54, "step": 88 }, { "loss": 0.5241, "learning_rate": 7.2e-05, "epoch": 1.56, "step": 89 }, { "loss": 0.591, "learning_rate": 7.2e-05, "epoch": 1.58, "step": 90 }, { "loss": 0.5843, "learning_rate": 7.2e-05, "epoch": 1.6, "step": 91 }, { "loss": 0.5517, "learning_rate": 7.2e-05, "epoch": 1.61, "step": 92 }, { "loss": 0.552, "learning_rate": 7.2e-05, "epoch": 1.63, "step": 93 }, { "loss": 0.5687, "learning_rate": 7.2e-05, "epoch": 1.65, "step": 94 }, { "loss": 0.5504, "learning_rate": 7.2e-05, "epoch": 1.67, "step": 95 }, { "loss": 0.6031, "learning_rate": 7.2e-05, "epoch": 1.68, "step": 96 }, { "loss": 0.5703, "learning_rate": 7.2e-05, "epoch": 1.7, "step": 97 }, { "loss": 0.5655, "learning_rate": 7.2e-05, "epoch": 1.72, "step": 98 }, { "loss": 0.5707, "learning_rate": 7.2e-05, "epoch": 1.74, "step": 99 }, { "loss": 0.5428, "learning_rate": 7.2e-05, "epoch": 1.75, "step": 100 }, { "eval_math_hard_loss": 0.5149410963058472, "eval_math_hard_score": -0.18658693134784698, "eval_math_hard_brier_score": 0.18658693134784698, "eval_math_hard_average_probability": 0.6249247193336487, "eval_math_hard_accuracy": 0.74, "eval_math_hard_probabilities": [ 0.9090185761451721, 0.9152910113334656, 0.920225203037262, 0.544651210308075, 0.48588231205940247, 0.26481539011001587, 0.6502981185913086, 0.7012529373168945, 0.5503808259963989, 0.6474319696426392, 0.42047441005706787, 0.4609397053718567, 0.626591682434082, 0.6665865778923035, 0.657002329826355, 0.5227519869804382, 0.5618593692779541, 0.5485963821411133, 0.8084971904754639, 0.7115694880485535, 0.7779558300971985, 0.9740842580795288, 0.9867558479309082, 0.9904892444610596, 0.7436046004295349, 0.7511422634124756, 0.8598321676254272, 0.7189204692840576, 0.6654929518699646, 0.7797940969467163, 0.49751776456832886, 0.6186977624893188, 0.5393147468566895, 0.5485488176345825, 0.6180264949798584, 0.6347217559814453, 0.42208293080329895, 0.5922693610191345, 0.5913844704627991, 0.4507058262825012, 0.36954668164253235, 0.5368402004241943, 0.4939379096031189, 0.4328914284706116, 0.585762083530426, 0.5262035727500916, 0.5042811632156372, 0.23688159883022308, 0.3037083148956299, 0.12116531282663345, 0.2997088134288788, 0.4748251438140869, 0.5383250713348389, 0.5640963315963745, 0.9970376491546631, 0.9975969195365906, 0.997580885887146, 0.513490617275238, 0.47000354528427124, 0.44651105999946594, 0.9373555183410645, 0.9684251546859741, 0.9780910015106201, 0.5609255433082581, 0.6275558471679688, 0.5644670724868774, 0.8380681276321411, 0.9534356594085693, 0.6312075257301331, 0.40665751695632935, 0.5042629837989807, 0.48140040040016174, 0.6677272915840149, 0.6427435278892517, 0.5668158531188965, 0.7906490564346313, 0.8034231662750244, 0.8900921940803528, 0.9583730697631836, 0.9730780124664307, 0.9701274633407593, 0.6236186623573303, 0.5862740278244019, 0.5670204162597656, 0.4843604266643524, 0.4715549647808075, 0.6955848336219788, 0.687962532043457, 0.7231170535087585, 0.4752002954483032, 0.31005188822746277, 0.7067242860794067, 0.6296723484992981, 0.6213487386703491, 0.7203496098518372, 0.6451394557952881, 0.10958302021026611, 0.08802775293588638, 0.10785944014787674, 0.7782877683639526 ], "eval_math_hard_runtime": 19.1566, "eval_math_hard_samples_per_second": 5.22, "eval_math_hard_steps_per_second": 0.104, "epoch": 1.75, "step": 100 }, { "train_runtime": 1950.9713, "train_samples_per_second": 1.64, "train_steps_per_second": 0.051, "total_flos": 0.0, "train_loss": 0.6416401875019073, "epoch": 1.75, "step": 100 } ]