[ { "loss": 0.6593, "learning_rate": 0.0002, "epoch": 0.03, "step": 1 }, { "loss": 0.4945, "learning_rate": 0.0002, "epoch": 0.05, "step": 2 }, { "loss": 0.3929, "learning_rate": 0.0002, "epoch": 0.08, "step": 3 }, { "loss": 0.2804, "learning_rate": 0.0002, "epoch": 0.11, "step": 4 }, { "loss": 0.276, "learning_rate": 0.0002, "epoch": 0.13, "step": 5 }, { "loss": 0.3343, "learning_rate": 0.0002, "epoch": 0.16, "step": 6 }, { "loss": 0.1975, "learning_rate": 0.0002, "epoch": 0.18, "step": 7 }, { "loss": 0.274, "learning_rate": 0.0002, "epoch": 0.21, "step": 8 }, { "loss": 0.2602, "learning_rate": 0.0002, "epoch": 0.24, "step": 9 }, { "loss": 0.2084, "learning_rate": 0.0002, "epoch": 0.26, "step": 10 }, { "loss": 0.1054, "learning_rate": 0.0002, "epoch": 0.29, "step": 11 }, { "loss": 0.0939, "learning_rate": 0.0002, "epoch": 0.32, "step": 12 }, { "loss": 0.135, "learning_rate": 0.0002, "epoch": 0.34, "step": 13 }, { "loss": 0.0468, "learning_rate": 0.0002, "epoch": 0.37, "step": 14 }, { "loss": 0.2461, "learning_rate": 0.0002, "epoch": 0.39, "step": 15 }, { "loss": 0.1158, "learning_rate": 0.0002, "epoch": 0.42, "step": 16 }, { "loss": 0.3144, "learning_rate": 0.0002, "epoch": 0.45, "step": 17 }, { "loss": 0.1785, "learning_rate": 0.0002, "epoch": 0.47, "step": 18 }, { "loss": 0.1156, "learning_rate": 0.0002, "epoch": 0.5, "step": 19 }, { "loss": 0.0616, "learning_rate": 0.0002, "epoch": 0.53, "step": 20 }, { "loss": 0.0447, "learning_rate": 0.0002, "epoch": 0.55, "step": 21 }, { "loss": 0.0044, "learning_rate": 0.0002, "epoch": 0.58, "step": 22 }, { "loss": 0.0612, "learning_rate": 0.0002, "epoch": 0.61, "step": 23 }, { "loss": 0.0515, "learning_rate": 0.0002, "epoch": 0.63, "step": 24 }, { "loss": 0.0108, "learning_rate": 0.0002, "epoch": 0.66, "step": 25 }, { "eval_code_low_quality_loss": 0.010171000845730305, "eval_code_low_quality_score": -0.0019669600296765566, "eval_code_low_quality_brier_score": 0.0019669600296765566, 
"eval_code_low_quality_average_probability": 0.9910862445831299, "eval_code_low_quality_accuracy": 1.0, "eval_code_low_quality_probabilities": [ 0.9999998807907104, 0.9999998807907104, 0.9999916553497314, 0.9999791383743286, 0.9999998807907104, 0.9999997615814209, 0.9999990463256836, 0.9999992847442627, 0.9999996423721313, 0.9999985694885254, 0.9999996423721313, 0.9999994039535522, 0.9999995231628418, 0.9999998807907104, 0.9999997615814209, 0.9999998807907104, 0.9999974966049194, 0.9999810457229614, 0.9999998807907104, 0.9999997615814209, 0.9999979734420776, 0.9999966621398926, 0.9999923706054688, 0.9999973773956299, 0.9998645782470703, 0.9999245405197144, 0.9626507759094238, 0.9710566401481628, 0.9999980926513672, 0.9999955892562866, 0.9980201721191406, 0.9999994039535522, 0.9999995231628418, 0.9999991655349731, 0.999997615814209, 0.9999970197677612, 0.999995231628418, 0.999994158744812, 0.9999849796295166, 0.9999797344207764, 0.9999872446060181, 0.9999929666519165, 0.9999995231628418, 0.9999985694885254, 0.99998939037323, 0.9999997615814209, 0.9999953508377075, 0.999991774559021, 0.9996731281280518, 0.9995961785316467, 0.9999998807907104, 0.9999998807907104, 0.9999982118606567, 0.9999980926513672, 0.9999994039535522, 0.9999996423721313, 0.9999988079071045, 0.9999992847442627, 0.9999977350234985, 0.9999911785125732, 0.9999998807907104, 0.9999998807907104, 0.9999996423721313, 0.9999990463256836, 0.9917247295379639, 0.9974627494812012, 1.0, 0.9999998807907104, 0.9999998807907104, 0.9999995231628418, 0.9999998807907104, 1.0, 0.9999978542327881, 0.9999996423721313, 0.9999998807907104, 0.9999998807907104, 0.9999954700469971, 0.9999988079071045, 0.8898673057556152, 0.95624178647995, 0.9999982118606567, 0.9999994039535522, 0.9999997615814209, 0.9999995231628418, 0.9999998807907104, 0.9999997615814209, 0.7369291186332703, 0.6688874363899231, 0.9999933242797852, 0.9999909400939941, 0.9999688863754272, 0.9999462366104126, 0.9999872446060181, 0.9999003410339355, 
0.9898979663848877, 0.9894485473632812, 0.9999990463256836, 0.9999994039535522, 0.9648559093475342, 0.992939829826355 ], "eval_code_low_quality_runtime": 108.3354, "eval_code_low_quality_samples_per_second": 0.923, "eval_code_low_quality_steps_per_second": 0.037, "epoch": 0.66, "step": 25 }, { "eval_code_loss": 0.775557279586792, "eval_code_score": -0.21216197311878204, "eval_code_brier_score": 0.21216197311878204, "eval_code_average_probability": 0.6170614361763, "eval_code_accuracy": 0.77, "eval_code_probabilities": [ 0.0018926338525488973, 0.012711296789348125, 0.007091669365763664, 0.6062625646591187, 0.9943353533744812, 0.5690382719039917, 0.6241586208343506, 0.662219226360321, 0.5325962901115417, 0.5391229391098022, 0.7178332805633545, 0.6171442866325378, 0.577951967716217, 0.8548311591148376, 0.7104359865188599, 0.5026382803916931, 0.5293322801589966, 0.5492123365402222, 0.6345873475074768, 0.7990339398384094, 0.5863059163093567, 0.48554468154907227, 0.6499708294868469, 0.5989818572998047, 0.2676376402378082, 0.2834436595439911, 0.28170374035835266, 0.8311360478401184, 0.9110060334205627, 0.9641320109367371, 0.45280739665031433, 0.7613933086395264, 0.5464147329330444, 0.01752450130879879, 0.005836487282067537, 0.006046702619642019, 0.5162467956542969, 0.5298649668693542, 0.5247464179992676, 0.9592331647872925, 0.8196842670440674, 0.7410209774971008, 0.796080470085144, 0.9008417725563049, 0.6857371926307678, 0.5978904962539673, 0.9823793768882751, 0.9868221282958984, 0.5604033470153809, 0.5046380758285522, 0.999763548374176, 0.9999983310699463, 0.9999935626983643, 0.9927141070365906, 0.516162097454071, 0.521334171295166, 0.513815701007843, 0.5127142667770386, 0.5125176906585693, 0.5335236191749573, 0.3885745108127594, 0.449074923992157, 0.43242695927619934, 0.42709216475486755, 0.509745180606842, 0.5419602394104004, 0.9643940329551697, 0.46200674772262573, 0.44968515634536743, 0.7517949342727661, 0.35403740406036377, 0.9996168613433838, 0.43991619348526, 
0.2799178659915924, 0.6076914072036743, 0.9999991655349731, 0.9997984766960144, 0.9999959468841553, 0.9999561309814453, 0.6099094748497009, 0.6852646470069885, 0.8096278309822083, 0.5049552321434021, 0.818763017654419, 0.6465492248535156, 0.5962660312652588, 0.9850568175315857, 0.9976211190223694, 0.9992263317108154, 0.6331233978271484, 0.6343858242034912, 0.49390336871147156, 0.5998658537864685, 0.5048991441726685, 0.507156252861023, 0.5149410367012024, 0.9476234316825867, 0.39861536026000977, 0.34747856855392456, 0.5127823948860168 ], "eval_code_runtime": 105.3963, "eval_code_samples_per_second": 0.949, "eval_code_steps_per_second": 0.038, "epoch": 0.66, "step": 25 }, { "loss": 0.0077, "learning_rate": 0.0002, "epoch": 0.68, "step": 26 }, { "loss": 0.0157, "learning_rate": 0.0002, "epoch": 0.71, "step": 27 }, { "loss": 0.0055, "learning_rate": 0.0002, "epoch": 0.74, "step": 28 }, { "loss": 0.0043, "learning_rate": 0.0002, "epoch": 0.76, "step": 29 }, { "loss": 0.0007, "learning_rate": 0.0002, "epoch": 0.79, "step": 30 }, { "loss": 0.0017, "learning_rate": 0.0002, "epoch": 0.82, "step": 31 }, { "loss": 0.0046, "learning_rate": 0.0002, "epoch": 0.84, "step": 32 }, { "loss": 0.0002, "learning_rate": 0.0002, "epoch": 0.87, "step": 33 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 0.89, "step": 34 }, { "loss": 0.0148, "learning_rate": 0.0002, "epoch": 0.92, "step": 35 }, { "loss": 0.0026, "learning_rate": 0.0002, "epoch": 0.95, "step": 36 }, { "loss": 0.0006, "learning_rate": 0.0002, "epoch": 0.97, "step": 37 }, { "loss": 0.0043, "learning_rate": 0.0002, "epoch": 1.0, "step": 38 }, { "loss": 0.0002, "learning_rate": 0.0002, "epoch": 1.03, "step": 39 }, { "loss": 0.0004, "learning_rate": 0.0002, "epoch": 1.05, "step": 40 }, { "loss": 0.0003, "learning_rate": 0.0002, "epoch": 1.08, "step": 41 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.11, "step": 42 }, { "loss": 0.0095, "learning_rate": 0.0002, "epoch": 1.13, "step": 43 }, { "loss": 0.0001, 
"learning_rate": 0.0002, "epoch": 1.16, "step": 44 }, { "loss": 0.2013, "learning_rate": 0.0002, "epoch": 1.18, "step": 45 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.21, "step": 46 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.24, "step": 47 }, { "loss": 0.0047, "learning_rate": 0.0002, "epoch": 1.26, "step": 48 }, { "loss": 0.0004, "learning_rate": 0.0002, "epoch": 1.29, "step": 49 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.32, "step": 50 }, { "eval_code_low_quality_loss": 0.001378062181174755, "eval_code_low_quality_score": -5.075635272078216e-05, "eval_code_low_quality_brier_score": 5.075635272078216e-05, "eval_code_low_quality_average_probability": 0.9987315535545349, "eval_code_low_quality_accuracy": 1.0, "eval_code_low_quality_probabilities": [ 1.0, 1.0, 1.0, 0.9999997615814209, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 0.9999840259552002, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.967201828956604, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9908334612846375, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999980926513672, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 0.999922513961792, 0.9999967813491821, 0.9999996423721313, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9702784419059753, 0.9449317455291748, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 0.9999991655349731, 1.0 ], "eval_code_low_quality_runtime": 108.1154, "eval_code_low_quality_samples_per_second": 0.925, "eval_code_low_quality_steps_per_second": 0.037, "epoch": 1.32, "step": 50 }, { "eval_code_loss": 1.3461368083953857, "eval_code_score": -0.22116898000240326, "eval_code_brier_score": 0.22116898000240326, "eval_code_average_probability": 0.5982358455657959, "eval_code_accuracy": 0.8, "eval_code_probabilities": [ 4.050308746172959e-07, 2.979102418976254e-06, 2.6617096864356427e-06, 0.5738264918327332, 
0.8691526651382446, 0.5516966581344604, 0.5616106986999512, 0.5491132140159607, 0.5290331244468689, 0.49235308170318604, 0.5810630321502686, 0.5722699761390686, 0.5287314057350159, 0.6949906349182129, 0.5635644197463989, 0.5054471492767334, 0.4994816780090332, 0.5129610896110535, 0.6220285296440125, 0.6764118671417236, 0.5921300649642944, 0.503677248954773, 0.5439413785934448, 0.5423399806022644, 0.431194007396698, 0.42188534140586853, 0.42363011837005615, 0.9709718227386475, 0.9995226860046387, 0.9999279975891113, 0.4847673773765564, 0.5603877305984497, 0.5247597694396973, 3.816174285020679e-06, 1.9298215647722827e-06, 1.9306407921249047e-06, 0.527335524559021, 0.5305987596511841, 0.5162070393562317, 0.946389377117157, 0.8050153255462646, 0.8141985535621643, 0.5671536326408386, 0.6023316383361816, 0.5614919066429138, 0.5858514904975891, 0.9122728705406189, 0.9817299842834473, 0.532357931137085, 0.5182923674583435, 0.9870670437812805, 0.999982476234436, 0.9999992847442627, 0.9999778270721436, 0.5067487359046936, 0.5095696449279785, 0.5025925040245056, 0.4237653911113739, 0.5117032527923584, 0.4223073124885559, 0.6444336175918579, 0.6726469993591309, 0.6397074460983276, 0.7292462587356567, 0.5063377618789673, 0.5283511281013489, 0.706869900226593, 0.46199607849121094, 0.4430694580078125, 0.9500992894172668, 0.22525879740715027, 0.9999823570251465, 0.47554466128349304, 0.51363205909729, 0.6031032800674438, 0.9999370574951172, 0.658456563949585, 0.9959049820899963, 0.902746856212616, 0.5577074289321899, 0.5983836650848389, 0.7882758975028992, 0.5046991109848022, 0.8182088732719421, 0.549981951713562, 0.5202911496162415, 0.9605872631072998, 0.9999349117279053, 0.9999911785125732, 0.7577045559883118, 0.6290202736854553, 0.5034119486808777, 0.569599449634552, 0.503978431224823, 0.507115364074707, 0.5144593715667725, 0.770204484462738, 0.23782096803188324, 0.22504965960979462, 0.5020108222961426 ], "eval_code_runtime": 105.4075, "eval_code_samples_per_second": 0.949, 
"eval_code_steps_per_second": 0.038, "epoch": 1.32, "step": 50 }, { "loss": 0.0015, "learning_rate": 0.0002, "epoch": 1.34, "step": 51 }, { "loss": 0.0049, "learning_rate": 0.0002, "epoch": 1.37, "step": 52 }, { "loss": 0.0119, "learning_rate": 0.0002, "epoch": 1.39, "step": 53 }, { "loss": 0.0028, "learning_rate": 0.0002, "epoch": 1.42, "step": 54 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.45, "step": 55 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.47, "step": 56 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.5, "step": 57 }, { "loss": 0.0024, "learning_rate": 0.0002, "epoch": 1.53, "step": 58 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.55, "step": 59 }, { "loss": 0.0002, "learning_rate": 0.0002, "epoch": 1.58, "step": 60 }, { "loss": 0.0001, "learning_rate": 0.0002, "epoch": 1.61, "step": 61 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.63, "step": 62 }, { "loss": 0.0017, "learning_rate": 0.0002, "epoch": 1.66, "step": 63 }, { "loss": 0.0018, "learning_rate": 0.0002, "epoch": 1.68, "step": 64 }, { "loss": 0.0008, "learning_rate": 0.0002, "epoch": 1.71, "step": 65 }, { "loss": 0.0068, "learning_rate": 0.0002, "epoch": 1.74, "step": 66 }, { "loss": 0.001, "learning_rate": 0.0002, "epoch": 1.76, "step": 67 }, { "loss": 0.0002, "learning_rate": 0.0002, "epoch": 1.79, "step": 68 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.82, "step": 69 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.84, "step": 70 }, { "loss": 0.0006, "learning_rate": 0.0002, "epoch": 1.87, "step": 71 }, { "loss": 0.0003, "learning_rate": 0.0002, "epoch": 1.89, "step": 72 }, { "loss": 0.1335, "learning_rate": 0.0002, "epoch": 1.92, "step": 73 }, { "loss": 0.0001, "learning_rate": 0.0002, "epoch": 1.95, "step": 74 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.97, "step": 75 }, { "eval_code_low_quality_loss": 0.0005032618064433336, "eval_code_low_quality_score": -1.0583773473626934e-05, "eval_code_low_quality_brier_score": 
1.0583773473626934e-05, "eval_code_low_quality_average_probability": 0.9995136857032776, "eval_code_low_quality_accuracy": 1.0, "eval_code_low_quality_probabilities": [ 1.0, 0.9999967813491821, 0.9999997615814209, 0.9983976483345032, 1.0, 0.9999837875366211, 1.0, 0.9997871518135071, 1.0, 1.0, 1.0, 1.0, 0.9918645620346069, 1.0, 1.0, 1.0, 0.9998249411582947, 0.998837411403656, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999996423721313, 1.0, 1.0, 1.0, 0.9688511490821838, 0.9999998807907104, 1.0, 0.9999991655349731, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9999998807907104, 1.0, 0.999982476234436, 0.9999701976776123, 0.995941698551178, 0.9999995231628418, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999868869781494, 0.9999997615814209, 0.9999061822891235, 1.0, 1.0, 0.9999092817306519, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999996423721313, 0.9999997615814209, 1.0, 0.9999204874038696, 1.0, 1.0, 1.0, 0.9989272952079773, 1.0, 0.9999998807907104, 1.0, 0.9994589686393738, 1.0, 0.9999996423721313, 1.0, 1.0, 1.0, 0.9999737739562988, 0.999944806098938, 0.9999998807907104, 0.9999788999557495, 1.0, 1.0, 1.0, 0.9999411106109619, 1.0, 1.0, 1.0, 1.0, 0.9999876022338867, 1.0 ], "eval_code_low_quality_runtime": 108.2376, "eval_code_low_quality_samples_per_second": 0.924, "eval_code_low_quality_steps_per_second": 0.037, "epoch": 1.97, "step": 75 }, { "eval_code_loss": 1.5990806818008423, "eval_code_score": -0.2409353256225586, "eval_code_brier_score": 0.2409353256225586, "eval_code_average_probability": 0.5683663487434387, "eval_code_accuracy": 0.8, "eval_code_probabilities": [ 1.1873796168515582e-08, 5.058638308241825e-08, 6.313541689451085e-08, 0.5709640979766846, 0.6853320002555847, 0.5568627715110779, 0.5487821102142334, 0.5347866415977478, 0.5317322611808777, 0.512122631072998, 0.5734414458274841, 0.5738123059272766, 0.5303495526313782, 0.6757323741912842, 0.6369258165359497, 0.5054691433906555, 0.4862286150455475, 0.4997119903564453, 
0.5902368426322937, 0.6018257737159729, 0.541638970375061, 0.5033149123191833, 0.5362597703933716, 0.5289673209190369, 0.24309313297271729, 0.22363527119159698, 0.22765608131885529, 0.7798057794570923, 0.9960242509841919, 0.9997923970222473, 0.5013885498046875, 0.528499186038971, 0.5185747146606445, 4.462568199414818e-07, 2.2847591196750727e-07, 2.316882046216051e-07, 0.5187056660652161, 0.5277567505836487, 0.510230541229248, 0.9069125056266785, 0.8473342061042786, 0.8101637363433838, 0.537501335144043, 0.5229093432426453, 0.5179290175437927, 0.594524621963501, 0.8149073123931885, 0.9026350378990173, 0.5351212024688721, 0.5195194482803345, 0.9832677245140076, 0.9752768874168396, 0.9901442527770996, 0.9911841154098511, 0.5086742043495178, 0.5045136213302612, 0.5005779266357422, 0.4479965567588806, 0.5039933919906616, 0.44930532574653625, 0.5485993027687073, 0.6136952042579651, 0.5874925255775452, 0.6819684505462646, 0.5115750432014465, 0.5058901309967041, 0.7632222771644592, 0.3942977488040924, 0.3785106837749481, 0.8528256416320801, 0.5036994814872742, 0.9950182437896729, 0.48869040608406067, 0.5160850882530212, 0.5451788306236267, 0.9758601188659668, 0.44595080614089966, 0.8039615750312805, 0.8271895051002502, 0.5377886891365051, 0.5619093775749207, 0.8048967123031616, 0.502302885055542, 0.766408383846283, 0.5268206000328064, 0.5031132102012634, 0.8771815896034241, 0.9855904579162598, 0.9990859031677246, 0.6270195841789246, 0.55865478515625, 0.5030545592308044, 0.5426568984985352, 0.5039815306663513, 0.5092061758041382, 0.5093463659286499, 0.4080256521701813, 0.24740169942378998, 0.2555961608886719, 0.5028347373008728 ], "eval_code_runtime": 105.2631, "eval_code_samples_per_second": 0.95, "eval_code_steps_per_second": 0.038, "epoch": 1.97, "step": 75 }, { "loss": 0.012, "learning_rate": 0.0002, "epoch": 2.0, "step": 76 }, { "loss": 0.0006, "learning_rate": 0.0002, "epoch": 2.03, "step": 77 }, { "loss": 0.0006, "learning_rate": 0.0002, "epoch": 2.05, "step": 78 }, 
{ "loss": 0.0006, "learning_rate": 0.0002, "epoch": 2.08, "step": 79 }, { "loss": 0.0001, "learning_rate": 0.0002, "epoch": 2.11, "step": 80 }, { "loss": 0.005, "learning_rate": 0.0002, "epoch": 2.13, "step": 81 }, { "loss": 0.0007, "learning_rate": 0.0002, "epoch": 2.16, "step": 82 }, { "loss": 0.0002, "learning_rate": 0.0002, "epoch": 2.18, "step": 83 }, { "loss": 0.0019, "learning_rate": 0.0002, "epoch": 2.21, "step": 84 }, { "loss": 0.0007, "learning_rate": 0.0002, "epoch": 2.24, "step": 85 }, { "loss": 0.0014, "learning_rate": 0.0002, "epoch": 2.26, "step": 86 }, { "loss": 0.0005, "learning_rate": 0.0002, "epoch": 2.29, "step": 87 }, { "loss": 0.001, "learning_rate": 0.0002, "epoch": 2.32, "step": 88 }, { "loss": 0.0006, "learning_rate": 0.0002, "epoch": 2.34, "step": 89 }, { "loss": 0.0004, "learning_rate": 0.0002, "epoch": 2.37, "step": 90 }, { "loss": 0.0001, "learning_rate": 0.0002, "epoch": 2.39, "step": 91 }, { "loss": 0.0006, "learning_rate": 0.0002, "epoch": 2.42, "step": 92 }, { "loss": 0.0028, "learning_rate": 0.0002, "epoch": 2.45, "step": 93 }, { "loss": 0.0001, "learning_rate": 0.0002, "epoch": 2.47, "step": 94 }, { "loss": 0.0024, "learning_rate": 0.0002, "epoch": 2.5, "step": 95 }, { "loss": 0.0059, "learning_rate": 0.0002, "epoch": 2.53, "step": 96 }, { "loss": 0.0001, "learning_rate": 0.0002, "epoch": 2.55, "step": 97 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 2.58, "step": 98 }, { "loss": 0.0003, "learning_rate": 0.0002, "epoch": 2.61, "step": 99 }, { "loss": 0.0003, "learning_rate": 0.0002, "epoch": 2.63, "step": 100 }, { "eval_code_low_quality_loss": 6.671607116004452e-05, "eval_code_low_quality_score": -3.4999186482309597e-07, "eval_code_low_quality_brier_score": 3.4999186482309597e-07, "eval_code_low_quality_average_probability": 0.9999365210533142, "eval_code_low_quality_accuracy": 1.0, "eval_code_low_quality_probabilities": [ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999998927116394, 1.0, 1.0, 1.0, 1.0, 
0.9999990463256836, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9996960163116455, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9940925240516663, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999995231628418, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999983310699463, 1.0, 1.0, 1.0, 0.9999991655349731, 1.0, 0.9999901056289673, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999704360961914, 0.999913215637207, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0 ], "eval_code_low_quality_runtime": 108.4514, "eval_code_low_quality_samples_per_second": 0.922, "eval_code_low_quality_steps_per_second": 0.037, "epoch": 2.63, "step": 100 }, { "eval_code_loss": 1.2588822841644287, "eval_code_score": -0.24486389756202698, "eval_code_brier_score": 0.24486389756202698, "eval_code_average_probability": 0.6122177839279175, "eval_code_accuracy": 0.78, "eval_code_probabilities": [ 3.716594960678776e-07, 4.86033532069996e-05, 5.94538141740486e-05, 0.7322285175323486, 0.992759108543396, 0.6937164068222046, 0.6719813346862793, 0.5284847021102905, 0.5714943408966064, 0.5305595397949219, 0.7621225118637085, 0.7049319744110107, 0.5994599461555481, 0.9482231736183167, 0.9427314400672913, 0.5233908295631409, 0.5151730179786682, 0.5592909455299377, 0.6389124989509583, 0.7489423155784607, 0.5400505661964417, 0.4894372224807739, 0.7627068758010864, 0.676575243473053, 0.001497809775173664, 0.0012255371548235416, 0.0013199239037930965, 0.9070805907249451, 0.9999668598175049, 0.9999922513961792, 0.48677918314933777, 0.6579598784446716, 0.5528249740600586, 0.0031468200031667948, 0.0008608169737271965, 0.0007525159744545817, 0.628882110118866, 0.5596430897712708, 0.5554695725440979, 0.9984580278396606, 0.989458441734314, 0.9929828643798828, 0.7459701895713806, 0.8483384251594543, 0.5955826044082642, 0.8648329377174377, 0.9960275888442993, 0.9993523955345154, 
0.5829755067825317, 0.6307886838912964, 0.994866132736206, 0.9999991655349731, 0.9999984502792358, 0.9999934434890747, 0.5436527132987976, 0.5340330600738525, 0.5099152326583862, 0.5169093608856201, 0.5082399249076843, 0.5305851697921753, 0.0689636766910553, 0.09695249050855637, 0.09122244268655777, 0.4549616277217865, 0.5240060091018677, 0.539696216583252, 0.9665416479110718, 0.2522982358932495, 0.24534465372562408, 0.905021071434021, 0.31865352392196655, 0.999656081199646, 0.4672524631023407, 0.5117397308349609, 0.5817976593971252, 0.9999037981033325, 0.9686040282249451, 0.9996315240859985, 0.996566653251648, 0.7026336789131165, 0.7814198732376099, 0.8912621140480042, 0.5140696167945862, 0.9321841597557068, 0.673382580280304, 0.6223154664039612, 0.9992823004722595, 0.9998123049736023, 0.9999938011169434, 0.697952926158905, 0.7329107522964478, 0.4842481017112732, 0.6284154057502747, 0.5115850567817688, 0.525327205657959, 0.5679951310157776, 0.5145466923713684, 0.02526971884071827, 0.02999242953956127, 0.5247264504432678 ], "eval_code_runtime": 105.3153, "eval_code_samples_per_second": 0.95, "eval_code_steps_per_second": 0.038, "epoch": 2.63, "step": 100 }, { "loss": 0.0001, "learning_rate": 0.0002, "epoch": 2.66, "step": 101 }, { "loss": 0.0009, "learning_rate": 0.0002, "epoch": 2.68, "step": 102 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 2.71, "step": 103 }, { "loss": 0.0002, "learning_rate": 0.0002, "epoch": 2.74, "step": 104 }, { "loss": 0.0016, "learning_rate": 0.0002, "epoch": 2.76, "step": 105 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 2.79, "step": 106 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 2.82, "step": 107 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 2.84, "step": 108 }, { "loss": 0.0005, "learning_rate": 0.0002, "epoch": 2.87, "step": 109 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 2.89, "step": 110 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 2.92, "step": 111 }, { "loss": 0.0, "learning_rate": 
0.0002, "epoch": 2.95, "step": 112 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 2.97, "step": 113 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.0, "step": 114 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.03, "step": 115 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.05, "step": 116 }, { "loss": 0.0001, "learning_rate": 0.0002, "epoch": 3.08, "step": 117 }, { "loss": 0.0002, "learning_rate": 0.0002, "epoch": 3.11, "step": 118 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.13, "step": 119 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.16, "step": 120 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.18, "step": 121 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.21, "step": 122 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.24, "step": 123 }, { "loss": 0.0001, "learning_rate": 0.0002, "epoch": 3.26, "step": 124 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.29, "step": 125 }, { "eval_code_low_quality_loss": 0.0007014500442892313, "eval_code_low_quality_score": -3.61457969120238e-05, "eval_code_low_quality_brier_score": 3.61457969120238e-05, "eval_code_low_quality_average_probability": 0.9993457198143005, "eval_code_low_quality_accuracy": 1.0, "eval_code_low_quality_probabilities": [ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999996423721313, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 0.9999995231628418, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 0.9399757981300354, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.99994957447052, 0.9999979734420776, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999996423721313, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9985740184783936, 0.9999673366546631, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9990741014480591, 0.9970368146896362, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9999984502792358, 1.0, 1.0, 1.0, 1.0 ], 
"eval_code_low_quality_runtime": 108.4065, "eval_code_low_quality_samples_per_second": 0.922, "eval_code_low_quality_steps_per_second": 0.037, "epoch": 3.29, "step": 125 }, { "eval_code_loss": 1.043724775314331, "eval_code_score": -0.21790370345115662, "eval_code_brier_score": 0.21790370345115662, "eval_code_average_probability": 0.6578189134597778, "eval_code_accuracy": 0.77, "eval_code_probabilities": [ 2.9980761610204354e-05, 0.16327866911888123, 0.1223980113863945, 0.8630220293998718, 0.9999371767044067, 0.8081788420677185, 0.7690643668174744, 0.4431692361831665, 0.6145693063735962, 0.5692129731178284, 0.8545891046524048, 0.7837128043174744, 0.678038477897644, 0.9840186238288879, 0.9795506000518799, 0.541788637638092, 0.5379593372344971, 0.6108262538909912, 0.6568173766136169, 0.9312652349472046, 0.5693832039833069, 0.491776704788208, 0.865976095199585, 0.7813358306884766, 1.2309145859035198e-05, 9.09055961528793e-06, 1.0214143912889995e-05, 0.9485948085784912, 0.9997069239616394, 0.999749481678009, 0.45955172181129456, 0.8172199726104736, 0.5752690434455872, 0.6527258157730103, 0.2048613727092743, 0.13845929503440857, 0.7823963761329651, 0.6123839616775513, 0.6217948198318481, 0.9999850988388062, 0.999450147151947, 0.9998420476913452, 0.9847567677497864, 0.9996198415756226, 0.6785285472869873, 0.9706732630729675, 0.9999459981918335, 0.9999982118606567, 0.6881040930747986, 0.7350975871086121, 0.9948760867118835, 1.0, 1.0, 1.0, 0.5983561873435974, 0.5580247640609741, 0.5120639801025391, 0.5918711423873901, 0.5148324370384216, 0.6228303909301758, 0.006977998651564121, 0.011295206844806671, 0.012422475032508373, 0.4554630219936371, 0.5428009033203125, 0.5566087961196899, 0.9991586208343506, 0.11367473751306534, 0.12123917788267136, 0.9770430326461792, 0.1478639841079712, 0.9995866417884827, 0.4416849911212921, 0.491413414478302, 0.6343856453895569, 0.9999972581863403, 0.9927133917808533, 0.9999967813491821, 0.9998946189880371, 0.8279895186424255, 
0.914436936378479, 0.9620551466941833, 0.5265487432479858, 0.9861032962799072, 0.8208467960357666, 0.7353063821792603, 0.9999938011169434, 0.9998844861984253, 0.999961256980896, 0.8301354050636292, 0.8745093941688538, 0.46109309792518616, 0.7134401798248291, 0.5036332011222839, 0.5366954207420349, 0.6171916127204895, 0.5420334339141846, 0.0013571635354310274, 0.0021216413006186485, 0.5408289432525635 ], "eval_code_runtime": 105.5069, "eval_code_samples_per_second": 0.948, "eval_code_steps_per_second": 0.038, "epoch": 3.29, "step": 125 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.32, "step": 126 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.34, "step": 127 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.37, "step": 128 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.39, "step": 129 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.42, "step": 130 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.45, "step": 131 }, { "loss": 0.0004, "learning_rate": 0.0002, "epoch": 3.47, "step": 132 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.5, "step": 133 }, { "loss": 0.08, "learning_rate": 0.0002, "epoch": 3.53, "step": 134 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.55, "step": 135 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.58, "step": 136 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.61, "step": 137 }, { "loss": 0.0001, "learning_rate": 0.0002, "epoch": 3.63, "step": 138 }, { "loss": 0.001, "learning_rate": 0.0002, "epoch": 3.66, "step": 139 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.68, "step": 140 }, { "loss": 0.0001, "learning_rate": 0.0002, "epoch": 3.71, "step": 141 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 3.74, "step": 142 }, { "loss": 0.0003, "learning_rate": 0.0002, "epoch": 3.76, "step": 143 }, { "loss": 0.0114, "learning_rate": 0.0002, "epoch": 3.79, "step": 144 }, { "loss": 0.006, "learning_rate": 0.0002, "epoch": 3.82, "step": 145 }, { "loss": 0.0011, "learning_rate": 
0.0002, "epoch": 3.84, "step": 146 }, { "loss": 0.0042, "learning_rate": 0.0002, "epoch": 3.87, "step": 147 }, { "loss": 0.0015, "learning_rate": 0.0002, "epoch": 3.89, "step": 148 }, { "loss": 0.0003, "learning_rate": 0.0002, "epoch": 3.92, "step": 149 }, { "loss": 0.0001, "learning_rate": 0.0002, "epoch": 3.95, "step": 150 }, { "eval_code_low_quality_loss": 0.00038435429451055825, "eval_code_low_quality_score": -6.823713192716241e-06, "eval_code_low_quality_brier_score": 6.823713192716241e-06, "eval_code_low_quality_average_probability": 0.9996289014816284, "eval_code_low_quality_accuracy": 1.0, "eval_code_low_quality_probabilities": [ 1.0, 1.0, 1.0, 0.9999984502792358, 1.0, 1.0, 0.9999983310699463, 0.9999969005584717, 1.0, 1.0, 1.0, 1.0, 0.9999916553497314, 1.0, 1.0, 1.0, 0.9999995231628418, 0.9999638795852661, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999983310699463, 1.0, 1.0, 1.0, 0.9766356945037842, 0.9999997615814209, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9885169267654419, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999992847442627, 1.0, 1.0, 1.0, 0.9999996423721313, 1.0, 0.9999995231628418, 1.0, 0.9999998807907104, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999713897705078, 0.9978513717651367, 0.9999997615814209, 0.9999988079071045, 1.0, 1.0, 1.0, 0.9999997615814209, 1.0, 1.0, 1.0, 1.0, 0.9999719858169556, 1.0 ], "eval_code_low_quality_runtime": 108.3342, "eval_code_low_quality_samples_per_second": 0.923, "eval_code_low_quality_steps_per_second": 0.037, "epoch": 3.95, "step": 150 }, { "eval_code_loss": 2.0963048934936523, "eval_code_score": -0.2217760533094406, "eval_code_brier_score": 0.2217760533094406, "eval_code_average_probability": 0.6159726977348328, "eval_code_accuracy": 0.76, "eval_code_probabilities": [ 3.5287172489573138e-12, 5.817486076198364e-11, 1.8693878389708374e-10, 0.765636146068573, 0.9234081506729126, 
0.7391408085823059, 0.659432590007782, 0.6729235053062439, 0.5623210668563843, 0.5150139331817627, 0.8085805177688599, 0.7596898674964905, 0.5972597002983093, 0.9820079803466797, 0.9745085835456848, 0.5273155570030212, 0.5324531197547913, 0.5789834260940552, 0.7247386574745178, 0.7544905543327332, 0.5884762406349182, 0.4842914938926697, 0.8123393058776855, 0.7054367661476135, 0.09308263659477234, 0.08973666280508041, 0.09202855080366135, 0.7089231014251709, 0.9720393419265747, 0.9964279532432556, 0.49923038482666016, 0.6134451031684875, 0.5499404072761536, 6.11895881186264e-11, 1.4576943818678245e-11, 1.735799351476608e-11, 0.6023713946342468, 0.553157389163971, 0.5503317713737488, 0.9796992540359497, 0.9182886481285095, 0.8607842922210693, 0.6422979831695557, 0.6638745665550232, 0.6075322031974792, 0.7293029427528381, 0.9844130873680115, 0.993526816368103, 0.547633707523346, 0.6227739453315735, 0.9998313188552856, 0.9999940395355225, 0.9999951124191284, 0.9999775886535645, 0.5366966128349304, 0.5250415802001953, 0.5051754117012024, 0.48833295702934265, 0.5131838321685791, 0.5317294597625732, 0.29897043108940125, 0.3597976565361023, 0.32535555958747864, 0.4676964282989502, 0.526648998260498, 0.548362672328949, 0.6692071557044983, 0.35373201966285706, 0.3534887731075287, 0.6637941002845764, 0.47728481888771057, 0.9986295700073242, 0.46758249402046204, 0.5160676836967468, 0.5609508156776428, 0.9999833106994629, 0.9855866432189941, 0.9997468590736389, 0.9985565543174744, 0.7168160080909729, 0.7617760300636292, 0.7155187726020813, 0.4970121681690216, 0.8666588664054871, 0.6338189840316772, 0.5993514060974121, 0.9967523813247681, 0.9662074446678162, 0.9995986819267273, 0.5130647420883179, 0.7217807173728943, 0.4925132691860199, 0.5792981386184692, 0.5104650259017944, 0.5129127502441406, 0.5114725828170776, 0.8539605140686035, 0.19493471086025238, 0.22762958705425262, 0.5150301456451416 ], "eval_code_runtime": 105.5057, "eval_code_samples_per_second": 0.948, 
"eval_code_steps_per_second": 0.038, "epoch": 3.95, "step": 150 }, { "train_runtime": 14494.0652, "train_samples_per_second": 0.331, "train_steps_per_second": 0.01, "total_flos": 0.0, "train_loss": 0.03708522860984015, "epoch": 3.95, "step": 150 } ]