[ { "loss": 0.6935, "learning_rate": 0.0002, "epoch": 0.02, "step": 1 }, { "loss": 0.6301, "learning_rate": 0.0002, "epoch": 0.04, "step": 2 }, { "loss": 0.6073, "learning_rate": 0.0002, "epoch": 0.05, "step": 3 }, { "loss": 0.5667, "learning_rate": 0.0002, "epoch": 0.07, "step": 4 }, { "loss": 0.4627, "learning_rate": 0.0002, "epoch": 0.09, "step": 5 }, { "loss": 0.4737, "learning_rate": 0.0002, "epoch": 0.11, "step": 6 }, { "loss": 0.3356, "learning_rate": 0.0002, "epoch": 0.12, "step": 7 }, { "loss": 0.27, "learning_rate": 0.0002, "epoch": 0.14, "step": 8 }, { "loss": 0.28, "learning_rate": 0.0002, "epoch": 0.16, "step": 9 }, { "loss": 0.3491, "learning_rate": 0.0002, "epoch": 0.18, "step": 10 }, { "loss": 0.2803, "learning_rate": 0.0002, "epoch": 0.19, "step": 11 }, { "loss": 0.1596, "learning_rate": 0.0002, "epoch": 0.21, "step": 12 }, { "loss": 0.1118, "learning_rate": 0.0002, "epoch": 0.23, "step": 13 }, { "loss": 0.2215, "learning_rate": 0.0002, "epoch": 0.25, "step": 14 }, { "loss": 0.0815, "learning_rate": 0.0002, "epoch": 0.26, "step": 15 }, { "loss": 0.1581, "learning_rate": 0.0002, "epoch": 0.28, "step": 16 }, { "loss": 0.1447, "learning_rate": 0.0002, "epoch": 0.3, "step": 17 }, { "loss": 0.0793, "learning_rate": 0.0002, "epoch": 0.32, "step": 18 }, { "loss": 0.0634, "learning_rate": 0.0002, "epoch": 0.33, "step": 19 }, { "loss": 0.0868, "learning_rate": 0.0002, "epoch": 0.35, "step": 20 }, { "loss": 0.1339, "learning_rate": 0.0002, "epoch": 0.37, "step": 21 }, { "loss": 0.0436, "learning_rate": 0.0002, "epoch": 0.39, "step": 22 }, { "loss": 0.0326, "learning_rate": 0.0002, "epoch": 0.4, "step": 23 }, { "loss": 0.0309, "learning_rate": 0.0002, "epoch": 0.42, "step": 24 }, { "loss": 0.4613, "learning_rate": 0.0002, "epoch": 0.44, "step": 25 }, { "eval_code_easy_loss": 0.22846165299415588, "eval_code_easy_score": -0.034886911511421204, "eval_code_easy_brier_score": 0.034886911511421204, "eval_code_easy_average_probability": 0.9493436217308044, "eval_code_easy_accuracy": 0.96, "eval_code_easy_probabilities": [ 1.0, 1.0, 0.9999986886978149, 0.9999988079071045, 0.9999972581863403, 0.9999972581863403, 0.8807934522628784, 0.9996591806411743, 1.0, 0.9997110962867737, 0.996894359588623, 0.9885761141777039, 0.9846639037132263, 0.9999998807907104, 0.9999992847442627, 0.9217069745063782, 0.9999998807907104, 0.9999992847442627, 0.9999531507492065, 0.971138596534729, 0.9644115567207336, 0.9999998807907104, 0.9999998807907104, 0.9999996423721313, 1.0, 1.0, 0.9992501139640808, 0.9999996423721313, 0.999998927116394, 0.9999997615814209, 0.9999358654022217, 0.9999948740005493, 0.9999706745147705, 0.9182361364364624, 0.9777969717979431, 0.7950476408004761, 0.07089971750974655, 0.9999998807907104, 0.9611170887947083, 0.999824583530426, 0.9999998807907104, 0.9999997615814209, 0.9999994039535522, 0.9999918937683105, 0.9999996423721313, 0.9999992847442627, 0.9999583959579468, 0.9999964237213135, 0.9999970197677612, 1.0, 0.9999992847442627, 0.7631391286849976, 0.9999997615814209, 0.9999998807907104, 1.0, 1.0, 1.0, 0.9999991655349731, 0.4372449815273285, 0.9999960660934448, 0.9999992847442627, 1.0, 0.989567220211029, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.6681390404701233, 1.02999701994122e-05, 0.0022490699775516987, 1.0, 1.0, 0.9999945163726807, 0.9999951124191284, 0.999752938747406, 0.9999997615814209, 1.0, 1.0, 1.0, 0.9668532013893127, 0.9999983310699463, 0.9879446029663086, 0.9999827146530151, 1.0, 0.9999997615814209, 0.9972673654556274, 0.9581230878829956, 0.9999821186065674, 0.9999935626983643, 0.7346240282058716, 0.9999959468841553, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999996423721313 ], "eval_code_easy_runtime": 41.4523, "eval_code_easy_samples_per_second": 2.412, "eval_code_easy_steps_per_second": 0.096, "epoch": 0.44, "step": 25 }, { "eval_code_hard_loss": 0.8444641828536987, "eval_code_hard_score": -0.21481266617774963, "eval_code_hard_brier_score": 0.21481266617774963, "eval_code_hard_average_probability": 0.6489911675453186, "eval_code_hard_accuracy": 0.71, "eval_code_hard_probabilities": [ 0.9999761581420898, 0.4704570770263672, 0.38770198822021484, 0.9957898259162903, 0.9971027970314026, 0.6636011004447937, 0.3829995095729828, 0.4488725960254669, 0.3862934112548828, 0.4944641590118408, 0.6597261428833008, 0.5888834595680237, 0.9994460940361023, 0.00023105263244360685, 9.57881347858347e-05, 0.9383717179298401, 0.9582164287567139, 0.9960324168205261, 0.0013776113046333194, 0.004925197456032038, 0.0024418227840214968, 0.9448224306106567, 0.8293406367301941, 0.990691065788269, 0.6144397258758545, 0.37276336550712585, 0.7497667670249939, 0.9995079040527344, 0.8595492243766785, 0.8565853238105774, 0.9049152731895447, 0.842837393283844, 0.7425481081008911, 0.9970250725746155, 0.9908040761947632, 0.9856406450271606, 0.23333661258220673, 0.3644156754016876, 0.9999799728393555, 0.5256256461143494, 0.4714035987854004, 0.5990293622016907, 0.7481530904769897, 0.6265391111373901, 0.7847771644592285, 0.9998830556869507, 0.4729439914226532, 0.5146611332893372, 0.9899987578392029, 0.999963641166687, 0.9999411106109619, 0.017366401851177216, 0.25775712728500366, 0.9997989535331726, 0.2128974348306656, 0.27310115098953247, 0.6709675192832947, 0.5412147045135498, 0.5308579206466675, 0.5533190369606018, 0.11031078547239304, 0.0799262598156929, 0.12423858046531677, 0.6619316339492798, 0.6491618156433105, 0.9998986721038818, 0.5845221281051636, 0.9992774128913879, 0.7275769710540771, 0.9403572082519531, 0.9309749007225037, 0.871741771697998, 0.9114173650741577, 0.9771295189857483, 0.9557876586914062, 0.9182456135749817, 0.32342132925987244, 0.5013740062713623, 0.5234308242797852, 0.5439746975898743, 0.5095937252044678, 0.7398637533187866, 0.7255550026893616, 0.7406316995620728, 0.984710156917572, 0.9945735335350037, 0.9810420274734497, 0.5697446465492249, 0.6282893419265747, 0.6032753586769104, 0.40384215116500854, 0.26884448528289795, 0.45188671350479126, 0.6884511709213257, 0.4971124827861786, 0.6430377960205078, 0.6951863169670105, 0.8902100920677185, 0.13663697242736816, 0.9657577872276306 ], "eval_code_hard_runtime": 140.0766, "eval_code_hard_samples_per_second": 0.714, "eval_code_hard_steps_per_second": 0.029, "epoch": 0.44, "step": 25 }, { "loss": 0.1113, "learning_rate": 0.0002, "epoch": 0.46, "step": 26 }, { "loss": 0.0564, "learning_rate": 0.0002, "epoch": 0.47, "step": 27 }, { "loss": 0.0685, "learning_rate": 0.0002, "epoch": 0.49, "step": 28 }, { "loss": 0.1366, "learning_rate": 0.0002, "epoch": 0.51, "step": 29 }, { "loss": 0.0012, "learning_rate": 0.0002, "epoch": 0.53, "step": 30 }, { "loss": 0.0288, "learning_rate": 0.0002, "epoch": 0.54, "step": 31 }, { "loss": 0.0287, "learning_rate": 0.0002, "epoch": 0.56, "step": 32 }, { "loss": 0.0668, "learning_rate": 0.0002, "epoch": 0.58, "step": 33 }, { "loss": 0.0054, "learning_rate": 0.0002, "epoch": 0.6, "step": 34 }, { "loss": 0.0058, "learning_rate": 0.0002, "epoch": 0.61, "step": 35 }, { "loss": 0.1321, "learning_rate": 0.0002, "epoch": 0.63, "step": 36 }, { "loss": 0.0438, "learning_rate": 0.0002, "epoch": 0.65, "step": 37 }, { "loss": 0.035, "learning_rate": 0.0002, "epoch": 0.67, "step": 38 }, { "loss": 0.03, "learning_rate": 0.0002, "epoch": 0.68, "step": 39 }, { "loss": 0.0043, "learning_rate": 0.0002, "epoch": 0.7, "step": 40 }, { "loss": 0.0158, "learning_rate": 0.0002, "epoch": 0.72, "step": 41 }, { "loss": 0.0097, "learning_rate": 0.0002, "epoch": 0.74, "step": 42 }, { "loss": 0.0104, "learning_rate": 0.0002, "epoch": 0.75, "step": 43 }, { "loss": 0.0854, "learning_rate": 0.0002, "epoch": 0.77, "step": 44 }, { "loss": 0.0115, "learning_rate": 0.0002, "epoch": 0.79, "step": 45 }, { "loss": 0.0903, "learning_rate": 0.0002, "epoch": 0.81, "step": 46 }, { "loss": 0.0082, "learning_rate": 0.0002, "epoch": 0.82, "step": 47 }, { "loss": 0.0841, "learning_rate": 0.0002, "epoch": 0.84, "step": 48 }, { "loss": 0.0379, "learning_rate": 0.0002, "epoch": 0.86, "step": 49 }, { "loss": 0.1163, "learning_rate": 0.0002, "epoch": 0.88, "step": 50 }, { "eval_code_easy_loss": 0.28712284564971924, "eval_code_easy_score": -0.026069259271025658, "eval_code_easy_brier_score": 0.026069259271025658, "eval_code_easy_average_probability": 0.9709805250167847, "eval_code_easy_accuracy": 0.97, "eval_code_easy_probabilities": [ 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999997615814209, 0.9602830410003662, 1.0, 1.0, 0.9999963045120239, 0.999914288520813, 0.9999732971191406, 0.9999974966049194, 1.0, 1.0, 0.9866946935653687, 1.0, 1.0, 0.9999997615814209, 0.9994608759880066, 0.9999551773071289, 1.0, 1.0, 1.0, 1.0, 1.0, 0.999995231628418, 0.9999997615814209, 0.9999998807907104, 1.0, 0.9999250173568726, 0.9999978542327881, 0.9999946355819702, 0.9998421669006348, 0.9999990463256836, 0.9997969269752502, 0.9818890690803528, 1.0, 0.9999922513961792, 0.9999998807907104, 0.9999998807907104, 0.9999998807907104, 1.0, 1.0, 1.0, 0.9997735619544983, 0.9998974800109863, 0.9999257326126099, 0.9999967813491821, 0.9999998807907104, 0.9999998807907104, 0.9922711849212646, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.223012313246727, 0.9999998807907104, 1.0, 1.0, 0.9999990463256836, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9665756225585938, 4.0422314384613856e-08, 4.318383798818104e-05, 1.0, 1.0, 1.0, 0.9998561143875122, 0.999182403087616, 0.9999680519104004, 1.0, 1.0, 1.0, 0.9999822378158569, 1.0, 1.0, 0.9959767460823059, 0.9999539852142334, 0.9995007514953613, 0.9999942779541016, 0.9996492862701416, 0.9998260140419006, 1.0, 0.9949652552604675, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0 ], "eval_code_easy_runtime": 41.3563, "eval_code_easy_samples_per_second": 2.418, "eval_code_easy_steps_per_second": 0.097, "epoch": 0.88, "step": 50 }, { "eval_code_hard_loss": 0.9237764477729797, "eval_code_hard_score": -0.20848987996578217, "eval_code_hard_brier_score": 0.20848987996578217, "eval_code_hard_average_probability": 0.683417558670044, "eval_code_hard_accuracy": 0.71, "eval_code_hard_probabilities": [ 0.9991462230682373, 0.39208656549453735, 0.4176894426345825, 0.999220609664917, 0.9982213377952576, 0.9070152640342712, 0.15849868953227997, 0.28745439648628235, 0.3027569651603699, 0.24870805442333221, 0.7417134642601013, 0.5444478392601013, 0.9999140501022339, 0.0021548818331211805, 0.00024593042326159775, 0.9696754217147827, 0.9635093212127686, 0.9924002885818481, 0.00320712779648602, 0.004237341228872538, 0.000593981530983001, 0.9999964237213135, 0.9995344877243042, 0.999998927116394, 0.6726424098014832, 0.20489203929901123, 0.906218409538269, 0.1464991718530655, 0.8866965770721436, 0.9025827050209045, 0.9838942885398865, 0.9865344762802124, 0.4193040132522583, 0.9865899085998535, 0.9603983759880066, 0.958928644657135, 0.6753811240196228, 0.573758602142334, 0.6913469433784485, 0.3839159607887268, 0.42377495765686035, 0.9371411204338074, 0.997376561164856, 0.9381016492843628, 0.9976379871368408, 0.9994822144508362, 0.5902647376060486, 0.583461582660675, 0.9944129586219788, 0.9991785883903503, 0.9986459612846375, 0.012307150289416313, 0.8033295273780823, 0.9979121088981628, 0.00042291387217119336, 0.0005228969966992736, 0.00923232827335596, 0.7242734432220459, 0.6451666951179504, 0.7488073110580444, 0.3765398859977722, 0.14819785952568054, 0.39486005902290344, 0.6967870593070984, 0.8443142175674438, 0.9988842606544495, 0.9835836291313171, 0.9990014433860779, 0.9992020726203918, 0.9539203643798828, 0.9750897288322449, 0.850548267364502, 0.8060330152511597, 0.9476742744445801, 0.9418892860412598, 0.9725985527038574, 0.17615075409412384, 0.5268995761871338, 0.5463316440582275, 0.7340309023857117, 0.45826229453086853, 0.758548378944397, 0.9831669926643372, 0.8220421671867371, 0.9986447691917419, 0.9994031190872192, 0.9962872266769409, 0.7291285395622253, 0.8422561883926392, 0.7621178030967712, 0.4166759252548218, 0.4946196973323822, 0.4451850652694702, 0.7629806995391846, 0.7204477190971375, 0.7885748744010925, 0.6446090340614319, 0.8708204030990601, 0.32380175590515137, 0.9781871438026428 ], "eval_code_hard_runtime": 140.1048, "eval_code_hard_samples_per_second": 0.714, "eval_code_hard_steps_per_second": 0.029, "epoch": 0.88, "step": 50 }, { "loss": 0.0203, "learning_rate": 0.0002, "epoch": 0.89, "step": 51 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 0.91, "step": 52 }, { "loss": 0.0373, "learning_rate": 0.0002, "epoch": 0.93, "step": 53 }, { "loss": 0.2778, "learning_rate": 0.0002, "epoch": 0.95, "step": 54 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 0.96, "step": 55 }, { "loss": 0.0011, "learning_rate": 0.0002, "epoch": 0.98, "step": 56 }, { "loss": 0.0148, "learning_rate": 0.0002, "epoch": 1.0, "step": 57 }, { "loss": 0.0051, "learning_rate": 0.0002, "epoch": 1.02, "step": 58 }, { "loss": 0.0092, "learning_rate": 0.0002, "epoch": 1.04, "step": 59 }, { "loss": 0.0004, "learning_rate": 0.0002, "epoch": 1.05, "step": 60 }, { "loss": 0.1744, "learning_rate": 0.0002, "epoch": 1.07, "step": 61 }, { "loss": 0.0001, "learning_rate": 0.0002, "epoch": 1.09, "step": 62 }, { "loss": 0.0018, "learning_rate": 0.0002, "epoch": 1.11, "step": 63 }, { "loss": 0.0078, "learning_rate": 0.0002, "epoch": 1.12, "step": 64 }, { "loss": 0.0121, "learning_rate": 0.0002, "epoch": 1.14, "step": 65 }, { "loss": 0.0001, "learning_rate": 0.0002, "epoch": 1.16, "step": 66 }, { "loss": 0.0004, "learning_rate": 0.0002, "epoch": 1.18, "step": 67 }, { "loss": 0.0188, "learning_rate": 0.0002, "epoch": 1.19, "step": 68 }, { "loss": 0.0005, "learning_rate": 0.0002, "epoch": 1.21, "step": 69 }, { "loss": 0.0007, "learning_rate": 0.0002, "epoch": 1.23, "step": 70 }, { "loss": 0.0112, "learning_rate": 0.0002, "epoch": 1.25, "step": 71 }, { "loss": 0.0034, "learning_rate": 0.0002, "epoch": 1.26, "step": 72 }, { "loss": 0.0012, "learning_rate": 0.0002, "epoch": 1.28, "step": 73 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.3, "step": 74 }, { "loss": 0.0246, "learning_rate": 0.0002, "epoch": 1.32, "step": 75 }, { "eval_code_easy_loss": 0.18898575007915497, "eval_code_easy_score": -0.02407282404601574, "eval_code_easy_brier_score": 0.02407282404601574, "eval_code_easy_average_probability": 0.9731456637382507, "eval_code_easy_accuracy": 0.97, "eval_code_easy_probabilities": [ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9942795038223267, 0.9999982118606567, 1.0, 0.9999651908874512, 0.9998317956924438, 0.9999611377716064, 0.9999415874481201, 1.0, 1.0, 0.9984660148620605, 1.0, 1.0, 1.0, 0.9995312690734863, 0.9939040541648865, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999691247940063, 0.9999864101409912, 0.9999852180480957, 0.9999997615814209, 0.9999762773513794, 0.9999992847442627, 0.9999895095825195, 0.9994505047798157, 0.9999997615814209, 0.9999996423721313, 0.999316930770874, 1.0, 0.9999549388885498, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9999998807907104, 0.9999992847442627, 0.9991188645362854, 0.9999963045120239, 1.0, 1.0, 1.0, 0.9998277425765991, 1.0, 1.0, 0.9999997615814209, 1.0, 1.0, 1.0, 0.3605167269706726, 1.0, 1.0, 1.0, 0.9999949932098389, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.97076416015625, 1.4138274309516419e-05, 0.001279860152862966, 1.0, 1.0, 1.0, 0.9999953508377075, 0.999148964881897, 0.9999984502792358, 1.0, 1.0, 1.0, 0.9999393224716187, 1.0, 1.0, 0.9999922513961792, 1.0, 0.9999986886978149, 0.9999806880950928, 0.9999102354049683, 0.9999845027923584, 1.0, 0.9995985627174377, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0 ], "eval_code_easy_runtime": 41.4851, "eval_code_easy_samples_per_second": 2.411, "eval_code_easy_steps_per_second": 0.096, "epoch": 1.32, "step": 75 }, { "eval_code_hard_loss": 2.2544667720794678, "eval_code_hard_score": -0.2460768073797226, "eval_code_hard_brier_score": 0.2460768073797226, "eval_code_hard_average_probability": 0.6746283173561096, "eval_code_hard_accuracy": 0.71, "eval_code_hard_probabilities": [ 0.9999983310699463, 0.5661250948905945, 0.7090879678726196, 0.09080829471349716, 0.09405586123466492, 6.130974361440167e-05, 0.24737045168876648, 0.201746866106987, 0.3449346125125885, 0.14900989830493927, 0.7652262449264526, 0.5247918367385864, 0.9998658895492554, 1.7507378657910522e-08, 2.665373033394758e-09, 0.9900109171867371, 0.9922283291816711, 0.9896736145019531, 3.136615077892202e-06, 9.850871720118448e-06, 1.0493128002053709e-06, 0.9999830722808838, 0.9980818033218384, 0.999981164932251, 0.9334778189659119, 0.28829115629196167, 0.9874013066291809, 0.9867030382156372, 0.9521355032920837, 0.975749135017395, 0.9921451210975647, 0.998805046081543, 0.6474704742431641, 0.9896721839904785, 0.9654123783111572, 0.9551592469215393, 0.12296662479639053, 0.17879928648471832, 0.9942314624786377, 0.29071682691574097, 0.26718518137931824, 0.9962670207023621, 0.9932090640068054, 0.9184593558311462, 0.9924524426460266, 0.9999681711196899, 0.5355503559112549, 0.62375807762146, 0.9999186992645264, 0.9999804496765137, 0.9999536275863647, 0.0012312890030443668, 0.9840332865715027, 0.9999861717224121, 1.4762352407160506e-07, 1.6458953666642628e-07, 1.1647493920463603e-05, 0.6963649988174438, 0.5160571932792664, 0.5119415521621704, 2.806163301727338e-08, 6.523485085452307e-10, 1.9155359964884155e-08, 0.9288567304611206, 0.9914976954460144, 0.999998927116394, 0.9736488461494446, 0.9999374151229858, 0.9989074468612671, 0.9604309797286987, 0.9418864250183105, 0.9515325427055359, 0.9813504219055176, 0.9903180599212646, 0.9985818862915039, 0.9873167276382446, 0.12791942059993744, 0.40380606055259705, 0.5523675680160522, 0.7548352479934692, 0.46443045139312744, 0.9042721390724182, 0.9984411597251892, 0.9024229645729065, 0.9884786009788513, 0.9960446357727051, 0.940305769443512, 0.784172534942627, 0.862592339515686, 0.6879691481590271, 0.41794973611831665, 0.5900482535362244, 0.540920078754425, 0.8815944194793701, 0.8355022668838501, 0.9159291982650757, 0.8655431866645813, 0.9957410097122192, 0.4074825942516327, 0.9812780022621155 ], "eval_code_hard_runtime": 140.1017, "eval_code_hard_samples_per_second": 0.714, "eval_code_hard_steps_per_second": 0.029, "epoch": 1.32, "step": 75 }, { "loss": 0.0063, "learning_rate": 0.0002, "epoch": 1.33, "step": 76 }, { "loss": 0.0109, "learning_rate": 0.0002, "epoch": 1.35, "step": 77 }, { "loss": 0.0002, "learning_rate": 0.0002, "epoch": 1.37, "step": 78 }, { "loss": 0.0854, "learning_rate": 0.0002, "epoch": 1.39, "step": 79 }, { "loss": 0.0327, "learning_rate": 0.0002, "epoch": 1.4, "step": 80 }, { "loss": 0.0002, "learning_rate": 0.0002, "epoch": 1.42, "step": 81 }, { "loss": 0.0705, "learning_rate": 0.0002, "epoch": 1.44, "step": 82 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.46, "step": 83 }, { "loss": 0.0031, "learning_rate": 0.0002, "epoch": 1.47, "step": 84 }, { "loss": 0.0199, "learning_rate": 0.0002, "epoch": 1.49, "step": 85 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.51, "step": 86 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.53, "step": 87 }, { "loss": 0.0011, "learning_rate": 0.0002, "epoch": 1.54, "step": 88 }, { "loss": 0.237, "learning_rate": 0.0002, "epoch": 1.56, "step": 89 }, { "loss": 0.0064, "learning_rate": 0.0002, "epoch": 1.58, "step": 90 }, { "loss": 0.0005, "learning_rate": 0.0002, "epoch": 1.6, "step": 91 }, { "loss": 0.0021, "learning_rate": 0.0002, "epoch": 1.61, "step": 92 }, { "loss": 0.0004, "learning_rate": 0.0002, "epoch": 1.63, "step": 93 }, { "loss": 0.0019, "learning_rate": 0.0002, "epoch": 1.65, "step": 94 }, { "loss": 0.0009, "learning_rate": 0.0002, "epoch": 1.67, "step": 95 }, { "loss": 0.0009, "learning_rate": 0.0002, "epoch": 1.68, "step": 96 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.7, "step": 97 }, { "loss": 0.0, "learning_rate": 0.0002, "epoch": 1.72, "step": 98 }, { "loss": 0.0005, "learning_rate": 0.0002, "epoch": 1.74, "step": 99 }, { "loss": 0.0016, "learning_rate": 0.0002, "epoch": 1.75, "step": 100 }, { "eval_code_easy_loss": 0.25820469856262207, "eval_code_easy_score": -0.020117390900850296, "eval_code_easy_brier_score": 0.020117390900850296, "eval_code_easy_average_probability": 0.9781191945075989, "eval_code_easy_accuracy": 0.98, "eval_code_easy_probabilities": [ 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9856951832771301, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9999998807907104, 0.8996143937110901, 1.0, 1.0, 0.9800459146499634, 1.0, 1.0, 1.0, 0.9999831914901733, 0.9999853372573853, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999538660049438, 0.9999998807907104, 1.0, 1.0, 0.9999990463256836, 1.0, 0.9999998807907104, 0.9980992674827576, 0.999997615814209, 0.9975267052650452, 0.9988257288932, 1.0, 0.9999734163284302, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999279975891113, 1.0, 1.0, 1.0, 1.0, 0.9663723707199097, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999686479568481, 1.0, 1.0, 1.0, 0.999997615814209, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9941490888595581, 9.479013840518746e-08, 7.865727820899338e-05, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9985870122909546, 1.0, 1.0, 1.0, 1.0, 0.9996020197868347, 1.0, 1.0, 0.9999988079071045, 1.0, 0.9999998807907104, 0.9997178912162781, 0.9999922513961792, 0.9999991655349731, 1.0, 0.9938370585441589, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0 ], "eval_code_easy_runtime": 41.4766, "eval_code_easy_samples_per_second": 2.411, "eval_code_easy_steps_per_second": 0.096, "epoch": 1.75, "step": 100 }, { "eval_code_hard_loss": 2.8355469703674316, "eval_code_hard_score": -0.24508047103881836, "eval_code_hard_brier_score": 0.24508047103881836, "eval_code_hard_average_probability": 0.6834875345230103, "eval_code_hard_accuracy": 0.71, "eval_code_hard_probabilities": [ 1.0, 0.49802687764167786, 0.7207960486412048, 0.01915053464472294, 0.022134896367788315, 4.0801442082738504e-05, 0.3737213611602783, 0.2865481376647949, 0.30831632018089294, 0.24947436153888702, 0.7978243231773376, 0.5949852466583252, 0.9999364614486694, 2.1756743628920105e-10, 2.9773794540943754e-11, 0.9936490654945374, 0.9942991733551025, 0.993448793888092, 3.583797980599712e-10, 3.8425835846567225e-09, 2.1109008985220612e-10, 0.9996128678321838, 0.9975799322128296, 0.9994070529937744, 0.9748783707618713, 0.47572091221809387, 0.996880054473877, 0.9991859793663025, 0.987097442150116, 0.9944655299186707, 0.9830182790756226, 0.995845377445221, 0.5017166137695312, 0.9952012300491333, 0.8540241122245789, 0.9487936496734619, 0.02690940722823143, 0.03413669392466545, 0.9999390840530396, 0.14402766525745392, 0.1746188849210739, 0.9748719930648804, 0.9814805388450623, 0.9264845848083496, 0.974022388458252, 0.9999991655349731, 0.7958990931510925, 0.6329552531242371, 0.9999284744262695, 0.9999613761901855, 0.9999935626983643, 8.354127930942923e-05, 0.9636399149894714, 0.999997615814209, 5.748397313709575e-10, 4.4799397524997175e-10, 1.1092028273651522e-07, 0.7891486883163452, 0.5943530797958374, 0.6597400307655334, 3.084578281686845e-08, 1.9499866998895499e-10, 7.682257319174823e-08, 0.988332211971283, 0.9993404746055603, 0.9999953508377075, 0.7918521761894226, 0.9975425004959106, 0.9782871603965759, 0.9723710417747498, 0.973602831363678, 0.9903439283370972, 0.9704287052154541, 0.9830175638198853, 0.9929106831550598, 0.9866513013839722, 0.16249682009220123, 0.3364860415458679, 0.5504053235054016, 0.8576055765151978, 0.5424798727035522, 0.9613667130470276, 0.9995546936988831, 0.8739398717880249, 0.9984847903251648, 0.9997493624687195, 0.980169951915741, 0.8975971341133118, 0.9636164903640747, 0.7637275457382202, 0.5357650518417358, 0.6792539358139038, 0.39096373319625854, 0.951950192451477, 0.8796238899230957, 0.9461458921432495, 0.7978929281234741, 0.991081178188324, 0.4479399621486664, 0.9878178834915161 ], "eval_code_hard_runtime": 140.1067, "eval_code_hard_samples_per_second": 0.714, "eval_code_hard_steps_per_second": 0.029, "epoch": 1.75, "step": 100 }, { "train_runtime": 4333.8818, "train_samples_per_second": 0.738, "train_steps_per_second": 0.023, "total_flos": 0.0, "train_loss": 0.09087586780193589, "epoch": 1.75, "step": 100 } ]