| [ |
| { |
| "loss": 0.6935, |
| "learning_rate": 0.0002, |
| "epoch": 0.02, |
| "step": 1 |
| }, |
| { |
| "loss": 0.6301, |
| "learning_rate": 0.0002, |
| "epoch": 0.04, |
| "step": 2 |
| }, |
| { |
| "loss": 0.6073, |
| "learning_rate": 0.0002, |
| "epoch": 0.05, |
| "step": 3 |
| }, |
| { |
| "loss": 0.5667, |
| "learning_rate": 0.0002, |
| "epoch": 0.07, |
| "step": 4 |
| }, |
| { |
| "loss": 0.4627, |
| "learning_rate": 0.0002, |
| "epoch": 0.09, |
| "step": 5 |
| }, |
| { |
| "loss": 0.4737, |
| "learning_rate": 0.0002, |
| "epoch": 0.11, |
| "step": 6 |
| }, |
| { |
| "loss": 0.3356, |
| "learning_rate": 0.0002, |
| "epoch": 0.12, |
| "step": 7 |
| }, |
| { |
| "loss": 0.27, |
| "learning_rate": 0.0002, |
| "epoch": 0.14, |
| "step": 8 |
| }, |
| { |
| "loss": 0.28, |
| "learning_rate": 0.0002, |
| "epoch": 0.16, |
| "step": 9 |
| }, |
| { |
| "loss": 0.3491, |
| "learning_rate": 0.0002, |
| "epoch": 0.18, |
| "step": 10 |
| }, |
| { |
| "loss": 0.2803, |
| "learning_rate": 0.0002, |
| "epoch": 0.19, |
| "step": 11 |
| }, |
| { |
| "loss": 0.1596, |
| "learning_rate": 0.0002, |
| "epoch": 0.21, |
| "step": 12 |
| }, |
| { |
| "loss": 0.1118, |
| "learning_rate": 0.0002, |
| "epoch": 0.23, |
| "step": 13 |
| }, |
| { |
| "loss": 0.2215, |
| "learning_rate": 0.0002, |
| "epoch": 0.25, |
| "step": 14 |
| }, |
| { |
| "loss": 0.0815, |
| "learning_rate": 0.0002, |
| "epoch": 0.26, |
| "step": 15 |
| }, |
| { |
| "loss": 0.1581, |
| "learning_rate": 0.0002, |
| "epoch": 0.28, |
| "step": 16 |
| }, |
| { |
| "loss": 0.1447, |
| "learning_rate": 0.0002, |
| "epoch": 0.3, |
| "step": 17 |
| }, |
| { |
| "loss": 0.0793, |
| "learning_rate": 0.0002, |
| "epoch": 0.32, |
| "step": 18 |
| }, |
| { |
| "loss": 0.0634, |
| "learning_rate": 0.0002, |
| "epoch": 0.33, |
| "step": 19 |
| }, |
| { |
| "loss": 0.0868, |
| "learning_rate": 0.0002, |
| "epoch": 0.35, |
| "step": 20 |
| }, |
| { |
| "loss": 0.1339, |
| "learning_rate": 0.0002, |
| "epoch": 0.37, |
| "step": 21 |
| }, |
| { |
| "loss": 0.0436, |
| "learning_rate": 0.0002, |
| "epoch": 0.39, |
| "step": 22 |
| }, |
| { |
| "loss": 0.0326, |
| "learning_rate": 0.0002, |
| "epoch": 0.4, |
| "step": 23 |
| }, |
| { |
| "loss": 0.0309, |
| "learning_rate": 0.0002, |
| "epoch": 0.42, |
| "step": 24 |
| }, |
| { |
| "loss": 0.4613, |
| "learning_rate": 0.0002, |
| "epoch": 0.44, |
| "step": 25 |
| }, |
| { |
| "eval_code_easy_loss": 0.22846165299415588, |
| "eval_code_easy_score": -0.034886911511421204, |
| "eval_code_easy_brier_score": 0.034886911511421204, |
| "eval_code_easy_average_probability": 0.9493436217308044, |
| "eval_code_easy_accuracy": 0.96, |
| "eval_code_easy_probabilities": [ |
| 1.0, |
| 1.0, |
| 0.9999986886978149, |
| 0.9999988079071045, |
| 0.9999972581863403, |
| 0.9999972581863403, |
| 0.8807934522628784, |
| 0.9996591806411743, |
| 1.0, |
| 0.9997110962867737, |
| 0.996894359588623, |
| 0.9885761141777039, |
| 0.9846639037132263, |
| 0.9999998807907104, |
| 0.9999992847442627, |
| 0.9217069745063782, |
| 0.9999998807907104, |
| 0.9999992847442627, |
| 0.9999531507492065, |
| 0.971138596534729, |
| 0.9644115567207336, |
| 0.9999998807907104, |
| 0.9999998807907104, |
| 0.9999996423721313, |
| 1.0, |
| 1.0, |
| 0.9992501139640808, |
| 0.9999996423721313, |
| 0.999998927116394, |
| 0.9999997615814209, |
| 0.9999358654022217, |
| 0.9999948740005493, |
| 0.9999706745147705, |
| 0.9182361364364624, |
| 0.9777969717979431, |
| 0.7950476408004761, |
| 0.07089971750974655, |
| 0.9999998807907104, |
| 0.9611170887947083, |
| 0.999824583530426, |
| 0.9999998807907104, |
| 0.9999997615814209, |
| 0.9999994039535522, |
| 0.9999918937683105, |
| 0.9999996423721313, |
| 0.9999992847442627, |
| 0.9999583959579468, |
| 0.9999964237213135, |
| 0.9999970197677612, |
| 1.0, |
| 0.9999992847442627, |
| 0.7631391286849976, |
| 0.9999997615814209, |
| 0.9999998807907104, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999991655349731, |
| 0.4372449815273285, |
| 0.9999960660934448, |
| 0.9999992847442627, |
| 1.0, |
| 0.989567220211029, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.6681390404701233, |
| 1.02999701994122e-05, |
| 0.0022490699775516987, |
| 1.0, |
| 1.0, |
| 0.9999945163726807, |
| 0.9999951124191284, |
| 0.999752938747406, |
| 0.9999997615814209, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9668532013893127, |
| 0.9999983310699463, |
| 0.9879446029663086, |
| 0.9999827146530151, |
| 1.0, |
| 0.9999997615814209, |
| 0.9972673654556274, |
| 0.9581230878829956, |
| 0.9999821186065674, |
| 0.9999935626983643, |
| 0.7346240282058716, |
| 0.9999959468841553, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999996423721313 |
| ], |
| "eval_code_easy_runtime": 41.4523, |
| "eval_code_easy_samples_per_second": 2.412, |
| "eval_code_easy_steps_per_second": 0.096, |
| "epoch": 0.44, |
| "step": 25 |
| }, |
| { |
| "eval_code_hard_loss": 0.8444641828536987, |
| "eval_code_hard_score": -0.21481266617774963, |
| "eval_code_hard_brier_score": 0.21481266617774963, |
| "eval_code_hard_average_probability": 0.6489911675453186, |
| "eval_code_hard_accuracy": 0.71, |
| "eval_code_hard_probabilities": [ |
| 0.9999761581420898, |
| 0.4704570770263672, |
| 0.38770198822021484, |
| 0.9957898259162903, |
| 0.9971027970314026, |
| 0.6636011004447937, |
| 0.3829995095729828, |
| 0.4488725960254669, |
| 0.3862934112548828, |
| 0.4944641590118408, |
| 0.6597261428833008, |
| 0.5888834595680237, |
| 0.9994460940361023, |
| 0.00023105263244360685, |
| 9.57881347858347e-05, |
| 0.9383717179298401, |
| 0.9582164287567139, |
| 0.9960324168205261, |
| 0.0013776113046333194, |
| 0.004925197456032038, |
| 0.0024418227840214968, |
| 0.9448224306106567, |
| 0.8293406367301941, |
| 0.990691065788269, |
| 0.6144397258758545, |
| 0.37276336550712585, |
| 0.7497667670249939, |
| 0.9995079040527344, |
| 0.8595492243766785, |
| 0.8565853238105774, |
| 0.9049152731895447, |
| 0.842837393283844, |
| 0.7425481081008911, |
| 0.9970250725746155, |
| 0.9908040761947632, |
| 0.9856406450271606, |
| 0.23333661258220673, |
| 0.3644156754016876, |
| 0.9999799728393555, |
| 0.5256256461143494, |
| 0.4714035987854004, |
| 0.5990293622016907, |
| 0.7481530904769897, |
| 0.6265391111373901, |
| 0.7847771644592285, |
| 0.9998830556869507, |
| 0.4729439914226532, |
| 0.5146611332893372, |
| 0.9899987578392029, |
| 0.999963641166687, |
| 0.9999411106109619, |
| 0.017366401851177216, |
| 0.25775712728500366, |
| 0.9997989535331726, |
| 0.2128974348306656, |
| 0.27310115098953247, |
| 0.6709675192832947, |
| 0.5412147045135498, |
| 0.5308579206466675, |
| 0.5533190369606018, |
| 0.11031078547239304, |
| 0.0799262598156929, |
| 0.12423858046531677, |
| 0.6619316339492798, |
| 0.6491618156433105, |
| 0.9998986721038818, |
| 0.5845221281051636, |
| 0.9992774128913879, |
| 0.7275769710540771, |
| 0.9403572082519531, |
| 0.9309749007225037, |
| 0.871741771697998, |
| 0.9114173650741577, |
| 0.9771295189857483, |
| 0.9557876586914062, |
| 0.9182456135749817, |
| 0.32342132925987244, |
| 0.5013740062713623, |
| 0.5234308242797852, |
| 0.5439746975898743, |
| 0.5095937252044678, |
| 0.7398637533187866, |
| 0.7255550026893616, |
| 0.7406316995620728, |
| 0.984710156917572, |
| 0.9945735335350037, |
| 0.9810420274734497, |
| 0.5697446465492249, |
| 0.6282893419265747, |
| 0.6032753586769104, |
| 0.40384215116500854, |
| 0.26884448528289795, |
| 0.45188671350479126, |
| 0.6884511709213257, |
| 0.4971124827861786, |
| 0.6430377960205078, |
| 0.6951863169670105, |
| 0.8902100920677185, |
| 0.13663697242736816, |
| 0.9657577872276306 |
| ], |
| "eval_code_hard_runtime": 140.0766, |
| "eval_code_hard_samples_per_second": 0.714, |
| "eval_code_hard_steps_per_second": 0.029, |
| "epoch": 0.44, |
| "step": 25 |
| }, |
| { |
| "loss": 0.1113, |
| "learning_rate": 0.0002, |
| "epoch": 0.46, |
| "step": 26 |
| }, |
| { |
| "loss": 0.0564, |
| "learning_rate": 0.0002, |
| "epoch": 0.47, |
| "step": 27 |
| }, |
| { |
| "loss": 0.0685, |
| "learning_rate": 0.0002, |
| "epoch": 0.49, |
| "step": 28 |
| }, |
| { |
| "loss": 0.1366, |
| "learning_rate": 0.0002, |
| "epoch": 0.51, |
| "step": 29 |
| }, |
| { |
| "loss": 0.0012, |
| "learning_rate": 0.0002, |
| "epoch": 0.53, |
| "step": 30 |
| }, |
| { |
| "loss": 0.0288, |
| "learning_rate": 0.0002, |
| "epoch": 0.54, |
| "step": 31 |
| }, |
| { |
| "loss": 0.0287, |
| "learning_rate": 0.0002, |
| "epoch": 0.56, |
| "step": 32 |
| }, |
| { |
| "loss": 0.0668, |
| "learning_rate": 0.0002, |
| "epoch": 0.58, |
| "step": 33 |
| }, |
| { |
| "loss": 0.0054, |
| "learning_rate": 0.0002, |
| "epoch": 0.6, |
| "step": 34 |
| }, |
| { |
| "loss": 0.0058, |
| "learning_rate": 0.0002, |
| "epoch": 0.61, |
| "step": 35 |
| }, |
| { |
| "loss": 0.1321, |
| "learning_rate": 0.0002, |
| "epoch": 0.63, |
| "step": 36 |
| }, |
| { |
| "loss": 0.0438, |
| "learning_rate": 0.0002, |
| "epoch": 0.65, |
| "step": 37 |
| }, |
| { |
| "loss": 0.035, |
| "learning_rate": 0.0002, |
| "epoch": 0.67, |
| "step": 38 |
| }, |
| { |
| "loss": 0.03, |
| "learning_rate": 0.0002, |
| "epoch": 0.68, |
| "step": 39 |
| }, |
| { |
| "loss": 0.0043, |
| "learning_rate": 0.0002, |
| "epoch": 0.7, |
| "step": 40 |
| }, |
| { |
| "loss": 0.0158, |
| "learning_rate": 0.0002, |
| "epoch": 0.72, |
| "step": 41 |
| }, |
| { |
| "loss": 0.0097, |
| "learning_rate": 0.0002, |
| "epoch": 0.74, |
| "step": 42 |
| }, |
| { |
| "loss": 0.0104, |
| "learning_rate": 0.0002, |
| "epoch": 0.75, |
| "step": 43 |
| }, |
| { |
| "loss": 0.0854, |
| "learning_rate": 0.0002, |
| "epoch": 0.77, |
| "step": 44 |
| }, |
| { |
| "loss": 0.0115, |
| "learning_rate": 0.0002, |
| "epoch": 0.79, |
| "step": 45 |
| }, |
| { |
| "loss": 0.0903, |
| "learning_rate": 0.0002, |
| "epoch": 0.81, |
| "step": 46 |
| }, |
| { |
| "loss": 0.0082, |
| "learning_rate": 0.0002, |
| "epoch": 0.82, |
| "step": 47 |
| }, |
| { |
| "loss": 0.0841, |
| "learning_rate": 0.0002, |
| "epoch": 0.84, |
| "step": 48 |
| }, |
| { |
| "loss": 0.0379, |
| "learning_rate": 0.0002, |
| "epoch": 0.86, |
| "step": 49 |
| }, |
| { |
| "loss": 0.1163, |
| "learning_rate": 0.0002, |
| "epoch": 0.88, |
| "step": 50 |
| }, |
| { |
| "eval_code_easy_loss": 0.28712284564971924, |
| "eval_code_easy_score": -0.026069259271025658, |
| "eval_code_easy_brier_score": 0.026069259271025658, |
| "eval_code_easy_average_probability": 0.9709805250167847, |
| "eval_code_easy_accuracy": 0.97, |
| "eval_code_easy_probabilities": [ |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999997615814209, |
| 0.9602830410003662, |
| 1.0, |
| 1.0, |
| 0.9999963045120239, |
| 0.999914288520813, |
| 0.9999732971191406, |
| 0.9999974966049194, |
| 1.0, |
| 1.0, |
| 0.9866946935653687, |
| 1.0, |
| 1.0, |
| 0.9999997615814209, |
| 0.9994608759880066, |
| 0.9999551773071289, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.999995231628418, |
| 0.9999997615814209, |
| 0.9999998807907104, |
| 1.0, |
| 0.9999250173568726, |
| 0.9999978542327881, |
| 0.9999946355819702, |
| 0.9998421669006348, |
| 0.9999990463256836, |
| 0.9997969269752502, |
| 0.9818890690803528, |
| 1.0, |
| 0.9999922513961792, |
| 0.9999998807907104, |
| 0.9999998807907104, |
| 0.9999998807907104, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9997735619544983, |
| 0.9998974800109863, |
| 0.9999257326126099, |
| 0.9999967813491821, |
| 0.9999998807907104, |
| 0.9999998807907104, |
| 0.9922711849212646, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.223012313246727, |
| 0.9999998807907104, |
| 1.0, |
| 1.0, |
| 0.9999990463256836, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9665756225585938, |
| 4.0422314384613856e-08, |
| 4.318383798818104e-05, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9998561143875122, |
| 0.999182403087616, |
| 0.9999680519104004, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999822378158569, |
| 1.0, |
| 1.0, |
| 0.9959767460823059, |
| 0.9999539852142334, |
| 0.9995007514953613, |
| 0.9999942779541016, |
| 0.9996492862701416, |
| 0.9998260140419006, |
| 1.0, |
| 0.9949652552604675, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0 |
| ], |
| "eval_code_easy_runtime": 41.3563, |
| "eval_code_easy_samples_per_second": 2.418, |
| "eval_code_easy_steps_per_second": 0.097, |
| "epoch": 0.88, |
| "step": 50 |
| }, |
| { |
| "eval_code_hard_loss": 0.9237764477729797, |
| "eval_code_hard_score": -0.20848987996578217, |
| "eval_code_hard_brier_score": 0.20848987996578217, |
| "eval_code_hard_average_probability": 0.683417558670044, |
| "eval_code_hard_accuracy": 0.71, |
| "eval_code_hard_probabilities": [ |
| 0.9991462230682373, |
| 0.39208656549453735, |
| 0.4176894426345825, |
| 0.999220609664917, |
| 0.9982213377952576, |
| 0.9070152640342712, |
| 0.15849868953227997, |
| 0.28745439648628235, |
| 0.3027569651603699, |
| 0.24870805442333221, |
| 0.7417134642601013, |
| 0.5444478392601013, |
| 0.9999140501022339, |
| 0.0021548818331211805, |
| 0.00024593042326159775, |
| 0.9696754217147827, |
| 0.9635093212127686, |
| 0.9924002885818481, |
| 0.00320712779648602, |
| 0.004237341228872538, |
| 0.000593981530983001, |
| 0.9999964237213135, |
| 0.9995344877243042, |
| 0.999998927116394, |
| 0.6726424098014832, |
| 0.20489203929901123, |
| 0.906218409538269, |
| 0.1464991718530655, |
| 0.8866965770721436, |
| 0.9025827050209045, |
| 0.9838942885398865, |
| 0.9865344762802124, |
| 0.4193040132522583, |
| 0.9865899085998535, |
| 0.9603983759880066, |
| 0.958928644657135, |
| 0.6753811240196228, |
| 0.573758602142334, |
| 0.6913469433784485, |
| 0.3839159607887268, |
| 0.42377495765686035, |
| 0.9371411204338074, |
| 0.997376561164856, |
| 0.9381016492843628, |
| 0.9976379871368408, |
| 0.9994822144508362, |
| 0.5902647376060486, |
| 0.583461582660675, |
| 0.9944129586219788, |
| 0.9991785883903503, |
| 0.9986459612846375, |
| 0.012307150289416313, |
| 0.8033295273780823, |
| 0.9979121088981628, |
| 0.00042291387217119336, |
| 0.0005228969966992736, |
| 0.00923232827335596, |
| 0.7242734432220459, |
| 0.6451666951179504, |
| 0.7488073110580444, |
| 0.3765398859977722, |
| 0.14819785952568054, |
| 0.39486005902290344, |
| 0.6967870593070984, |
| 0.8443142175674438, |
| 0.9988842606544495, |
| 0.9835836291313171, |
| 0.9990014433860779, |
| 0.9992020726203918, |
| 0.9539203643798828, |
| 0.9750897288322449, |
| 0.850548267364502, |
| 0.8060330152511597, |
| 0.9476742744445801, |
| 0.9418892860412598, |
| 0.9725985527038574, |
| 0.17615075409412384, |
| 0.5268995761871338, |
| 0.5463316440582275, |
| 0.7340309023857117, |
| 0.45826229453086853, |
| 0.758548378944397, |
| 0.9831669926643372, |
| 0.8220421671867371, |
| 0.9986447691917419, |
| 0.9994031190872192, |
| 0.9962872266769409, |
| 0.7291285395622253, |
| 0.8422561883926392, |
| 0.7621178030967712, |
| 0.4166759252548218, |
| 0.4946196973323822, |
| 0.4451850652694702, |
| 0.7629806995391846, |
| 0.7204477190971375, |
| 0.7885748744010925, |
| 0.6446090340614319, |
| 0.8708204030990601, |
| 0.32380175590515137, |
| 0.9781871438026428 |
| ], |
| "eval_code_hard_runtime": 140.1048, |
| "eval_code_hard_samples_per_second": 0.714, |
| "eval_code_hard_steps_per_second": 0.029, |
| "epoch": 0.88, |
| "step": 50 |
| }, |
| { |
| "loss": 0.0203, |
| "learning_rate": 0.0002, |
| "epoch": 0.89, |
| "step": 51 |
| }, |
| { |
| "loss": 0.0, |
| "learning_rate": 0.0002, |
| "epoch": 0.91, |
| "step": 52 |
| }, |
| { |
| "loss": 0.0373, |
| "learning_rate": 0.0002, |
| "epoch": 0.93, |
| "step": 53 |
| }, |
| { |
| "loss": 0.2778, |
| "learning_rate": 0.0002, |
| "epoch": 0.95, |
| "step": 54 |
| }, |
| { |
| "loss": 0.0, |
| "learning_rate": 0.0002, |
| "epoch": 0.96, |
| "step": 55 |
| }, |
| { |
| "loss": 0.0011, |
| "learning_rate": 0.0002, |
| "epoch": 0.98, |
| "step": 56 |
| }, |
| { |
| "loss": 0.0148, |
| "learning_rate": 0.0002, |
| "epoch": 1.0, |
| "step": 57 |
| }, |
| { |
| "loss": 0.0051, |
| "learning_rate": 0.0002, |
| "epoch": 1.02, |
| "step": 58 |
| }, |
| { |
| "loss": 0.0092, |
| "learning_rate": 0.0002, |
| "epoch": 1.04, |
| "step": 59 |
| }, |
| { |
| "loss": 0.0004, |
| "learning_rate": 0.0002, |
| "epoch": 1.05, |
| "step": 60 |
| }, |
| { |
| "loss": 0.1744, |
| "learning_rate": 0.0002, |
| "epoch": 1.07, |
| "step": 61 |
| }, |
| { |
| "loss": 0.0001, |
| "learning_rate": 0.0002, |
| "epoch": 1.09, |
| "step": 62 |
| }, |
| { |
| "loss": 0.0018, |
| "learning_rate": 0.0002, |
| "epoch": 1.11, |
| "step": 63 |
| }, |
| { |
| "loss": 0.0078, |
| "learning_rate": 0.0002, |
| "epoch": 1.12, |
| "step": 64 |
| }, |
| { |
| "loss": 0.0121, |
| "learning_rate": 0.0002, |
| "epoch": 1.14, |
| "step": 65 |
| }, |
| { |
| "loss": 0.0001, |
| "learning_rate": 0.0002, |
| "epoch": 1.16, |
| "step": 66 |
| }, |
| { |
| "loss": 0.0004, |
| "learning_rate": 0.0002, |
| "epoch": 1.18, |
| "step": 67 |
| }, |
| { |
| "loss": 0.0188, |
| "learning_rate": 0.0002, |
| "epoch": 1.19, |
| "step": 68 |
| }, |
| { |
| "loss": 0.0005, |
| "learning_rate": 0.0002, |
| "epoch": 1.21, |
| "step": 69 |
| }, |
| { |
| "loss": 0.0007, |
| "learning_rate": 0.0002, |
| "epoch": 1.23, |
| "step": 70 |
| }, |
| { |
| "loss": 0.0112, |
| "learning_rate": 0.0002, |
| "epoch": 1.25, |
| "step": 71 |
| }, |
| { |
| "loss": 0.0034, |
| "learning_rate": 0.0002, |
| "epoch": 1.26, |
| "step": 72 |
| }, |
| { |
| "loss": 0.0012, |
| "learning_rate": 0.0002, |
| "epoch": 1.28, |
| "step": 73 |
| }, |
| { |
| "loss": 0.0, |
| "learning_rate": 0.0002, |
| "epoch": 1.3, |
| "step": 74 |
| }, |
| { |
| "loss": 0.0246, |
| "learning_rate": 0.0002, |
| "epoch": 1.32, |
| "step": 75 |
| }, |
| { |
| "eval_code_easy_loss": 0.18898575007915497, |
| "eval_code_easy_score": -0.02407282404601574, |
| "eval_code_easy_brier_score": 0.02407282404601574, |
| "eval_code_easy_average_probability": 0.9731456637382507, |
| "eval_code_easy_accuracy": 0.97, |
| "eval_code_easy_probabilities": [ |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9942795038223267, |
| 0.9999982118606567, |
| 1.0, |
| 0.9999651908874512, |
| 0.9998317956924438, |
| 0.9999611377716064, |
| 0.9999415874481201, |
| 1.0, |
| 1.0, |
| 0.9984660148620605, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9995312690734863, |
| 0.9939040541648865, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999691247940063, |
| 0.9999864101409912, |
| 0.9999852180480957, |
| 0.9999997615814209, |
| 0.9999762773513794, |
| 0.9999992847442627, |
| 0.9999895095825195, |
| 0.9994505047798157, |
| 0.9999997615814209, |
| 0.9999996423721313, |
| 0.999316930770874, |
| 1.0, |
| 0.9999549388885498, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999998807907104, |
| 0.9999998807907104, |
| 0.9999992847442627, |
| 0.9991188645362854, |
| 0.9999963045120239, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9998277425765991, |
| 1.0, |
| 1.0, |
| 0.9999997615814209, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.3605167269706726, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999949932098389, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.97076416015625, |
| 1.4138274309516419e-05, |
| 0.001279860152862966, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999953508377075, |
| 0.999148964881897, |
| 0.9999984502792358, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999393224716187, |
| 1.0, |
| 1.0, |
| 0.9999922513961792, |
| 1.0, |
| 0.9999986886978149, |
| 0.9999806880950928, |
| 0.9999102354049683, |
| 0.9999845027923584, |
| 1.0, |
| 0.9995985627174377, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0 |
| ], |
| "eval_code_easy_runtime": 41.4851, |
| "eval_code_easy_samples_per_second": 2.411, |
| "eval_code_easy_steps_per_second": 0.096, |
| "epoch": 1.32, |
| "step": 75 |
| }, |
| { |
| "eval_code_hard_loss": 2.2544667720794678, |
| "eval_code_hard_score": -0.2460768073797226, |
| "eval_code_hard_brier_score": 0.2460768073797226, |
| "eval_code_hard_average_probability": 0.6746283173561096, |
| "eval_code_hard_accuracy": 0.71, |
| "eval_code_hard_probabilities": [ |
| 0.9999983310699463, |
| 0.5661250948905945, |
| 0.7090879678726196, |
| 0.09080829471349716, |
| 0.09405586123466492, |
| 6.130974361440167e-05, |
| 0.24737045168876648, |
| 0.201746866106987, |
| 0.3449346125125885, |
| 0.14900989830493927, |
| 0.7652262449264526, |
| 0.5247918367385864, |
| 0.9998658895492554, |
| 1.7507378657910522e-08, |
| 2.665373033394758e-09, |
| 0.9900109171867371, |
| 0.9922283291816711, |
| 0.9896736145019531, |
| 3.136615077892202e-06, |
| 9.850871720118448e-06, |
| 1.0493128002053709e-06, |
| 0.9999830722808838, |
| 0.9980818033218384, |
| 0.999981164932251, |
| 0.9334778189659119, |
| 0.28829115629196167, |
| 0.9874013066291809, |
| 0.9867030382156372, |
| 0.9521355032920837, |
| 0.975749135017395, |
| 0.9921451210975647, |
| 0.998805046081543, |
| 0.6474704742431641, |
| 0.9896721839904785, |
| 0.9654123783111572, |
| 0.9551592469215393, |
| 0.12296662479639053, |
| 0.17879928648471832, |
| 0.9942314624786377, |
| 0.29071682691574097, |
| 0.26718518137931824, |
| 0.9962670207023621, |
| 0.9932090640068054, |
| 0.9184593558311462, |
| 0.9924524426460266, |
| 0.9999681711196899, |
| 0.5355503559112549, |
| 0.62375807762146, |
| 0.9999186992645264, |
| 0.9999804496765137, |
| 0.9999536275863647, |
| 0.0012312890030443668, |
| 0.9840332865715027, |
| 0.9999861717224121, |
| 1.4762352407160506e-07, |
| 1.6458953666642628e-07, |
| 1.1647493920463603e-05, |
| 0.6963649988174438, |
| 0.5160571932792664, |
| 0.5119415521621704, |
| 2.806163301727338e-08, |
| 6.523485085452307e-10, |
| 1.9155359964884155e-08, |
| 0.9288567304611206, |
| 0.9914976954460144, |
| 0.999998927116394, |
| 0.9736488461494446, |
| 0.9999374151229858, |
| 0.9989074468612671, |
| 0.9604309797286987, |
| 0.9418864250183105, |
| 0.9515325427055359, |
| 0.9813504219055176, |
| 0.9903180599212646, |
| 0.9985818862915039, |
| 0.9873167276382446, |
| 0.12791942059993744, |
| 0.40380606055259705, |
| 0.5523675680160522, |
| 0.7548352479934692, |
| 0.46443045139312744, |
| 0.9042721390724182, |
| 0.9984411597251892, |
| 0.9024229645729065, |
| 0.9884786009788513, |
| 0.9960446357727051, |
| 0.940305769443512, |
| 0.784172534942627, |
| 0.862592339515686, |
| 0.6879691481590271, |
| 0.41794973611831665, |
| 0.5900482535362244, |
| 0.540920078754425, |
| 0.8815944194793701, |
| 0.8355022668838501, |
| 0.9159291982650757, |
| 0.8655431866645813, |
| 0.9957410097122192, |
| 0.4074825942516327, |
| 0.9812780022621155 |
| ], |
| "eval_code_hard_runtime": 140.1017, |
| "eval_code_hard_samples_per_second": 0.714, |
| "eval_code_hard_steps_per_second": 0.029, |
| "epoch": 1.32, |
| "step": 75 |
| }, |
| { |
| "loss": 0.0063, |
| "learning_rate": 0.0002, |
| "epoch": 1.33, |
| "step": 76 |
| }, |
| { |
| "loss": 0.0109, |
| "learning_rate": 0.0002, |
| "epoch": 1.35, |
| "step": 77 |
| }, |
| { |
| "loss": 0.0002, |
| "learning_rate": 0.0002, |
| "epoch": 1.37, |
| "step": 78 |
| }, |
| { |
| "loss": 0.0854, |
| "learning_rate": 0.0002, |
| "epoch": 1.39, |
| "step": 79 |
| }, |
| { |
| "loss": 0.0327, |
| "learning_rate": 0.0002, |
| "epoch": 1.4, |
| "step": 80 |
| }, |
| { |
| "loss": 0.0002, |
| "learning_rate": 0.0002, |
| "epoch": 1.42, |
| "step": 81 |
| }, |
| { |
| "loss": 0.0705, |
| "learning_rate": 0.0002, |
| "epoch": 1.44, |
| "step": 82 |
| }, |
| { |
| "loss": 0.0, |
| "learning_rate": 0.0002, |
| "epoch": 1.46, |
| "step": 83 |
| }, |
| { |
| "loss": 0.0031, |
| "learning_rate": 0.0002, |
| "epoch": 1.47, |
| "step": 84 |
| }, |
| { |
| "loss": 0.0199, |
| "learning_rate": 0.0002, |
| "epoch": 1.49, |
| "step": 85 |
| }, |
| { |
| "loss": 0.0, |
| "learning_rate": 0.0002, |
| "epoch": 1.51, |
| "step": 86 |
| }, |
| { |
| "loss": 0.0, |
| "learning_rate": 0.0002, |
| "epoch": 1.53, |
| "step": 87 |
| }, |
| { |
| "loss": 0.0011, |
| "learning_rate": 0.0002, |
| "epoch": 1.54, |
| "step": 88 |
| }, |
| { |
| "loss": 0.237, |
| "learning_rate": 0.0002, |
| "epoch": 1.56, |
| "step": 89 |
| }, |
| { |
| "loss": 0.0064, |
| "learning_rate": 0.0002, |
| "epoch": 1.58, |
| "step": 90 |
| }, |
| { |
| "loss": 0.0005, |
| "learning_rate": 0.0002, |
| "epoch": 1.6, |
| "step": 91 |
| }, |
| { |
| "loss": 0.0021, |
| "learning_rate": 0.0002, |
| "epoch": 1.61, |
| "step": 92 |
| }, |
| { |
| "loss": 0.0004, |
| "learning_rate": 0.0002, |
| "epoch": 1.63, |
| "step": 93 |
| }, |
| { |
| "loss": 0.0019, |
| "learning_rate": 0.0002, |
| "epoch": 1.65, |
| "step": 94 |
| }, |
| { |
| "loss": 0.0009, |
| "learning_rate": 0.0002, |
| "epoch": 1.67, |
| "step": 95 |
| }, |
| { |
| "loss": 0.0009, |
| "learning_rate": 0.0002, |
| "epoch": 1.68, |
| "step": 96 |
| }, |
| { |
| "loss": 0.0, |
| "learning_rate": 0.0002, |
| "epoch": 1.7, |
| "step": 97 |
| }, |
| { |
| "loss": 0.0, |
| "learning_rate": 0.0002, |
| "epoch": 1.72, |
| "step": 98 |
| }, |
| { |
| "loss": 0.0005, |
| "learning_rate": 0.0002, |
| "epoch": 1.74, |
| "step": 99 |
| }, |
| { |
| "loss": 0.0016, |
| "learning_rate": 0.0002, |
| "epoch": 1.75, |
| "step": 100 |
| }, |
| { |
| "eval_code_easy_loss": 0.25820469856262207, |
| "eval_code_easy_score": -0.020117390900850296, |
| "eval_code_easy_brier_score": 0.020117390900850296, |
| "eval_code_easy_average_probability": 0.9781191945075989, |
| "eval_code_easy_accuracy": 0.98, |
| "eval_code_easy_probabilities": [ |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9856951832771301, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999998807907104, |
| 0.9999998807907104, |
| 0.8996143937110901, |
| 1.0, |
| 1.0, |
| 0.9800459146499634, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999831914901733, |
| 0.9999853372573853, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999538660049438, |
| 0.9999998807907104, |
| 1.0, |
| 1.0, |
| 0.9999990463256836, |
| 1.0, |
| 0.9999998807907104, |
| 0.9980992674827576, |
| 0.999997615814209, |
| 0.9975267052650452, |
| 0.9988257288932, |
| 1.0, |
| 0.9999734163284302, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999279975891113, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9663723707199097, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999686479568481, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.999997615814209, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9941490888595581, |
| 9.479013840518746e-08, |
| 7.865727820899338e-05, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999998807907104, |
| 0.9985870122909546, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9996020197868347, |
| 1.0, |
| 1.0, |
| 0.9999988079071045, |
| 1.0, |
| 0.9999998807907104, |
| 0.9997178912162781, |
| 0.9999922513961792, |
| 0.9999991655349731, |
| 1.0, |
| 0.9938370585441589, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0 |
| ], |
| "eval_code_easy_runtime": 41.4766, |
| "eval_code_easy_samples_per_second": 2.411, |
| "eval_code_easy_steps_per_second": 0.096, |
| "epoch": 1.75, |
| "step": 100 |
| }, |
| { |
| "eval_code_hard_loss": 2.8355469703674316, |
| "eval_code_hard_score": -0.24508047103881836, |
| "eval_code_hard_brier_score": 0.24508047103881836, |
| "eval_code_hard_average_probability": 0.6834875345230103, |
| "eval_code_hard_accuracy": 0.71, |
| "eval_code_hard_probabilities": [ |
| 1.0, |
| 0.49802687764167786, |
| 0.7207960486412048, |
| 0.01915053464472294, |
| 0.022134896367788315, |
| 4.0801442082738504e-05, |
| 0.3737213611602783, |
| 0.2865481376647949, |
| 0.30831632018089294, |
| 0.24947436153888702, |
| 0.7978243231773376, |
| 0.5949852466583252, |
| 0.9999364614486694, |
| 2.1756743628920105e-10, |
| 2.9773794540943754e-11, |
| 0.9936490654945374, |
| 0.9942991733551025, |
| 0.993448793888092, |
| 3.583797980599712e-10, |
| 3.8425835846567225e-09, |
| 2.1109008985220612e-10, |
| 0.9996128678321838, |
| 0.9975799322128296, |
| 0.9994070529937744, |
| 0.9748783707618713, |
| 0.47572091221809387, |
| 0.996880054473877, |
| 0.9991859793663025, |
| 0.987097442150116, |
| 0.9944655299186707, |
| 0.9830182790756226, |
| 0.995845377445221, |
| 0.5017166137695312, |
| 0.9952012300491333, |
| 0.8540241122245789, |
| 0.9487936496734619, |
| 0.02690940722823143, |
| 0.03413669392466545, |
| 0.9999390840530396, |
| 0.14402766525745392, |
| 0.1746188849210739, |
| 0.9748719930648804, |
| 0.9814805388450623, |
| 0.9264845848083496, |
| 0.974022388458252, |
| 0.9999991655349731, |
| 0.7958990931510925, |
| 0.6329552531242371, |
| 0.9999284744262695, |
| 0.9999613761901855, |
| 0.9999935626983643, |
| 8.354127930942923e-05, |
| 0.9636399149894714, |
| 0.999997615814209, |
| 5.748397313709575e-10, |
| 4.4799397524997175e-10, |
| 1.1092028273651522e-07, |
| 0.7891486883163452, |
| 0.5943530797958374, |
| 0.6597400307655334, |
| 3.084578281686845e-08, |
| 1.9499866998895499e-10, |
| 7.682257319174823e-08, |
| 0.988332211971283, |
| 0.9993404746055603, |
| 0.9999953508377075, |
| 0.7918521761894226, |
| 0.9975425004959106, |
| 0.9782871603965759, |
| 0.9723710417747498, |
| 0.973602831363678, |
| 0.9903439283370972, |
| 0.9704287052154541, |
| 0.9830175638198853, |
| 0.9929106831550598, |
| 0.9866513013839722, |
| 0.16249682009220123, |
| 0.3364860415458679, |
| 0.5504053235054016, |
| 0.8576055765151978, |
| 0.5424798727035522, |
| 0.9613667130470276, |
| 0.9995546936988831, |
| 0.8739398717880249, |
| 0.9984847903251648, |
| 0.9997493624687195, |
| 0.980169951915741, |
| 0.8975971341133118, |
| 0.9636164903640747, |
| 0.7637275457382202, |
| 0.5357650518417358, |
| 0.6792539358139038, |
| 0.39096373319625854, |
| 0.951950192451477, |
| 0.8796238899230957, |
| 0.9461458921432495, |
| 0.7978929281234741, |
| 0.991081178188324, |
| 0.4479399621486664, |
| 0.9878178834915161 |
| ], |
| "eval_code_hard_runtime": 140.1067, |
| "eval_code_hard_samples_per_second": 0.714, |
| "eval_code_hard_steps_per_second": 0.029, |
| "epoch": 1.75, |
| "step": 100 |
| }, |
| { |
| "train_runtime": 4333.8818, |
| "train_samples_per_second": 0.738, |
| "train_steps_per_second": 0.023, |
| "total_flos": 0.0, |
| "train_loss": 0.09087586780193589, |
| "epoch": 1.75, |
| "step": 100 |
| } |
| ] |