| [ |
| { |
| "loss": 0.7176, |
| "learning_rate": 0.0002, |
| "epoch": 0.02, |
| "step": 1 |
| }, |
| { |
| "loss": 0.626, |
| "learning_rate": 0.0002, |
| "epoch": 0.04, |
| "step": 2 |
| }, |
| { |
| "loss": 0.6406, |
| "learning_rate": 0.0002, |
| "epoch": 0.05, |
| "step": 3 |
| }, |
| { |
| "loss": 0.5599, |
| "learning_rate": 0.0002, |
| "epoch": 0.07, |
| "step": 4 |
| }, |
| { |
| "loss": 0.4681, |
| "learning_rate": 0.0002, |
| "epoch": 0.09, |
| "step": 5 |
| }, |
| { |
| "loss": 0.4553, |
| "learning_rate": 0.0002, |
| "epoch": 0.11, |
| "step": 6 |
| }, |
| { |
| "loss": 0.4104, |
| "learning_rate": 0.0002, |
| "epoch": 0.12, |
| "step": 7 |
| }, |
| { |
| "loss": 0.3978, |
| "learning_rate": 0.0002, |
| "epoch": 0.14, |
| "step": 8 |
| }, |
| { |
| "loss": 0.3848, |
| "learning_rate": 0.0002, |
| "epoch": 0.16, |
| "step": 9 |
| }, |
| { |
| "loss": 0.5363, |
| "learning_rate": 0.0002, |
| "epoch": 0.18, |
| "step": 10 |
| }, |
| { |
| "loss": 0.3722, |
| "learning_rate": 0.0002, |
| "epoch": 0.19, |
| "step": 11 |
| }, |
| { |
| "loss": 0.3675, |
| "learning_rate": 0.0002, |
| "epoch": 0.21, |
| "step": 12 |
| }, |
| { |
| "loss": 0.3061, |
| "learning_rate": 0.0002, |
| "epoch": 0.23, |
| "step": 13 |
| }, |
| { |
| "loss": 0.2357, |
| "learning_rate": 0.0002, |
| "epoch": 0.25, |
| "step": 14 |
| }, |
| { |
| "loss": 0.2983, |
| "learning_rate": 0.0002, |
| "epoch": 0.26, |
| "step": 15 |
| }, |
| { |
| "loss": 0.4426, |
| "learning_rate": 0.0002, |
| "epoch": 0.28, |
| "step": 16 |
| }, |
| { |
| "loss": 0.3633, |
| "learning_rate": 0.0002, |
| "epoch": 0.3, |
| "step": 17 |
| }, |
| { |
| "loss": 0.3673, |
| "learning_rate": 0.0002, |
| "epoch": 0.32, |
| "step": 18 |
| }, |
| { |
| "loss": 0.2728, |
| "learning_rate": 0.0002, |
| "epoch": 0.33, |
| "step": 19 |
| }, |
| { |
| "loss": 0.3937, |
| "learning_rate": 0.0002, |
| "epoch": 0.35, |
| "step": 20 |
| }, |
| { |
| "loss": 0.3076, |
| "learning_rate": 0.0002, |
| "epoch": 0.37, |
| "step": 21 |
| }, |
| { |
| "loss": 0.1257, |
| "learning_rate": 0.0002, |
| "epoch": 0.39, |
| "step": 22 |
| }, |
| { |
| "loss": 0.1323, |
| "learning_rate": 0.0002, |
| "epoch": 0.4, |
| "step": 23 |
| }, |
| { |
| "loss": 0.3184, |
| "learning_rate": 0.0002, |
| "epoch": 0.42, |
| "step": 24 |
| }, |
| { |
| "loss": 0.1576, |
| "learning_rate": 0.0002, |
| "epoch": 0.44, |
| "step": 25 |
| }, |
| { |
| "eval_code_easy_loss": 0.34121498465538025, |
| "eval_code_easy_score": -0.08921275287866592, |
| "eval_code_easy_brier_score": 0.08921275287866592, |
| "eval_code_easy_average_probability": 0.8383815884590149, |
| "eval_code_easy_accuracy": 0.91, |
| "eval_code_easy_probabilities": [ |
| 0.9973312616348267, |
| 0.9983710646629333, |
| 0.997231662273407, |
| 0.9965489506721497, |
| 0.9987871050834656, |
| 0.9933956265449524, |
| 0.6967766284942627, |
| 0.7963165044784546, |
| 0.8957101702690125, |
| 0.8911858797073364, |
| 0.6700810194015503, |
| 0.887999415397644, |
| 0.8513328433036804, |
| 0.7391810417175293, |
| 0.968675971031189, |
| 0.8287560939788818, |
| 0.8346096873283386, |
| 0.9987896084785461, |
| 0.7685402035713196, |
| 0.6702771186828613, |
| 0.6680448055267334, |
| 0.9981842637062073, |
| 0.9979216456413269, |
| 0.9962202906608582, |
| 0.999874472618103, |
| 0.9479197263717651, |
| 0.92351233959198, |
| 0.9997767806053162, |
| 0.9997504353523254, |
| 0.9994015693664551, |
| 0.8156358003616333, |
| 0.8976724147796631, |
| 0.35684335231781006, |
| 0.6020401120185852, |
| 0.695774257183075, |
| 0.5311483144760132, |
| 0.9899909496307373, |
| 0.9998482465744019, |
| 0.6876679062843323, |
| 0.9594499468803406, |
| 0.991589367389679, |
| 0.7725859880447388, |
| 0.9999998807907104, |
| 0.9900687336921692, |
| 0.9798843860626221, |
| 0.019548967480659485, |
| 0.10404925793409348, |
| 0.03977573662996292, |
| 0.638748049736023, |
| 0.9745407700538635, |
| 0.8131493330001831, |
| 0.4198451638221741, |
| 0.9959275126457214, |
| 0.9906547665596008, |
| 0.999859094619751, |
| 0.999954104423523, |
| 0.9999948740005493, |
| 0.9941011071205139, |
| 0.5232334733009338, |
| 0.996921181678772, |
| 0.9495030641555786, |
| 0.9917147755622864, |
| 0.9849343299865723, |
| 0.9999825954437256, |
| 0.999990701675415, |
| 0.9999847412109375, |
| 0.9999663829803467, |
| 0.9981877207756042, |
| 0.9100466370582581, |
| 0.8915355801582336, |
| 0.02915954403579235, |
| 0.004325248766690493, |
| 0.9999915361404419, |
| 0.9999961853027344, |
| 0.9984298348426819, |
| 0.9361048936843872, |
| 0.7488651871681213, |
| 0.9966148734092712, |
| 0.9871622920036316, |
| 0.41953274607658386, |
| 0.964065432548523, |
| 0.6713405251502991, |
| 0.7432451844215393, |
| 0.5503003597259521, |
| 0.9845474362373352, |
| 0.9991044402122498, |
| 0.9908291101455688, |
| 0.78965824842453, |
| 0.1398678869009018, |
| 0.7981515526771545, |
| 0.9919771552085876, |
| 0.6074525117874146, |
| 0.996113657951355, |
| 0.9997654557228088, |
| 0.9999492168426514, |
| 0.9985866546630859, |
| 0.9999914169311523, |
| 0.9999855756759644, |
| 0.9999876022338867, |
| 0.9762148261070251 |
| ], |
| "eval_code_easy_runtime": 17.1306, |
| "eval_code_easy_samples_per_second": 5.838, |
| "eval_code_easy_steps_per_second": 0.117, |
| "epoch": 0.44, |
| "step": 25 |
| }, |
| { |
| "eval_code_hard_loss": 1.0086419582366943, |
| "eval_code_hard_score": -0.28139397501945496, |
| "eval_code_hard_brier_score": 0.28139397501945496, |
| "eval_code_hard_average_probability": 0.5282384157180786, |
| "eval_code_hard_accuracy": 0.61, |
| "eval_code_hard_probabilities": [ |
| 0.9940557479858398, |
| 0.5578140020370483, |
| 0.4544859528541565, |
| 0.9417738914489746, |
| 0.9485132098197937, |
| 0.9686947464942932, |
| 0.34841597080230713, |
| 0.37181127071380615, |
| 0.25785237550735474, |
| 0.5207318067550659, |
| 0.4167640209197998, |
| 0.43461835384368896, |
| 0.9888814091682434, |
| 0.11123046278953552, |
| 0.15088781714439392, |
| 0.4391879737377167, |
| 0.4488320052623749, |
| 0.48593440651893616, |
| 0.902611255645752, |
| 0.8697171211242676, |
| 0.7664279937744141, |
| 0.5244131684303284, |
| 0.6065243482589722, |
| 0.6952157616615295, |
| 0.6103460192680359, |
| 0.5863346457481384, |
| 0.45322948694229126, |
| 0.15636862814426422, |
| 0.7031698226928711, |
| 0.6602889895439148, |
| 0.6120182275772095, |
| 0.5830819010734558, |
| 0.6418420076370239, |
| 0.6374729871749878, |
| 0.6232181191444397, |
| 0.6474714875221252, |
| 0.7186492085456848, |
| 0.5149539709091187, |
| 0.27517759799957275, |
| 0.5705553293228149, |
| 0.6419432163238525, |
| 0.7602654695510864, |
| 0.6087383031845093, |
| 0.6384655237197876, |
| 0.6501816511154175, |
| 0.7480051517486572, |
| 0.57122802734375, |
| 0.3884866237640381, |
| 0.692376971244812, |
| 0.6024836301803589, |
| 0.591353178024292, |
| 0.43030333518981934, |
| 0.2442779242992401, |
| 0.22508001327514648, |
| 0.0015732977772131562, |
| 0.001636496395803988, |
| 0.0015261240769177675, |
| 0.5446102023124695, |
| 0.5613898038864136, |
| 0.48322516679763794, |
| 0.004009010270237923, |
| 0.003701635170727968, |
| 0.0036944146268069744, |
| 0.5865771174430847, |
| 0.4441525340080261, |
| 0.8783551454544067, |
| 0.3124151825904846, |
| 0.9564208984375, |
| 0.3860621452331543, |
| 0.9370018243789673, |
| 0.8526004552841187, |
| 0.8547378182411194, |
| 0.5418311953544617, |
| 0.4870041012763977, |
| 0.6209992170333862, |
| 0.3137390911579132, |
| 0.1501292884349823, |
| 0.2207321971654892, |
| 0.508880615234375, |
| 0.4939533770084381, |
| 0.5084103345870972, |
| 0.5919321775436401, |
| 0.6774353384971619, |
| 0.5825659036636353, |
| 0.5430614948272705, |
| 0.5601528882980347, |
| 0.6737014651298523, |
| 0.45028504729270935, |
| 0.5943098664283752, |
| 0.4708901345729828, |
| 0.5047590732574463, |
| 0.5815862417221069, |
| 0.5608630776405334, |
| 0.2037791609764099, |
| 0.20710068941116333, |
| 0.1756637841463089, |
| 0.48647746443748474, |
| 0.9042562246322632, |
| 0.706450343132019, |
| 0.6964374780654907 |
| ], |
| "eval_code_hard_runtime": 57.8032, |
| "eval_code_hard_samples_per_second": 1.73, |
| "eval_code_hard_steps_per_second": 0.035, |
| "epoch": 0.44, |
| "step": 25 |
| }, |
| { |
| "loss": 0.1411, |
| "learning_rate": 0.0002, |
| "epoch": 0.46, |
| "step": 26 |
| }, |
| { |
| "loss": 0.2268, |
| "learning_rate": 0.0002, |
| "epoch": 0.47, |
| "step": 27 |
| }, |
| { |
| "loss": 0.1373, |
| "learning_rate": 0.0002, |
| "epoch": 0.49, |
| "step": 28 |
| }, |
| { |
| "loss": 0.2788, |
| "learning_rate": 0.0002, |
| "epoch": 0.51, |
| "step": 29 |
| }, |
| { |
| "loss": 0.0514, |
| "learning_rate": 0.0002, |
| "epoch": 0.53, |
| "step": 30 |
| }, |
| { |
| "loss": 0.174, |
| "learning_rate": 0.0002, |
| "epoch": 0.54, |
| "step": 31 |
| }, |
| { |
| "loss": 0.1099, |
| "learning_rate": 0.0002, |
| "epoch": 0.56, |
| "step": 32 |
| }, |
| { |
| "loss": 0.181, |
| "learning_rate": 0.0002, |
| "epoch": 0.58, |
| "step": 33 |
| }, |
| { |
| "loss": 0.0913, |
| "learning_rate": 0.0002, |
| "epoch": 0.6, |
| "step": 34 |
| }, |
| { |
| "loss": 0.1685, |
| "learning_rate": 0.0002, |
| "epoch": 0.61, |
| "step": 35 |
| }, |
| { |
| "loss": 0.1701, |
| "learning_rate": 0.0002, |
| "epoch": 0.63, |
| "step": 36 |
| }, |
| { |
| "loss": 0.054, |
| "learning_rate": 0.0002, |
| "epoch": 0.65, |
| "step": 37 |
| }, |
| { |
| "loss": 0.0469, |
| "learning_rate": 0.0002, |
| "epoch": 0.67, |
| "step": 38 |
| }, |
| { |
| "loss": 0.0865, |
| "learning_rate": 0.0002, |
| "epoch": 0.68, |
| "step": 39 |
| }, |
| { |
| "loss": 0.1743, |
| "learning_rate": 0.0002, |
| "epoch": 0.7, |
| "step": 40 |
| }, |
| { |
| "loss": 0.072, |
| "learning_rate": 0.0002, |
| "epoch": 0.72, |
| "step": 41 |
| }, |
| { |
| "loss": 0.1192, |
| "learning_rate": 0.0002, |
| "epoch": 0.74, |
| "step": 42 |
| }, |
| { |
| "loss": 0.056, |
| "learning_rate": 0.0002, |
| "epoch": 0.75, |
| "step": 43 |
| }, |
| { |
| "loss": 0.1633, |
| "learning_rate": 0.0002, |
| "epoch": 0.77, |
| "step": 44 |
| }, |
| { |
| "loss": 0.0487, |
| "learning_rate": 0.0002, |
| "epoch": 0.79, |
| "step": 45 |
| }, |
| { |
| "loss": 0.111, |
| "learning_rate": 0.0002, |
| "epoch": 0.81, |
| "step": 46 |
| }, |
| { |
| "loss": 0.0998, |
| "learning_rate": 0.0002, |
| "epoch": 0.82, |
| "step": 47 |
| }, |
| { |
| "loss": 0.162, |
| "learning_rate": 0.0002, |
| "epoch": 0.84, |
| "step": 48 |
| }, |
| { |
| "loss": 0.1508, |
| "learning_rate": 0.0002, |
| "epoch": 0.86, |
| "step": 49 |
| }, |
| { |
| "loss": 0.158, |
| "learning_rate": 0.0002, |
| "epoch": 0.88, |
| "step": 50 |
| }, |
| { |
| "eval_code_easy_loss": 0.26072654128074646, |
| "eval_code_easy_score": -0.07467034459114075, |
| "eval_code_easy_brier_score": 0.07467034459114075, |
| "eval_code_easy_average_probability": 0.8786800503730774, |
| "eval_code_easy_accuracy": 0.91, |
| "eval_code_easy_probabilities": [ |
| 0.993358314037323, |
| 0.9995765089988708, |
| 0.9998908042907715, |
| 0.9999998807907104, |
| 0.9999995231628418, |
| 0.9999985694885254, |
| 0.8484190106391907, |
| 0.9649071097373962, |
| 0.9977992177009583, |
| 0.6331314444541931, |
| 0.7679887413978577, |
| 0.7734430432319641, |
| 0.9972902536392212, |
| 0.9985353946685791, |
| 0.9985615611076355, |
| 0.9800190329551697, |
| 0.9999395608901978, |
| 0.9999872446060181, |
| 0.9737911820411682, |
| 0.36379221081733704, |
| 0.8597760796546936, |
| 1.0, |
| 1.0, |
| 0.9999998807907104, |
| 0.9999985694885254, |
| 0.9999895095825195, |
| 0.9909597635269165, |
| 0.9998130202293396, |
| 0.9994999170303345, |
| 0.9997158646583557, |
| 0.7183305621147156, |
| 0.6560869216918945, |
| 0.5542047023773193, |
| 0.9361991882324219, |
| 0.9441348314285278, |
| 0.7303879261016846, |
| 0.9999759197235107, |
| 0.9999983310699463, |
| 0.9700189828872681, |
| 0.9989641904830933, |
| 0.9984664916992188, |
| 0.9994432330131531, |
| 1.0, |
| 1.0, |
| 0.9999915361404419, |
| 0.3375416696071625, |
| 0.09802956134080887, |
| 0.1487502008676529, |
| 0.9902018904685974, |
| 0.9985565543174744, |
| 0.9950182437896729, |
| 0.147225022315979, |
| 0.9999966621398926, |
| 0.9999779462814331, |
| 0.999680757522583, |
| 0.9997058510780334, |
| 0.9998592138290405, |
| 0.9999998807907104, |
| 0.5950238108634949, |
| 0.999997615814209, |
| 0.999997615814209, |
| 1.0, |
| 0.9999998807907104, |
| 0.9999052286148071, |
| 0.9999927282333374, |
| 0.99998939037323, |
| 0.9201897382736206, |
| 0.9418489933013916, |
| 0.8507129549980164, |
| 0.609320342540741, |
| 0.07032223790884018, |
| 0.003869357518851757, |
| 0.9999988079071045, |
| 0.9999964237213135, |
| 0.999927282333374, |
| 0.9999841451644897, |
| 0.9998486042022705, |
| 0.9999936819076538, |
| 0.9999700784683228, |
| 0.9927895665168762, |
| 0.9999749660491943, |
| 0.9999265670776367, |
| 0.9999915361404419, |
| 0.9663752913475037, |
| 0.7864801287651062, |
| 0.8877244591712952, |
| 0.8446969985961914, |
| 0.968808114528656, |
| 0.03765033930540085, |
| 0.8669968247413635, |
| 0.9999896287918091, |
| 0.6672230958938599, |
| 0.9992057681083679, |
| 0.9999997615814209, |
| 1.0, |
| 0.9999957084655762, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.4983561038970947 |
| ], |
| "eval_code_easy_runtime": 17.1242, |
| "eval_code_easy_samples_per_second": 5.84, |
| "eval_code_easy_steps_per_second": 0.117, |
| "epoch": 0.88, |
| "step": 50 |
| }, |
| { |
| "eval_code_hard_loss": 0.6272040605545044, |
| "eval_code_hard_score": -0.2097242921590805, |
| "eval_code_hard_brier_score": 0.2097242921590805, |
| "eval_code_hard_average_probability": 0.6029007434844971, |
| "eval_code_hard_accuracy": 0.6, |
| "eval_code_hard_probabilities": [ |
| 0.9979154467582703, |
| 0.7335461378097534, |
| 0.4222542941570282, |
| 0.9998534917831421, |
| 0.9998674392700195, |
| 0.9999492168426514, |
| 0.5001015663146973, |
| 0.5079646706581116, |
| 0.5019187927246094, |
| 0.6476748585700989, |
| 0.3486829996109009, |
| 0.38149967789649963, |
| 0.9999423027038574, |
| 0.9999504089355469, |
| 0.9999474287033081, |
| 0.4916134774684906, |
| 0.5060228705406189, |
| 0.49220144748687744, |
| 0.9999898672103882, |
| 0.9999915361404419, |
| 0.9999905824661255, |
| 0.8047722578048706, |
| 0.8523899912834167, |
| 0.8705809116363525, |
| 0.3922067880630493, |
| 0.4324615001678467, |
| 0.3545004725456238, |
| 0.15673233568668365, |
| 0.6471846699714661, |
| 0.6424362063407898, |
| 0.510160505771637, |
| 0.5128241181373596, |
| 0.46828266978263855, |
| 0.43302497267723083, |
| 0.5793876051902771, |
| 0.5684614181518555, |
| 0.33457034826278687, |
| 0.3091184198856354, |
| 0.0008105101296678185, |
| 0.37077412009239197, |
| 0.4145500063896179, |
| 0.4761010408401489, |
| 0.7447249293327332, |
| 0.438394695520401, |
| 0.7413656115531921, |
| 0.4960051476955414, |
| 0.5138289928436279, |
| 0.5173673033714294, |
| 0.5924621820449829, |
| 0.7587030529975891, |
| 0.7857908606529236, |
| 0.3681909143924713, |
| 0.3770434856414795, |
| 0.6424773931503296, |
| 0.9851202368736267, |
| 0.9859110116958618, |
| 0.9855308532714844, |
| 0.5370909571647644, |
| 0.6129180192947388, |
| 0.5251724123954773, |
| 0.9999006986618042, |
| 0.9998983144760132, |
| 0.9998980760574341, |
| 0.8960296511650085, |
| 0.8455232977867126, |
| 0.9984153509140015, |
| 0.44011861085891724, |
| 0.5573714971542358, |
| 0.45769622921943665, |
| 0.5591621994972229, |
| 0.42212074995040894, |
| 0.5001301765441895, |
| 0.4822878837585449, |
| 0.7320272326469421, |
| 0.6362009048461914, |
| 0.429107666015625, |
| 0.41713282465934753, |
| 0.4034157991409302, |
| 0.5436654686927795, |
| 0.47678494453430176, |
| 0.5470160245895386, |
| 0.5428171157836914, |
| 0.5227158665657043, |
| 0.5470259785652161, |
| 0.4163595139980316, |
| 0.35028159618377686, |
| 0.5244665145874023, |
| 0.40996211767196655, |
| 0.9096313714981079, |
| 0.37183111906051636, |
| 0.47767525911331177, |
| 0.47421643137931824, |
| 0.46094876527786255, |
| 0.47423312067985535, |
| 0.4818762242794037, |
| 0.4068610668182373, |
| 0.497257262468338, |
| 0.559116542339325, |
| 0.5229799747467041, |
| 0.725604772567749 |
| ], |
| "eval_code_hard_runtime": 57.8139, |
| "eval_code_hard_samples_per_second": 1.73, |
| "eval_code_hard_steps_per_second": 0.035, |
| "epoch": 0.88, |
| "step": 50 |
| }, |
| { |
| "loss": 0.1258, |
| "learning_rate": 0.0002, |
| "epoch": 0.89, |
| "step": 51 |
| }, |
| { |
| "loss": 0.0618, |
| "learning_rate": 0.0002, |
| "epoch": 0.91, |
| "step": 52 |
| }, |
| { |
| "loss": 0.2478, |
| "learning_rate": 0.0002, |
| "epoch": 0.93, |
| "step": 53 |
| }, |
| { |
| "loss": 0.4399, |
| "learning_rate": 0.0002, |
| "epoch": 0.95, |
| "step": 54 |
| }, |
| { |
| "loss": 0.1653, |
| "learning_rate": 0.0002, |
| "epoch": 0.96, |
| "step": 55 |
| }, |
| { |
| "loss": 0.0441, |
| "learning_rate": 0.0002, |
| "epoch": 0.98, |
| "step": 56 |
| }, |
| { |
| "loss": 0.0223, |
| "learning_rate": 0.0002, |
| "epoch": 1.0, |
| "step": 57 |
| }, |
| { |
| "loss": 0.0056, |
| "learning_rate": 0.0002, |
| "epoch": 1.02, |
| "step": 58 |
| }, |
| { |
| "loss": 0.1784, |
| "learning_rate": 0.0002, |
| "epoch": 1.04, |
| "step": 59 |
| }, |
| { |
| "loss": 0.0642, |
| "learning_rate": 0.0002, |
| "epoch": 1.05, |
| "step": 60 |
| }, |
| { |
| "loss": 0.1516, |
| "learning_rate": 0.0002, |
| "epoch": 1.07, |
| "step": 61 |
| }, |
| { |
| "loss": 0.0548, |
| "learning_rate": 0.0002, |
| "epoch": 1.09, |
| "step": 62 |
| }, |
| { |
| "loss": 0.0663, |
| "learning_rate": 0.0002, |
| "epoch": 1.11, |
| "step": 63 |
| }, |
| { |
| "loss": 0.1384, |
| "learning_rate": 0.0002, |
| "epoch": 1.12, |
| "step": 64 |
| }, |
| { |
| "loss": 0.0505, |
| "learning_rate": 0.0002, |
| "epoch": 1.14, |
| "step": 65 |
| }, |
| { |
| "loss": 0.0631, |
| "learning_rate": 0.0002, |
| "epoch": 1.16, |
| "step": 66 |
| }, |
| { |
| "loss": 0.0532, |
| "learning_rate": 0.0002, |
| "epoch": 1.18, |
| "step": 67 |
| }, |
| { |
| "loss": 0.028, |
| "learning_rate": 0.0002, |
| "epoch": 1.19, |
| "step": 68 |
| }, |
| { |
| "loss": 0.0891, |
| "learning_rate": 0.0002, |
| "epoch": 1.21, |
| "step": 69 |
| }, |
| { |
| "loss": 0.0735, |
| "learning_rate": 0.0002, |
| "epoch": 1.23, |
| "step": 70 |
| }, |
| { |
| "loss": 0.0397, |
| "learning_rate": 0.0002, |
| "epoch": 1.25, |
| "step": 71 |
| }, |
| { |
| "loss": 0.0342, |
| "learning_rate": 0.0002, |
| "epoch": 1.26, |
| "step": 72 |
| }, |
| { |
| "loss": 0.0234, |
| "learning_rate": 0.0002, |
| "epoch": 1.28, |
| "step": 73 |
| }, |
| { |
| "loss": 0.0108, |
| "learning_rate": 0.0002, |
| "epoch": 1.3, |
| "step": 74 |
| }, |
| { |
| "loss": 0.0525, |
| "learning_rate": 0.0002, |
| "epoch": 1.32, |
| "step": 75 |
| }, |
| { |
| "eval_code_easy_loss": 0.22187194228172302, |
| "eval_code_easy_score": -0.044156476855278015, |
| "eval_code_easy_brier_score": 0.044156476855278015, |
| "eval_code_easy_average_probability": 0.9226246476173401, |
| "eval_code_easy_accuracy": 0.95, |
| "eval_code_easy_probabilities": [ |
| 0.9997438788414001, |
| 0.9999991655349731, |
| 0.9999997615814209, |
| 0.9999998807907104, |
| 0.9999997615814209, |
| 0.9999947547912598, |
| 0.8262179493904114, |
| 0.9995021820068359, |
| 0.998319685459137, |
| 0.988502025604248, |
| 0.9749259352684021, |
| 0.9808527827262878, |
| 0.9996113181114197, |
| 0.9993595480918884, |
| 0.9999059438705444, |
| 0.9027615189552307, |
| 0.9773653745651245, |
| 0.9999016523361206, |
| 0.9789873957633972, |
| 0.45622462034225464, |
| 0.9388629198074341, |
| 1.0, |
| 1.0, |
| 0.9999997615814209, |
| 0.9999998807907104, |
| 0.9999997615814209, |
| 0.9993877410888672, |
| 1.0, |
| 0.9999998807907104, |
| 0.9999998807907104, |
| 0.7212077379226685, |
| 0.7462506294250488, |
| 0.5923525094985962, |
| 0.9379615187644958, |
| 0.9973413348197937, |
| 0.881181001663208, |
| 0.9957089424133301, |
| 0.9999865293502808, |
| 0.9746310114860535, |
| 0.9999599456787109, |
| 0.9995377063751221, |
| 0.9997233748435974, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.7736052870750427, |
| 0.15912780165672302, |
| 0.6213001608848572, |
| 0.9973452687263489, |
| 0.9999977350234985, |
| 0.9999613761901855, |
| 0.5660737752914429, |
| 1.0, |
| 0.9999997615814209, |
| 0.999991774559021, |
| 0.9999953508377075, |
| 0.999993085861206, |
| 0.9999995231628418, |
| 0.6532827615737915, |
| 0.999998927116394, |
| 0.9999794960021973, |
| 0.9999988079071045, |
| 0.999998927116394, |
| 0.9999998807907104, |
| 1.0, |
| 1.0, |
| 0.997825026512146, |
| 0.999733030796051, |
| 0.9979919195175171, |
| 0.7770313024520874, |
| 0.011424303986132145, |
| 9.0804387582466e-05, |
| 1.0, |
| 1.0, |
| 0.9999986886978149, |
| 0.99936443567276, |
| 0.9927093982696533, |
| 0.9999185800552368, |
| 0.9999991655349731, |
| 0.9982544779777527, |
| 0.9999996423721313, |
| 0.9998847246170044, |
| 0.9999909400939941, |
| 0.9689223766326904, |
| 0.9911876916885376, |
| 0.9976316690444946, |
| 0.9958218336105347, |
| 0.993769109249115, |
| 0.40141063928604126, |
| 0.8972048759460449, |
| 0.9999942779541016, |
| 0.6255294680595398, |
| 0.9922812581062317, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9875762462615967 |
| ], |
| "eval_code_easy_runtime": 17.1185, |
| "eval_code_easy_samples_per_second": 5.842, |
| "eval_code_easy_steps_per_second": 0.117, |
| "epoch": 1.32, |
| "step": 75 |
| }, |
| { |
| "eval_code_hard_loss": 0.613934338092804, |
| "eval_code_hard_score": -0.20562565326690674, |
| "eval_code_hard_brier_score": 0.20562565326690674, |
| "eval_code_hard_average_probability": 0.6201408505439758, |
| "eval_code_hard_accuracy": 0.68, |
| "eval_code_hard_probabilities": [ |
| 0.9997522234916687, |
| 0.6726481318473816, |
| 0.4837990403175354, |
| 0.9999945163726807, |
| 0.9999929666519165, |
| 0.9999992847442627, |
| 0.5199088454246521, |
| 0.5684794783592224, |
| 0.5020670890808105, |
| 0.6793079376220703, |
| 0.3110067546367645, |
| 0.4360009431838989, |
| 0.999996542930603, |
| 0.9999467134475708, |
| 0.9999498128890991, |
| 0.5130871534347534, |
| 0.5327062010765076, |
| 0.5177708864212036, |
| 0.9999998807907104, |
| 0.9999998807907104, |
| 0.9999998807907104, |
| 0.8731643557548523, |
| 0.9360027313232422, |
| 0.9267758727073669, |
| 0.35389643907546997, |
| 0.39809563755989075, |
| 0.20879632234573364, |
| 0.07375767827033997, |
| 0.5250951051712036, |
| 0.5149143934249878, |
| 0.7871077656745911, |
| 0.7780881524085999, |
| 0.6657141447067261, |
| 0.5761507749557495, |
| 0.758147120475769, |
| 0.6872865557670593, |
| 0.29255661368370056, |
| 0.1509549617767334, |
| 0.004953588359057903, |
| 0.3843843936920166, |
| 0.4454701542854309, |
| 0.5638160705566406, |
| 0.6067726612091064, |
| 0.3357914388179779, |
| 0.5700987577438354, |
| 0.8174778819084167, |
| 0.5854097008705139, |
| 0.5972737073898315, |
| 0.6639817953109741, |
| 0.8354654908180237, |
| 0.8449712991714478, |
| 0.35150453448295593, |
| 0.25781506299972534, |
| 0.7074410319328308, |
| 0.9738778471946716, |
| 0.9760010242462158, |
| 0.9789164066314697, |
| 0.5705886483192444, |
| 0.642711341381073, |
| 0.5328339338302612, |
| 0.999995231628418, |
| 0.9999946355819702, |
| 0.9999946355819702, |
| 0.9326982498168945, |
| 0.7097592353820801, |
| 0.9997654557228088, |
| 0.446959525346756, |
| 0.6458287835121155, |
| 0.47074800729751587, |
| 0.6868018507957458, |
| 0.5448780059814453, |
| 0.5729479789733887, |
| 0.4683343768119812, |
| 0.570155918598175, |
| 0.5829461216926575, |
| 0.4596071243286133, |
| 0.407598614692688, |
| 0.38017627596855164, |
| 0.5608930587768555, |
| 0.49683383107185364, |
| 0.600445568561554, |
| 0.6426953077316284, |
| 0.8385844826698303, |
| 0.6047258377075195, |
| 0.2799336314201355, |
| 0.2773086130619049, |
| 0.6116948127746582, |
| 0.43185508251190186, |
| 0.8329448103904724, |
| 0.4886557459831238, |
| 0.4926038086414337, |
| 0.4693112373352051, |
| 0.4659242630004883, |
| 0.321489155292511, |
| 0.3335782587528229, |
| 0.1558743566274643, |
| 0.5026931762695312, |
| 0.7897409200668335, |
| 0.5024547576904297, |
| 0.9441749453544617 |
| ], |
| "eval_code_hard_runtime": 57.778, |
| "eval_code_hard_samples_per_second": 1.731, |
| "eval_code_hard_steps_per_second": 0.035, |
| "epoch": 1.32, |
| "step": 75 |
| }, |
| { |
| "loss": 0.0344, |
| "learning_rate": 0.0002, |
| "epoch": 1.33, |
| "step": 76 |
| }, |
| { |
| "loss": 0.0514, |
| "learning_rate": 0.0002, |
| "epoch": 1.35, |
| "step": 77 |
| }, |
| { |
| "loss": 0.0065, |
| "learning_rate": 0.0002, |
| "epoch": 1.37, |
| "step": 78 |
| }, |
| { |
| "loss": 0.0893, |
| "learning_rate": 0.0002, |
| "epoch": 1.39, |
| "step": 79 |
| }, |
| { |
| "loss": 0.0431, |
| "learning_rate": 0.0002, |
| "epoch": 1.4, |
| "step": 80 |
| }, |
| { |
| "loss": 0.0101, |
| "learning_rate": 0.0002, |
| "epoch": 1.42, |
| "step": 81 |
| }, |
| { |
| "loss": 0.0622, |
| "learning_rate": 0.0002, |
| "epoch": 1.44, |
| "step": 82 |
| }, |
| { |
| "loss": 0.0007, |
| "learning_rate": 0.0002, |
| "epoch": 1.46, |
| "step": 83 |
| }, |
| { |
| "loss": 0.0084, |
| "learning_rate": 0.0002, |
| "epoch": 1.47, |
| "step": 84 |
| }, |
| { |
| "loss": 0.0307, |
| "learning_rate": 0.0002, |
| "epoch": 1.49, |
| "step": 85 |
| }, |
| { |
| "loss": 0.0005, |
| "learning_rate": 0.0002, |
| "epoch": 1.51, |
| "step": 86 |
| }, |
| { |
| "loss": 0.001, |
| "learning_rate": 0.0002, |
| "epoch": 1.53, |
| "step": 87 |
| }, |
| { |
| "loss": 0.0243, |
| "learning_rate": 0.0002, |
| "epoch": 1.54, |
| "step": 88 |
| }, |
| { |
| "loss": 0.0417, |
| "learning_rate": 0.0002, |
| "epoch": 1.56, |
| "step": 89 |
| }, |
| { |
| "loss": 0.0418, |
| "learning_rate": 0.0002, |
| "epoch": 1.58, |
| "step": 90 |
| }, |
| { |
| "loss": 0.0207, |
| "learning_rate": 0.0002, |
| "epoch": 1.6, |
| "step": 91 |
| }, |
| { |
| "loss": 0.2464, |
| "learning_rate": 0.0002, |
| "epoch": 1.61, |
| "step": 92 |
| }, |
| { |
| "loss": 0.1456, |
| "learning_rate": 0.0002, |
| "epoch": 1.63, |
| "step": 93 |
| }, |
| { |
| "loss": 0.0005, |
| "learning_rate": 0.0002, |
| "epoch": 1.65, |
| "step": 94 |
| }, |
| { |
| "loss": 0.0025, |
| "learning_rate": 0.0002, |
| "epoch": 1.67, |
| "step": 95 |
| }, |
| { |
| "loss": 0.0456, |
| "learning_rate": 0.0002, |
| "epoch": 1.68, |
| "step": 96 |
| }, |
| { |
| "loss": 0.0069, |
| "learning_rate": 0.0002, |
| "epoch": 1.7, |
| "step": 97 |
| }, |
| { |
| "loss": 0.0092, |
| "learning_rate": 0.0002, |
| "epoch": 1.72, |
| "step": 98 |
| }, |
| { |
| "loss": 0.1516, |
| "learning_rate": 0.0002, |
| "epoch": 1.74, |
| "step": 99 |
| }, |
| { |
| "loss": 0.0164, |
| "learning_rate": 0.0002, |
| "epoch": 1.75, |
| "step": 100 |
| }, |
| { |
| "eval_code_easy_loss": 0.37038832902908325, |
| "eval_code_easy_score": -0.03134830296039581, |
| "eval_code_easy_brier_score": 0.03134830296039581, |
| "eval_code_easy_average_probability": 0.9487545490264893, |
| "eval_code_easy_accuracy": 0.97, |
| "eval_code_easy_probabilities": [ |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999997615814209, |
| 0.9346917271614075, |
| 1.0, |
| 0.9999998807907104, |
| 0.9997040629386902, |
| 0.9992467164993286, |
| 0.9994949102401733, |
| 0.9994587302207947, |
| 0.9999791383743286, |
| 0.9999996423721313, |
| 0.9992595314979553, |
| 0.9999998807907104, |
| 1.0, |
| 0.9998413324356079, |
| 0.6475287675857544, |
| 0.9992796778678894, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.8477630615234375, |
| 0.863884687423706, |
| 0.5967232584953308, |
| 0.8738592267036438, |
| 0.9956537485122681, |
| 0.7420057058334351, |
| 0.9940522313117981, |
| 1.0, |
| 0.9952139854431152, |
| 0.9999994039535522, |
| 1.0, |
| 0.9999545812606812, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9897578954696655, |
| 0.2987537980079651, |
| 0.9979766011238098, |
| 0.9999840259552002, |
| 1.0, |
| 1.0, |
| 0.9765376448631287, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.7584323883056641, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999982118606567, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9797248840332031, |
| 1.8104368791682646e-05, |
| 2.9319591199339357e-10, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9998795986175537, |
| 1.0, |
| 1.0, |
| 0.9999961853027344, |
| 1.0, |
| 0.9750629663467407, |
| 0.9934146404266357, |
| 0.9500468969345093, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.9999947547912598, |
| 0.843275785446167, |
| 0.9999544620513916, |
| 1.0, |
| 0.6250555515289307, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.999996542930603 |
| ], |
| "eval_code_easy_runtime": 17.1259, |
| "eval_code_easy_samples_per_second": 5.839, |
| "eval_code_easy_steps_per_second": 0.117, |
| "epoch": 1.75, |
| "step": 100 |
| }, |
| { |
| "eval_code_hard_loss": 1.3108476400375366, |
| "eval_code_hard_score": -0.238570898771286, |
| "eval_code_hard_brier_score": 0.238570898771286, |
| "eval_code_hard_average_probability": 0.637829601764679, |
| "eval_code_hard_accuracy": 0.69, |
| "eval_code_hard_probabilities": [ |
| 1.0, |
| 0.8749839663505554, |
| 0.6682276129722595, |
| 1.0, |
| 1.0, |
| 1.0, |
| 0.4749336838722229, |
| 0.7184466123580933, |
| 0.4824881851673126, |
| 0.7342566251754761, |
| 0.34355923533439636, |
| 0.3212933838367462, |
| 0.999998927116394, |
| 0.11708329617977142, |
| 0.2533932030200958, |
| 0.4083555340766907, |
| 0.49011072516441345, |
| 0.5354903340339661, |
| 0.9999998807907104, |
| 0.9999995231628418, |
| 0.9999921321868896, |
| 0.9668300151824951, |
| 0.9995100498199463, |
| 0.9995787739753723, |
| 0.5743376612663269, |
| 0.6365594267845154, |
| 0.19516201317310333, |
| 5.900204200770531e-07, |
| 0.6282064914703369, |
| 0.6691750884056091, |
| 0.9999256134033203, |
| 0.9999665021896362, |
| 0.9993390440940857, |
| 0.9999998807907104, |
| 0.9648662805557251, |
| 0.7553066611289978, |
| 0.15391865372657776, |
| 0.0059105814434587955, |
| 0.0041419873014092445, |
| 0.6582466959953308, |
| 0.6763702630996704, |
| 0.8389391303062439, |
| 0.8646246194839478, |
| 0.7645048499107361, |
| 0.873203456401825, |
| 0.9956676959991455, |
| 0.6906198263168335, |
| 0.7347480058670044, |
| 0.9999996423721313, |
| 0.9999585151672363, |
| 0.9992007613182068, |
| 0.034449804574251175, |
| 0.01096381526440382, |
| 0.8154931664466858, |
| 3.0823147767478076e-07, |
| 3.748235144485079e-07, |
| 3.7546107023445074e-07, |
| 0.507102370262146, |
| 0.7094148397445679, |
| 0.6129729151725769, |
| 0.8193482756614685, |
| 0.6906271576881409, |
| 0.7478002905845642, |
| 0.9924389123916626, |
| 0.7537370324134827, |
| 1.0, |
| 0.33823978900909424, |
| 0.8392996788024902, |
| 0.33018726110458374, |
| 0.9978412389755249, |
| 0.9927680492401123, |
| 0.9661868214607239, |
| 0.739952027797699, |
| 0.757354199886322, |
| 0.8434256911277771, |
| 0.5655504465103149, |
| 0.09736324101686478, |
| 0.15342624485492706, |
| 0.5846419930458069, |
| 0.5172314047813416, |
| 0.7640779614448547, |
| 0.7927785515785217, |
| 0.9958668947219849, |
| 0.6929405331611633, |
| 0.4140860140323639, |
| 0.4588907063007355, |
| 0.8826824426651001, |
| 0.4302871525287628, |
| 0.8620820045471191, |
| 0.5388514995574951, |
| 0.49043917655944824, |
| 0.4464437961578369, |
| 0.5461203455924988, |
| 0.01837478019297123, |
| 0.01984582096338272, |
| 0.0083817383274436, |
| 0.417593389749527, |
| 0.9964190721511841, |
| 0.5195274949073792, |
| 0.9980224370956421 |
| ], |
| "eval_code_hard_runtime": 57.8261, |
| "eval_code_hard_samples_per_second": 1.729, |
| "eval_code_hard_steps_per_second": 0.035, |
| "epoch": 1.75, |
| "step": 100 |
| }, |
| { |
| "train_runtime": 1718.4456, |
| "train_samples_per_second": 1.862, |
| "train_steps_per_second": 0.058, |
| "total_flos": 0.0, |
| "train_loss": 0.1626638910168549, |
| "epoch": 1.75, |
| "step": 100 |
| } |
| ] |