[ { "loss": 2.319, "learning_rate": 0.0002, "epoch": 0.05, "step": 1 }, { "loss": 1.1571, "learning_rate": 0.0002, "epoch": 0.11, "step": 2 }, { "loss": 0.8951, "learning_rate": 0.0002, "epoch": 0.16, "step": 3 }, { "loss": 0.7019, "learning_rate": 0.0002, "epoch": 0.21, "step": 4 }, { "loss": 0.6999, "learning_rate": 0.0002, "epoch": 0.26, "step": 5 }, { "loss": 0.7884, "learning_rate": 0.0002, "epoch": 0.32, "step": 6 }, { "loss": 0.6625, "learning_rate": 0.0002, "epoch": 0.37, "step": 7 }, { "loss": 0.6943, "learning_rate": 0.0002, "epoch": 0.42, "step": 8 }, { "loss": 0.7418, "learning_rate": 0.0002, "epoch": 0.47, "step": 9 }, { "loss": 0.6976, "learning_rate": 0.0002, "epoch": 0.53, "step": 10 }, { "loss": 0.7081, "learning_rate": 0.0002, "epoch": 0.58, "step": 11 }, { "loss": 0.6817, "learning_rate": 0.0002, "epoch": 0.63, "step": 12 }, { "loss": 0.6799, "learning_rate": 0.0002, "epoch": 0.68, "step": 13 }, { "loss": 0.7014, "learning_rate": 0.0002, "epoch": 0.74, "step": 14 }, { "loss": 0.7207, "learning_rate": 0.0002, "epoch": 0.79, "step": 15 }, { "loss": 0.681, "learning_rate": 0.0002, "epoch": 0.84, "step": 16 }, { "loss": 0.7092, "learning_rate": 0.0002, "epoch": 0.89, "step": 17 }, { "loss": 0.691, "learning_rate": 0.0002, "epoch": 0.95, "step": 18 }, { "loss": 0.6796, "learning_rate": 0.0002, "epoch": 1.0, "step": 19 }, { "loss": 0.7201, "learning_rate": 0.0002, "epoch": 1.05, "step": 20 }, { "loss": 0.6609, "learning_rate": 0.0002, "epoch": 1.11, "step": 21 }, { "loss": 0.716, "learning_rate": 0.0002, "epoch": 1.16, "step": 22 }, { "loss": 0.7015, "learning_rate": 0.0002, "epoch": 1.21, "step": 23 }, { "loss": 0.7698, "learning_rate": 0.0002, "epoch": 1.26, "step": 24 }, { "loss": 0.7193, "learning_rate": 0.0002, "epoch": 1.32, "step": 25 }, { "eval_code_is_correct_loss": 0.7040590047836304, "eval_code_is_correct_score": -0.25534066557884216, "eval_code_is_correct_brier_score": 0.25534066557884216, "eval_code_is_correct_average_probability": 0.4964892268180847, "eval_code_is_correct_accuracy": 0.48, "eval_code_is_correct_probabilities": [ 0.537757158279419, 0.45456114411354065, 0.46773606538772583, 0.5088943839073181, 0.44396457076072693, 0.5441208481788635, 0.46894216537475586, 0.5342907905578613, 0.5333516001701355, 0.543117105960846, 0.4494006931781769, 0.5351378321647644, 0.5340185761451721, 0.5496283173561096, 0.46146854758262634, 0.46118637919425964, 0.47490179538726807, 0.54707932472229, 0.4630311131477356, 0.46271002292633057, 0.553754448890686, 0.45833271741867065, 0.44106921553611755, 0.5405190587043762, 0.5340151786804199, 0.538471519947052, 0.44194644689559937, 0.4529338479042053, 0.46126678586006165, 0.547139585018158, 0.4498041272163391, 0.4580332040786743, 0.5330279469490051, 0.47573158144950867, 0.4609244763851166, 0.5373966693878174, 0.4560283422470093, 0.45565375685691833, 0.4430266320705414, 0.5496351718902588, 0.46626290678977966, 0.5276714563369751, 0.5368297696113586, 0.4585987329483032, 0.4506687819957733, 0.48509010672569275, 0.5378000736236572, 0.5482139587402344, 0.53798508644104, 0.5404862761497498, 0.5462475419044495, 0.5316811203956604, 0.545008659362793, 0.4452662467956543, 0.46562960743904114, 0.4650121331214905, 0.5360617637634277, 0.4509516656398773, 0.44952070713043213, 0.4582957625389099, 0.4517310857772827, 0.4437441825866699, 0.4606005549430847, 0.547730028629303, 0.4598681926727295, 0.46059927344322205, 0.4745525121688843, 0.5424997210502625, 0.5405730605125427, 0.5450511574745178, 0.4547448456287384, 0.5489879846572876, 0.5354413986206055, 0.4355437159538269, 0.5529230833053589, 0.44915857911109924, 0.44940751791000366, 0.4544369876384735, 0.45526307821273804, 0.5274561047554016, 0.44203782081604004, 0.4448660910129547, 0.520516574382782, 0.5427135825157166, 0.4694376587867737, 0.45909956097602844, 0.46876445412635803, 0.5469857454299927, 0.5509116053581238, 0.4485166072845459, 0.5540351867675781, 0.5366657972335815, 0.5381718277931213, 0.539725661277771, 0.5412744879722595, 0.5397677421569824, 0.5319379568099976, 0.5362846255302429, 0.45564961433410645, 0.44395512342453003 ], "eval_code_is_correct_runtime": 38.6775, "eval_code_is_correct_samples_per_second": 2.585, "eval_code_is_correct_steps_per_second": 0.052, "epoch": 1.32, "step": 25 }, { "loss": 0.6893, "learning_rate": 0.0002, "epoch": 1.37, "step": 26 }, { "loss": 0.6885, "learning_rate": 0.0002, "epoch": 1.42, "step": 27 }, { "loss": 0.6805, "learning_rate": 0.0002, "epoch": 1.47, "step": 28 }, { "loss": 0.7027, "learning_rate": 0.0002, "epoch": 1.53, "step": 29 }, { "loss": 0.7283, "learning_rate": 0.0002, "epoch": 1.58, "step": 30 }, { "loss": 0.6708, "learning_rate": 0.0002, "epoch": 1.63, "step": 31 }, { "loss": 0.7083, "learning_rate": 0.0002, "epoch": 1.68, "step": 32 }, { "loss": 0.7336, "learning_rate": 0.0002, "epoch": 1.74, "step": 33 }, { "loss": 0.7028, "learning_rate": 0.0002, "epoch": 1.79, "step": 34 }, { "loss": 0.695, "learning_rate": 0.0002, "epoch": 1.84, "step": 35 }, { "loss": 0.6997, "learning_rate": 0.0002, "epoch": 1.89, "step": 36 }, { "loss": 0.6743, "learning_rate": 0.0002, "epoch": 1.95, "step": 37 }, { "loss": 0.7388, "learning_rate": 0.0002, "epoch": 2.0, "step": 38 }, { "loss": 0.6464, "learning_rate": 0.0002, "epoch": 2.05, "step": 39 }, { "loss": 0.6772, "learning_rate": 0.0002, "epoch": 2.11, "step": 40 }, { "loss": 0.7009, "learning_rate": 0.0002, "epoch": 2.16, "step": 41 }, { "loss": 0.7021, "learning_rate": 0.0002, "epoch": 2.21, "step": 42 }, { "loss": 0.7051, "learning_rate": 0.0002, "epoch": 2.26, "step": 43 }, { "loss": 0.6816, "learning_rate": 0.0002, "epoch": 2.32, "step": 44 }, { "loss": 0.7047, "learning_rate": 0.0002, "epoch": 2.37, "step": 45 }, { "loss": 0.683, "learning_rate": 0.0002, "epoch": 2.42, "step": 46 }, { "loss": 0.6875, "learning_rate": 0.0002, "epoch": 2.47, "step": 47 }, { "loss": 0.6723, "learning_rate": 0.0002, "epoch": 2.53, "step": 48 }, { "loss": 0.6727, "learning_rate": 0.0002, "epoch": 2.58, "step": 49 }, { "loss": 0.6683, "learning_rate": 0.0002, "epoch": 2.63, "step": 50 }, { "eval_code_is_correct_loss": 0.6990968585014343, "eval_code_is_correct_score": -0.2527521252632141, "eval_code_is_correct_brier_score": 0.2527521252632141, "eval_code_is_correct_average_probability": 0.5049085021018982, "eval_code_is_correct_accuracy": 0.52, "eval_code_is_correct_probabilities": [ 0.4113783538341522, 0.5813317894935608, 0.5584416389465332, 0.41934269666671753, 0.5603463053703308, 0.4234032928943634, 0.5691850781440735, 0.45391106605529785, 0.41783419251441956, 0.3891553580760956, 0.5918279886245728, 0.39812296628952026, 0.3982398509979248, 0.4082736074924469, 0.5677108764648438, 0.6011993885040283, 0.5879720449447632, 0.3799493908882141, 0.6072862148284912, 0.5974151492118835, 0.41310346126556396, 0.563809871673584, 0.5413035750389099, 0.4107910394668579, 0.39933568239212036, 0.4007815718650818, 0.5928361415863037, 0.5920814871788025, 0.5649393200874329, 0.4397546648979187, 0.5982930660247803, 0.5736469030380249, 0.38247016072273254, 0.6029582023620605, 0.6050556302070618, 0.4481448829174042, 0.5958505272865295, 0.5872756838798523, 0.5685001015663147, 0.4170364737510681, 0.5979400873184204, 0.41077008843421936, 0.4539501667022705, 0.5808403491973877, 0.5866948962211609, 0.5965925455093384, 0.40257659554481506, 0.41161125898361206, 0.3845840096473694, 0.4100808799266815, 0.41701117157936096, 0.44743281602859497, 0.3830299377441406, 0.5776842832565308, 0.602536141872406, 0.6121425628662109, 0.4026949107646942, 0.6027580499649048, 0.5705916285514832, 0.5934571623802185, 0.5883546471595764, 0.5897589325904846, 0.5788743495941162, 0.42781656980514526, 0.6336899399757385, 0.5650004148483276, 0.5743370056152344, 0.4256901144981384, 0.4294798672199249, 0.4059537351131439, 0.5902615189552307, 0.4481872022151947, 0.46126502752304077, 0.5778518915176392, 0.409288614988327, 0.5872939229011536, 0.553527295589447, 0.6006361246109009, 0.6073405146598816, 0.3934749662876129, 0.5734230279922485, 0.5781282782554626, 0.4140267074108124, 0.4379793703556061, 0.5872884392738342, 0.5996562242507935, 0.6247859001159668, 0.42214199900627136, 0.4056937098503113, 0.5941511392593384, 0.4240345358848572, 0.3906824290752411, 0.4487050473690033, 0.4064308702945709, 0.4991621673107147, 0.3930267095565796, 0.4262542128562927, 0.39416787028312683, 0.6034715175628662, 0.5542858839035034 ], "eval_code_is_correct_runtime": 38.6577, "eval_code_is_correct_samples_per_second": 2.587, "eval_code_is_correct_steps_per_second": 0.052, "epoch": 2.63, "step": 50 }, { "loss": 0.6992, "learning_rate": 0.0002, "epoch": 2.68, "step": 51 }, { "loss": 0.7576, "learning_rate": 0.0002, "epoch": 2.74, "step": 52 }, { "loss": 0.6925, "learning_rate": 0.0002, "epoch": 2.79, "step": 53 }, { "loss": 0.6884, "learning_rate": 0.0002, "epoch": 2.84, "step": 54 }, { "loss": 0.6555, "learning_rate": 0.0002, "epoch": 2.89, "step": 55 }, { "loss": 0.7276, "learning_rate": 0.0002, "epoch": 2.95, "step": 56 }, { "loss": 0.6827, "learning_rate": 0.0002, "epoch": 3.0, "step": 57 }, { "loss": 0.6291, "learning_rate": 0.0002, "epoch": 3.05, "step": 58 }, { "loss": 0.7595, "learning_rate": 0.0002, "epoch": 3.11, "step": 59 }, { "loss": 0.6753, "learning_rate": 0.0002, "epoch": 3.16, "step": 60 }, { "loss": 0.7555, "learning_rate": 0.0002, "epoch": 3.21, "step": 61 }, { "loss": 0.6965, "learning_rate": 0.0002, "epoch": 3.26, "step": 62 }, { "loss": 0.6775, "learning_rate": 0.0002, "epoch": 3.32, "step": 63 }, { "loss": 0.6841, "learning_rate": 0.0002, "epoch": 3.37, "step": 64 }, { "loss": 0.6706, "learning_rate": 0.0002, "epoch": 3.42, "step": 65 }, { "loss": 0.7128, "learning_rate": 0.0002, "epoch": 3.47, "step": 66 }, { "loss": 0.7036, "learning_rate": 0.0002, "epoch": 3.53, "step": 67 }, { "loss": 0.67, "learning_rate": 0.0002, "epoch": 3.58, "step": 68 }, { "loss": 0.6816, "learning_rate": 0.0002, "epoch": 3.63, "step": 69 }, { "loss": 0.6635, "learning_rate": 0.0002, "epoch": 3.68, "step": 70 }, { "loss": 0.6457, "learning_rate": 0.0002, "epoch": 3.74, "step": 71 }, { "loss": 0.6369, "learning_rate": 0.0002, "epoch": 3.79, "step": 72 }, { "loss": 0.6955, "learning_rate": 0.0002, "epoch": 3.84, "step": 73 }, { "loss": 0.6937, "learning_rate": 0.0002, "epoch": 3.89, "step": 74 }, { "loss": 0.6842, "learning_rate": 0.0002, "epoch": 3.95, "step": 75 }, { "eval_code_is_correct_loss": 0.7020106315612793, "eval_code_is_correct_score": -0.2538911998271942, "eval_code_is_correct_brier_score": 0.2538911998271942, "eval_code_is_correct_average_probability": 0.502829372882843, "eval_code_is_correct_accuracy": 0.45, "eval_code_is_correct_probabilities": [ 0.5088492035865784, 0.4741206467151642, 0.4018367826938629, 0.49836266040802, 0.3702163100242615, 0.6138777732849121, 0.43586498498916626, 0.6494307518005371, 0.5666269063949585, 0.5525698065757751, 0.3989929258823395, 0.49194008111953735, 0.5326002836227417, 0.5366830825805664, 0.42133161425590515, 0.42769843339920044, 0.44886454939842224, 0.4730355739593506, 0.48204565048217773, 0.4801846444606781, 0.5868195295333862, 0.4399736523628235, 0.3782220780849457, 0.5690118074417114, 0.5845021605491638, 0.5171434283256531, 0.41184958815574646, 0.4574517011642456, 0.41264650225639343, 0.6442864537239075, 0.48700496554374695, 0.3954983949661255, 0.4781593382358551, 0.43342939019203186, 0.4707704186439514, 0.5405588746070862, 0.4150758981704712, 0.4007004499435425, 0.34886103868484497, 0.5174517631530762, 0.47847726941108704, 0.548160970211029, 0.7044894099235535, 0.45586660504341125, 0.4582586884498596, 0.5384201407432556, 0.5183372497558594, 0.5092693567276001, 0.5427851676940918, 0.5732136964797974, 0.5735348463058472, 0.6746758818626404, 0.49393337965011597, 0.42578810453414917, 0.4929383099079132, 0.4470900893211365, 0.574955940246582, 0.4823959767818451, 0.3653642237186432, 0.46867260336875916, 0.42166757583618164, 0.47335392236709595, 0.4112188518047333, 0.6188163757324219, 0.5855951905250549, 0.47489026188850403, 0.45155712962150574, 0.6093342900276184, 0.605854868888855, 0.562972903251648, 0.4357713460922241, 0.598077118396759, 0.5654999613761902, 0.43106329441070557, 0.5422348976135254, 0.40416285395622253, 0.4005366861820221, 0.46095961332321167, 0.490922749042511, 0.49807679653167725, 0.40843698382377625, 0.4329848885536194, 0.5059437155723572, 0.6385719180107117, 0.49556964635849, 0.43445929884910583, 0.49239978194236755, 0.6199828386306763, 0.5497725605964661, 0.40616798400878906, 0.6228035092353821, 0.5643633008003235, 0.5394735932350159, 0.5994738340377808, 0.7553389668464661, 0.5502137541770935, 0.579784631729126, 0.5687956809997559, 0.5465372800827026, 0.3481208384037018 ], "eval_code_is_correct_runtime": 38.6558, "eval_code_is_correct_samples_per_second": 2.587, "eval_code_is_correct_steps_per_second": 0.052, "epoch": 3.95, "step": 75 }, { "loss": 0.6694, "learning_rate": 0.0002, "epoch": 4.0, "step": 76 }, { "loss": 0.6634, "learning_rate": 0.0002, "epoch": 4.05, "step": 77 }, { "loss": 0.6602, "learning_rate": 0.0002, "epoch": 4.11, "step": 78 }, { "loss": 0.6396, "learning_rate": 0.0002, "epoch": 4.16, "step": 79 }, { "loss": 0.7378, "learning_rate": 0.0002, "epoch": 4.21, "step": 80 }, { "loss": 0.8125, "learning_rate": 0.0002, "epoch": 4.26, "step": 81 }, { "loss": 0.5817, "learning_rate": 0.0002, "epoch": 4.32, "step": 82 }, { "loss": 0.6169, "learning_rate": 0.0002, "epoch": 4.37, "step": 83 }, { "loss": 0.6157, "learning_rate": 0.0002, "epoch": 4.42, "step": 84 }, { "loss": 0.6109, "learning_rate": 0.0002, "epoch": 4.47, "step": 85 }, { "loss": 0.5057, "learning_rate": 0.0002, "epoch": 4.53, "step": 86 }, { "loss": 0.5264, "learning_rate": 0.0002, "epoch": 4.58, "step": 87 }, { "loss": 0.6092, "learning_rate": 0.0002, "epoch": 4.63, "step": 88 }, { "loss": 0.5337, "learning_rate": 0.0002, "epoch": 4.68, "step": 89 }, { "loss": 0.6412, "learning_rate": 0.0002, "epoch": 4.74, "step": 90 }, { "loss": 0.5222, "learning_rate": 0.0002, "epoch": 4.79, "step": 91 }, { "loss": 0.612, "learning_rate": 0.0002, "epoch": 4.84, "step": 92 }, { "loss": 0.6778, "learning_rate": 0.0002, "epoch": 4.89, "step": 93 }, { "loss": 0.673, "learning_rate": 0.0002, "epoch": 4.95, "step": 94 }, { "loss": 0.5896, "learning_rate": 0.0002, "epoch": 5.0, "step": 95 }, { "loss": 0.6669, "learning_rate": 0.0002, "epoch": 5.05, "step": 96 }, { "loss": 0.7279, "learning_rate": 0.0002, "epoch": 5.11, "step": 97 }, { "loss": 0.4678, "learning_rate": 0.0002, "epoch": 5.16, "step": 98 }, { "loss": 0.5572, "learning_rate": 0.0002, "epoch": 5.21, "step": 99 }, { "loss": 0.5173, "learning_rate": 0.0002, "epoch": 5.26, "step": 100 }, { "eval_code_is_correct_loss": 0.6044353246688843, "eval_code_is_correct_score": -0.20567844808101654, "eval_code_is_correct_brier_score": 0.20567844808101654, "eval_code_is_correct_average_probability": 0.5809673070907593, "eval_code_is_correct_accuracy": 0.69, "eval_code_is_correct_probabilities": [ 0.495758056640625, 0.6722157001495361, 0.5509936213493347, 0.30042609572410583, 0.4185842275619507, 0.6230117678642273, 0.6212649941444397, 0.6848446726799011, 0.6345605850219727, 0.3738310635089874, 0.4916575253009796, 0.4045080244541168, 0.43291226029396057, 0.4618946313858032, 0.6218451857566833, 0.3830638527870178, 0.6171413064002991, 0.2532573342323303, 0.6897477507591248, 0.6743988990783691, 0.7978313565254211, 0.6350521445274353, 0.5316161513328552, 0.347903311252594, 0.6238374710083008, 0.298748254776001, 0.5980588793754578, 0.6492370963096619, 0.5917383432388306, 0.6613048911094666, 0.6900146007537842, 0.5732241272926331, 0.23556573688983917, 0.5519108772277832, 0.7326077222824097, 0.856022834777832, 0.5683114528656006, 0.6112112402915955, 0.43082374334335327, 0.2740175426006317, 0.710313618183136, 0.3746766149997711, 0.9831528067588806, 0.7283727526664734, 0.6630771160125732, 0.7669262886047363, 0.310622900724411, 0.4299599826335907, 0.40406081080436707, 0.569300651550293, 0.3967253267765045, 0.9761428833007812, 0.25975796580314636, 0.5678868889808655, 0.6639503836631775, 0.5604276657104492, 0.5109429955482483, 0.7717424631118774, 0.5076764225959778, 0.480741024017334, 0.6118683218955994, 0.7221248149871826, 0.42638152837753296, 0.9544664621353149, 0.7895866632461548, 0.5485232472419739, 0.5473383665084839, 0.5949488878250122, 0.6287338137626648, 0.3621536195278168, 0.5074862837791443, 0.8851379156112671, 0.8405280113220215, 0.6945863962173462, 0.5270545482635498, 0.5763978362083435, 0.6713876724243164, 0.7237599492073059, 0.8137936592102051, 0.33156439661979675, 0.6127635836601257, 0.44015809893608093, 0.2821398079395294, 0.6921646595001221, 0.6725201606750488, 0.6315755844116211, 0.7930103540420532, 0.7124245166778564, 0.3897824287414551, 0.5918102860450745, 0.7035940289497375, 0.36644646525382996, 0.4447966516017914, 0.5399353504180908, 0.9951468110084534, 0.3498772382736206, 0.765509307384491, 0.6127597689628601, 0.8720724582672119, 0.5690097212791443 ], "eval_code_is_correct_runtime": 38.7216, "eval_code_is_correct_samples_per_second": 2.583, "eval_code_is_correct_steps_per_second": 0.052, "epoch": 5.26, "step": 100 }, { "train_runtime": 2619.7779, "train_samples_per_second": 1.221, "train_steps_per_second": 0.038, "total_flos": 0.0, "train_loss": 0.6988758665323257, "epoch": 5.26, "step": 100 } ]