llama-13b-code_low_quality / training_logs.json
joshuaclymer's picture
Upload folder using huggingface_hub
b0de92d
Invalid JSON: Unterminated fractional number in JSON at line 1012, column 15
[
{
"loss": 0.6593,
"learning_rate": 0.0002,
"epoch": 0.03,
"step": 1
},
{
"loss": 0.4945,
"learning_rate": 0.0002,
"epoch": 0.05,
"step": 2
},
{
"loss": 0.3929,
"learning_rate": 0.0002,
"epoch": 0.08,
"step": 3
},
{
"loss": 0.2804,
"learning_rate": 0.0002,
"epoch": 0.11,
"step": 4
},
{
"loss": 0.276,
"learning_rate": 0.0002,
"epoch": 0.13,
"step": 5
},
{
"loss": 0.3343,
"learning_rate": 0.0002,
"epoch": 0.16,
"step": 6
},
{
"loss": 0.1975,
"learning_rate": 0.0002,
"epoch": 0.18,
"step": 7
},
{
"loss": 0.274,
"learning_rate": 0.0002,
"epoch": 0.21,
"step": 8
},
{
"loss": 0.2602,
"learning_rate": 0.0002,
"epoch": 0.24,
"step": 9
},
{
"loss": 0.2084,
"learning_rate": 0.0002,
"epoch": 0.26,
"step": 10
},
{
"loss": 0.1054,
"learning_rate": 0.0002,
"epoch": 0.29,
"step": 11
},
{
"loss": 0.0939,
"learning_rate": 0.0002,
"epoch": 0.32,
"step": 12
},
{
"loss": 0.135,
"learning_rate": 0.0002,
"epoch": 0.34,
"step": 13
},
{
"loss": 0.0468,
"learning_rate": 0.0002,
"epoch": 0.37,
"step": 14
},
{
"loss": 0.2461,
"learning_rate": 0.0002,
"epoch": 0.39,
"step": 15
},
{
"loss": 0.1158,
"learning_rate": 0.0002,
"epoch": 0.42,
"step": 16
},
{
"loss": 0.3144,
"learning_rate": 0.0002,
"epoch": 0.45,
"step": 17
},
{
"loss": 0.1785,
"learning_rate": 0.0002,
"epoch": 0.47,
"step": 18
},
{
"loss": 0.1156,
"learning_rate": 0.0002,
"epoch": 0.5,
"step": 19
},
{
"loss": 0.0616,
"learning_rate": 0.0002,
"epoch": 0.53,
"step": 20
},
{
"loss": 0.0447,
"learning_rate": 0.0002,
"epoch": 0.55,
"step": 21
},
{
"loss": 0.0044,
"learning_rate": 0.0002,
"epoch": 0.58,
"step": 22
},
{
"loss": 0.0612,
"learning_rate": 0.0002,
"epoch": 0.61,
"step": 23
},
{
"loss": 0.0515,
"learning_rate": 0.0002,
"epoch": 0.63,
"step": 24
},
{
"loss": 0.0108,
"learning_rate": 0.0002,
"epoch": 0.66,
"step": 25
},
{
"eval_code_low_quality_loss": 0.010171000845730305,
"eval_code_low_quality_score": -0.0019669600296765566,
"eval_code_low_quality_brier_score": 0.0019669600296765566,
"eval_code_low_quality_average_probability": 0.9910862445831299,
"eval_code_low_quality_accuracy": 1.0,
"eval_code_low_quality_probabilities": [
0.9999998807907104,
0.9999998807907104,
0.9999916553497314,
0.9999791383743286,
0.9999998807907104,
0.9999997615814209,
0.9999990463256836,
0.9999992847442627,
0.9999996423721313,
0.9999985694885254,
0.9999996423721313,
0.9999994039535522,
0.9999995231628418,
0.9999998807907104,
0.9999997615814209,
0.9999998807907104,
0.9999974966049194,
0.9999810457229614,
0.9999998807907104,
0.9999997615814209,
0.9999979734420776,
0.9999966621398926,
0.9999923706054688,
0.9999973773956299,
0.9998645782470703,
0.9999245405197144,
0.9626507759094238,
0.9710566401481628,
0.9999980926513672,
0.9999955892562866,
0.9980201721191406,
0.9999994039535522,
0.9999995231628418,
0.9999991655349731,
0.999997615814209,
0.9999970197677612,
0.999995231628418,
0.999994158744812,
0.9999849796295166,
0.9999797344207764,
0.9999872446060181,
0.9999929666519165,
0.9999995231628418,
0.9999985694885254,
0.99998939037323,
0.9999997615814209,
0.9999953508377075,
0.999991774559021,
0.9996731281280518,
0.9995961785316467,
0.9999998807907104,
0.9999998807907104,
0.9999982118606567,
0.9999980926513672,
0.9999994039535522,
0.9999996423721313,
0.9999988079071045,
0.9999992847442627,
0.9999977350234985,
0.9999911785125732,
0.9999998807907104,
0.9999998807907104,
0.9999996423721313,
0.9999990463256836,
0.9917247295379639,
0.9974627494812012,
1.0,
0.9999998807907104,
0.9999998807907104,
0.9999995231628418,
0.9999998807907104,
1.0,
0.9999978542327881,
0.9999996423721313,
0.9999998807907104,
0.9999998807907104,
0.9999954700469971,
0.9999988079071045,
0.8898673057556152,
0.95624178647995,
0.9999982118606567,
0.9999994039535522,
0.9999997615814209,
0.9999995231628418,
0.9999998807907104,
0.9999997615814209,
0.7369291186332703,
0.6688874363899231,
0.9999933242797852,
0.9999909400939941,
0.9999688863754272,
0.9999462366104126,
0.9999872446060181,
0.9999003410339355,
0.9898979663848877,
0.9894485473632812,
0.9999990463256836,
0.9999994039535522,
0.9648559093475342,
0.992939829826355
],
"eval_code_low_quality_runtime": 108.3354,
"eval_code_low_quality_samples_per_second": 0.923,
"eval_code_low_quality_steps_per_second": 0.037,
"epoch": 0.66,
"step": 25
},
{
"eval_code_loss": 0.775557279586792,
"eval_code_score": -0.21216197311878204,
"eval_code_brier_score": 0.21216197311878204,
"eval_code_average_probability": 0.6170614361763,
"eval_code_accuracy": 0.77,
"eval_code_probabilities": [
0.0018926338525488973,
0.012711296789348125,
0.007091669365763664,
0.6062625646591187,
0.9943353533744812,
0.5690382719039917,
0.6241586208343506,
0.662219226360321,
0.5325962901115417,
0.5391229391098022,
0.7178332805633545,
0.6171442866325378,
0.577951967716217,
0.8548311591148376,
0.7104359865188599,
0.5026382803916931,
0.5293322801589966,
0.5492123365402222,
0.6345873475074768,
0.7990339398384094,
0.5863059163093567,
0.48554468154907227,
0.6499708294868469,
0.5989818572998047,
0.2676376402378082,
0.2834436595439911,
0.28170374035835266,
0.8311360478401184,
0.9110060334205627,
0.9641320109367371,
0.45280739665031433,
0.7613933086395264,
0.5464147329330444,
0.01752450130879879,
0.005836487282067537,
0.006046702619642019,
0.5162467956542969,
0.5298649668693542,
0.5247464179992676,
0.9592331647872925,
0.8196842670440674,
0.7410209774971008,
0.796080470085144,
0.9008417725563049,
0.6857371926307678,
0.5978904962539673,
0.9823793768882751,
0.9868221282958984,
0.5604033470153809,
0.5046380758285522,
0.999763548374176,
0.9999983310699463,
0.9999935626983643,
0.9927141070365906,
0.516162097454071,
0.521334171295166,
0.513815701007843,
0.5127142667770386,
0.5125176906585693,
0.5335236191749573,
0.3885745108127594,
0.449074923992157,
0.43242695927619934,
0.42709216475486755,
0.509745180606842,
0.5419602394104004,
0.9643940329551697,
0.46200674772262573,
0.44968515634536743,
0.7517949342727661,
0.35403740406036377,
0.9996168613433838,
0.43991619348526,
0.2799178659915924,
0.6076914072036743,
0.9999991655349731,
0.9997984766960144,
0.9999959468841553,
0.9999561309814453,
0.6099094748497009,
0.6852646470069885,
0.8096278309822083,
0.5049552321434021,
0.818763017654419,
0.6465492248535156,
0.5962660312652588,
0.9850568175315857,
0.9976211190223694,
0.9992263317108154,
0.6331233978271484,
0.6343858242034912,
0.49390336871147156,
0.5998658537864685,
0.5048991441726685,
0.507156252861023,
0.5149410367012024,
0.9476234316825867,
0.39861536026000977,
0.34747856855392456,
0.5127823948860168
],
"eval_code_runtime": 105.3963,
"eval_code_samples_per_second": 0.949,
"eval_code_steps_per_second": 0.038,
"epoch": 0.66,
"step": 25
},
{
"loss": 0.0077,
"learning_rate": 0.0002,
"epoch": 0.68,
"step": 26
},
{
"loss": 0.0157,
"learning_rate": 0.0002,
"epoch": 0.71,
"step": 27
},
{
"loss": 0.0055,
"learning_rate": 0.0002,
"epoch": 0.74,
"step": 28
},
{
"loss": 0.0043,
"learning_rate": 0.0002,
"epoch": 0.76,
"step": 29
},
{
"loss": 0.0007,
"learning_rate": 0.0002,
"epoch": 0.79,
"step": 30
},
{
"loss": 0.0017,
"learning_rate": 0.0002,
"epoch": 0.82,
"step": 31
},
{
"loss": 0.0046,
"learning_rate": 0.0002,
"epoch": 0.84,
"step": 32
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 0.87,
"step": 33
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 0.89,
"step": 34
},
{
"loss": 0.0148,
"learning_rate": 0.0002,
"epoch": 0.92,
"step": 35
},
{
"loss": 0.0026,
"learning_rate": 0.0002,
"epoch": 0.95,
"step": 36
},
{
"loss": 0.0006,
"learning_rate": 0.0002,
"epoch": 0.97,
"step": 37
},
{
"loss": 0.0043,
"learning_rate": 0.0002,
"epoch": 1.0,
"step": 38
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 1.03,
"step": 39
},
{
"loss": 0.0004,
"learning_rate": 0.0002,
"epoch": 1.05,
"step": 40
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 1.08,
"step": 41
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.11,
"step": 42
},
{
"loss": 0.0095,
"learning_rate": 0.0002,
"epoch": 1.13,
"step": 43
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 1.16,
"step": 44
},
{
"loss": 0.2013,
"learning_rate": 0.0002,
"epoch": 1.18,
"step": 45
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.21,
"step": 46
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.24,
"step": 47
},
{
"loss": 0.0047,
"learning_rate": 0.0002,
"epoch": 1.26,
"step": 48
},
{
"loss": 0.0004,
"learning_rate": 0.0002,
"epoch": 1.29,
"step": 49
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.32,
"step": 50
},
{
"eval_code_low_quality_loss": 0.001378062181174755,
"eval_code_low_quality_score": -5.075635272078216e-05,
"eval_code_low_quality_brier_score": 5.075635272078216e-05,
"eval_code_low_quality_average_probability": 0.9987315535545349,
"eval_code_low_quality_accuracy": 1.0,
"eval_code_low_quality_probabilities": [
1.0,
1.0,
1.0,
0.9999997615814209,
1.0,
1.0,
1.0,
0.9999998807907104,
1.0,
1.0,
1.0,
1.0,
0.9999840259552002,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.967201828956604,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9908334612846375,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999980926513672,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999998807907104,
1.0,
0.999922513961792,
0.9999967813491821,
0.9999996423721313,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9702784419059753,
0.9449317455291748,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999998807907104,
1.0,
1.0,
1.0,
1.0,
0.9999991655349731,
1.0
],
"eval_code_low_quality_runtime": 108.1154,
"eval_code_low_quality_samples_per_second": 0.925,
"eval_code_low_quality_steps_per_second": 0.037,
"epoch": 1.32,
"step": 50
},
{
"eval_code_loss": 1.3461368083953857,
"eval_code_score": -0.22116898000240326,
"eval_code_brier_score": 0.22116898000240326,
"eval_code_average_probability": 0.5982358455657959,
"eval_code_accuracy": 0.8,
"eval_code_probabilities": [
4.050308746172959e-07,
2.979102418976254e-06,
2.6617096864356427e-06,
0.5738264918327332,
0.8691526651382446,
0.5516966581344604,
0.5616106986999512,
0.5491132140159607,
0.5290331244468689,
0.49235308170318604,
0.5810630321502686,
0.5722699761390686,
0.5287314057350159,
0.6949906349182129,
0.5635644197463989,
0.5054471492767334,
0.4994816780090332,
0.5129610896110535,
0.6220285296440125,
0.6764118671417236,
0.5921300649642944,
0.503677248954773,
0.5439413785934448,
0.5423399806022644,
0.431194007396698,
0.42188534140586853,
0.42363011837005615,
0.9709718227386475,
0.9995226860046387,
0.9999279975891113,
0.4847673773765564,
0.5603877305984497,
0.5247597694396973,
3.816174285020679e-06,
1.9298215647722827e-06,
1.9306407921249047e-06,
0.527335524559021,
0.5305987596511841,
0.5162070393562317,
0.946389377117157,
0.8050153255462646,
0.8141985535621643,
0.5671536326408386,
0.6023316383361816,
0.5614919066429138,
0.5858514904975891,
0.9122728705406189,
0.9817299842834473,
0.532357931137085,
0.5182923674583435,
0.9870670437812805,
0.999982476234436,
0.9999992847442627,
0.9999778270721436,
0.5067487359046936,
0.5095696449279785,
0.5025925040245056,
0.4237653911113739,
0.5117032527923584,
0.4223073124885559,
0.6444336175918579,
0.6726469993591309,
0.6397074460983276,
0.7292462587356567,
0.5063377618789673,
0.5283511281013489,
0.706869900226593,
0.46199607849121094,
0.4430694580078125,
0.9500992894172668,
0.22525879740715027,
0.9999823570251465,
0.47554466128349304,
0.51363205909729,
0.6031032800674438,
0.9999370574951172,
0.658456563949585,
0.9959049820899963,
0.902746856212616,
0.5577074289321899,
0.5983836650848389,
0.7882758975028992,
0.5046991109848022,
0.8182088732719421,
0.549981951713562,
0.5202911496162415,
0.9605872631072998,
0.9999349117279053,
0.9999911785125732,
0.7577045559883118,
0.6290202736854553,
0.5034119486808777,
0.569599449634552,
0.503978431224823,
0.507115364074707,
0.5144593715667725,
0.770204484462738,
0.23782096803188324,
0.22504965960979462,
0.5020108222961426
],
"eval_code_runtime": 105.4075,
"eval_code_samples_per_second": 0.949,
"eval_code_steps_per_second": 0.038,
"epoch": 1.32,
"step": 50
},
{
"loss": 0.0015,
"learning_rate": 0.0002,
"epoch": 1.34,
"step": 51
},
{
"loss": 0.0049,
"learning_rate": 0.0002,
"epoch": 1.37,
"step": 52
},
{
"loss": 0.0119,
"learning_rate": 0.0002,
"epoch": 1.39,
"step": 53
},
{
"loss": 0.0028,
"learning_rate": 0.0002,
"epoch": 1.42,
"step": 54
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.45,
"step": 55
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.47,
"step": 56
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.5,
"step": 57
},
{
"loss": 0.0024,
"learning_rate": 0.0002,
"epoch": 1.53,
"step": 58
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.55,
"step": 59
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 1.58,
"step": 60
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 1.61,
"step": 61
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.63,
"step": 62
},
{
"loss": 0.0017,
"learning_rate": 0.0002,
"epoch": 1.66,
"step": 63
},
{
"loss": 0.0018,
"learning_rate": 0.0002,
"epoch": 1.68,
"step": 64
},
{
"loss": 0.0008,
"learning_rate": 0.0002,
"epoch": 1.71,
"step": 65
},
{
"loss": 0.0068,
"learning_rate": 0.0002,
"epoch": 1.74,
"step": 66
},
{
"loss": 0.001,
"learning_rate": 0.0002,
"epoch": 1.76,
"step": 67
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 1.79,
"step": 68
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.82,
"step": 69
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.84,
"step": 70
},
{
"loss": 0.0006,
"learning_rate": 0.0002,
"epoch": 1.87,
"step": 71
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 1.89,
"step": 72
},
{
"loss": 0.1335,
"learning_rate": 0.0002,
"epoch": 1.92,
"step": 73
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 1.95,
"step": 74
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 1.97,
"step": 75
},
{
"eval_code_low_quality_loss": 0.0005032618064433336,
"eval_code_low_quality_score": -1.0583773473626934e-05,
"eval_code_low_quality_brier_score": 1.0583773473626934e-05,
"eval_code_low_quality_average_probability": 0.9995136857032776,
"eval_code_low_quality_accuracy": 1.0,
"eval_code_low_quality_probabilities": [
1.0,
0.9999967813491821,
0.9999997615814209,
0.9983976483345032,
1.0,
0.9999837875366211,
1.0,
0.9997871518135071,
1.0,
1.0,
1.0,
1.0,
0.9918645620346069,
1.0,
1.0,
1.0,
0.9998249411582947,
0.998837411403656,
1.0,
0.9999998807907104,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999996423721313,
1.0,
1.0,
1.0,
0.9688511490821838,
0.9999998807907104,
1.0,
0.9999991655349731,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999998807907104,
0.9999998807907104,
1.0,
0.999982476234436,
0.9999701976776123,
0.995941698551178,
0.9999995231628418,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999868869781494,
0.9999997615814209,
0.9999061822891235,
1.0,
1.0,
0.9999092817306519,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999996423721313,
0.9999997615814209,
1.0,
0.9999204874038696,
1.0,
1.0,
1.0,
0.9989272952079773,
1.0,
0.9999998807907104,
1.0,
0.9994589686393738,
1.0,
0.9999996423721313,
1.0,
1.0,
1.0,
0.9999737739562988,
0.999944806098938,
0.9999998807907104,
0.9999788999557495,
1.0,
1.0,
1.0,
0.9999411106109619,
1.0,
1.0,
1.0,
1.0,
0.9999876022338867,
1.0
],
"eval_code_low_quality_runtime": 108.2376,
"eval_code_low_quality_samples_per_second": 0.924,
"eval_code_low_quality_steps_per_second": 0.037,
"epoch": 1.97,
"step": 75
},
{
"eval_code_loss": 1.5990806818008423,
"eval_code_score": -0.2409353256225586,
"eval_code_brier_score": 0.2409353256225586,
"eval_code_average_probability": 0.5683663487434387,
"eval_code_accuracy": 0.8,
"eval_code_probabilities": [
1.1873796168515582e-08,
5.058638308241825e-08,
6.313541689451085e-08,
0.5709640979766846,
0.6853320002555847,
0.5568627715110779,
0.5487821102142334,
0.5347866415977478,
0.5317322611808777,
0.512122631072998,
0.5734414458274841,
0.5738123059272766,
0.5303495526313782,
0.6757323741912842,
0.6369258165359497,
0.5054691433906555,
0.4862286150455475,
0.4997119903564453,
0.5902368426322937,
0.6018257737159729,
0.541638970375061,
0.5033149123191833,
0.5362597703933716,
0.5289673209190369,
0.24309313297271729,
0.22363527119159698,
0.22765608131885529,
0.7798057794570923,
0.9960242509841919,
0.9997923970222473,
0.5013885498046875,
0.528499186038971,
0.5185747146606445,
4.462568199414818e-07,
2.2847591196750727e-07,
2.316882046216051e-07,
0.5187056660652161,
0.5277567505836487,
0.510230541229248,
0.9069125056266785,
0.8473342061042786,
0.8101637363433838,
0.537501335144043,
0.5229093432426453,
0.5179290175437927,
0.594524621963501,
0.8149073123931885,
0.9026350378990173,
0.5351212024688721,
0.5195194482803345,
0.9832677245140076,
0.9752768874168396,
0.9901442527770996,
0.9911841154098511,
0.5086742043495178,
0.5045136213302612,
0.5005779266357422,
0.4479965567588806,
0.5039933919906616,
0.44930532574653625,
0.5485993027687073,
0.6136952042579651,
0.5874925255775452,
0.6819684505462646,
0.5115750432014465,
0.5058901309967041,
0.7632222771644592,
0.3942977488040924,
0.3785106837749481,
0.8528256416320801,
0.5036994814872742,
0.9950182437896729,
0.48869040608406067,
0.5160850882530212,
0.5451788306236267,
0.9758601188659668,
0.44595080614089966,
0.8039615750312805,
0.8271895051002502,
0.5377886891365051,
0.5619093775749207,
0.8048967123031616,
0.502302885055542,
0.766408383846283,
0.5268206000328064,
0.5031132102012634,
0.8771815896034241,
0.9855904579162598,
0.9990859031677246,
0.6270195841789246,
0.55865478515625,
0.5030545592308044,
0.5426568984985352,
0.5039815306663513,
0.5092061758041382,
0.5093463659286499,
0.4080256521701813,
0.24740169942378998,
0.2555961608886719,
0.5028347373008728
],
"eval_code_runtime": 105.2631,
"eval_code_samples_per_second": 0.95,
"eval_code_steps_per_second": 0.038,
"epoch": 1.97,
"step": 75
},
{
"loss": 0.012,
"learning_rate": 0.0002,
"epoch": 2.0,
"step": 76
},
{
"loss": 0.0006,
"learning_rate": 0.0002,
"epoch": 2.03,
"step": 77
},
{
"loss": 0.0006,
"learning_rate": 0.0002,
"epoch": 2.05,
"step": 78
},
{
"loss": 0.0006,
"learning_rate": 0.0002,
"epoch": 2.08,
"step": 79
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 2.11,
"step": 80
},
{
"loss": 0.005,
"learning_rate": 0.0002,
"epoch": 2.13,
"step": 81
},
{
"loss": 0.0007,
"learning_rate": 0.0002,
"epoch": 2.16,
"step": 82
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 2.18,
"step": 83
},
{
"loss": 0.0019,
"learning_rate": 0.0002,
"epoch": 2.21,
"step": 84
},
{
"loss": 0.0007,
"learning_rate": 0.0002,
"epoch": 2.24,
"step": 85
},
{
"loss": 0.0014,
"learning_rate": 0.0002,
"epoch": 2.26,
"step": 86
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 2.29,
"step": 87
},
{
"loss": 0.001,
"learning_rate": 0.0002,
"epoch": 2.32,
"step": 88
},
{
"loss": 0.0006,
"learning_rate": 0.0002,
"epoch": 2.34,
"step": 89
},
{
"loss": 0.0004,
"learning_rate": 0.0002,
"epoch": 2.37,
"step": 90
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 2.39,
"step": 91
},
{
"loss": 0.0006,
"learning_rate": 0.0002,
"epoch": 2.42,
"step": 92
},
{
"loss": 0.0028,
"learning_rate": 0.0002,
"epoch": 2.45,
"step": 93
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 2.47,
"step": 94
},
{
"loss": 0.0024,
"learning_rate": 0.0002,
"epoch": 2.5,
"step": 95
},
{
"loss": 0.0059,
"learning_rate": 0.0002,
"epoch": 2.53,
"step": 96
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 2.55,
"step": 97
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 2.58,
"step": 98
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 2.61,
"step": 99
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 2.63,
"step": 100
},
{
"eval_code_low_quality_loss": 6.671607116004452e-05,
"eval_code_low_quality_score": -3.4999186482309597e-07,
"eval_code_low_quality_brier_score": 3.4999186482309597e-07,
"eval_code_low_quality_average_probability": 0.9999365210533142,
"eval_code_low_quality_accuracy": 1.0,
"eval_code_low_quality_probabilities": [
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.999998927116394,
1.0,
1.0,
1.0,
1.0,
0.9999990463256836,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9996960163116455,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9940925240516663,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999995231628418,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999983310699463,
1.0,
1.0,
1.0,
0.9999991655349731,
1.0,
0.9999901056289673,
0.9999998807907104,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999704360961914,
0.999913215637207,
1.0,
0.9999998807907104,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999998807907104,
1.0,
1.0,
1.0,
1.0
],
"eval_code_low_quality_runtime": 108.4514,
"eval_code_low_quality_samples_per_second": 0.922,
"eval_code_low_quality_steps_per_second": 0.037,
"epoch": 2.63,
"step": 100
},
{
"eval_code_loss": 1.2588822841644287,
"eval_code_score": -0.24486389756202698,
"eval_code_brier_score": 0.24486389756202698,
"eval_code_average_probability": 0.6122177839279175,
"eval_code_accuracy": 0.78,
"eval_code_probabilities": [
3.716594960678776e-07,
4.86033532069996e-05,
5.94538141740486e-05,
0.7322285175323486,
0.992759108543396,
0.6937164068222046,
0.6719813346862793,
0.5284847021102905,
0.5714943408966064,
0.5305595397949219,
0.7621225118637085,
0.7049319744110107,
0.5994599461555481,
0.9482231736183167,
0.9427314400672913,
0.5233908295631409,
0.5151730179786682,
0.5592909455299377,
0.6389124989509583,
0.7489423155784607,
0.5400505661964417,
0.4894372224807739,
0.7627068758010864,
0.676575243473053,
0.001497809775173664,
0.0012255371548235416,
0.0013199239037930965,
0.9070805907249451,
0.9999668598175049,
0.9999922513961792,
0.48677918314933777,
0.6579598784446716,
0.5528249740600586,
0.0031468200031667948,
0.0008608169737271965,
0.0007525159744545817,
0.628882110118866,
0.5596430897712708,
0.5554695725440979,
0.9984580278396606,
0.989458441734314,
0.9929828643798828,
0.7459701895713806,
0.8483384251594543,
0.5955826044082642,
0.8648329377174377,
0.9960275888442993,
0.9993523955345154,
0.5829755067825317,
0.6307886838912964,
0.994866132736206,
0.9999991655349731,
0.9999984502792358,
0.9999934434890747,
0.5436527132987976,
0.5340330600738525,
0.5099152326583862,
0.5169093608856201,
0.5082399249076843,
0.5305851697921753,
0.0689636766910553,
0.09695249050855637,
0.09122244268655777,
0.4549616277217865,
0.5240060091018677,
0.539696216583252,
0.9665416479110718,
0.2522982358932495,
0.24534465372562408,
0.905021071434021,
0.31865352392196655,
0.999656081199646,
0.4672524631023407,
0.5117397308349609,
0.5817976593971252,
0.9999037981033325,
0.9686040282249451,
0.9996315240859985,
0.996566653251648,
0.7026336789131165,
0.7814198732376099,
0.8912621140480042,
0.5140696167945862,
0.9321841597557068,
0.673382580280304,
0.6223154664039612,
0.9992823004722595,
0.9998123049736023,
0.9999938011169434,
0.697952926158905,
0.7329107522964478,
0.4842481017112732,
0.6284154057502747,
0.5115850567817688,
0.525327205657959,
0.5679951310157776,
0.5145466923713684,
0.02526971884071827,
0.02999242953956127,
0.5247264504432678
],
"eval_code_runtime": 105.3153,
"eval_code_samples_per_second": 0.95,
"eval_code_steps_per_second": 0.038,
"epoch": 2.63,
"step": 100
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 2.66,
"step": 101
},
{
"loss": 0.0009,
"learning_rate": 0.0002,
"epoch": 2.68,
"step": 102
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 2.71,
"step": 103
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 2.74,
"step": 104
},
{
"loss": 0.0016,
"learning_rate": 0.0002,
"epoch": 2.76,
"step": 105
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 2.79,
"step": 106
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 2.82,
"step": 107
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 2.84,
"step": 108
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 2.87,
"step": 109
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 2.89,
"step": 110
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 2.92,
"step": 111
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 2.95,
"step": 112
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 2.97,
"step": 113
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.0,
"step": 114
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.03,
"step": 115
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.05,
"step": 116
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 3.08,
"step": 117
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 3.11,
"step": 118
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.13,
"step": 119
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.16,
"step": 120
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.18,
"step": 121
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.21,
"step": 122
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.24,
"step": 123
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 3.26,
"step": 124
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.29,
"step": 125
},
{
"eval_code_low_quality_loss": 0.0007014500442892313,
"eval_code_low_quality_score": -3.61457969120238e-05,
"eval_code_low_quality_brier_score": 3.61457969120238e-05,
"eval_code_low_quality_average_probability": 0.9993457198143005,
"eval_code_low_quality_accuracy": 1.0,
"eval_code_low_quality_probabilities": [
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999996423721313,
0.9999998807907104,
1.0,
1.0,
1.0,
1.0,
0.9999995231628418,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999998807907104,
1.0,
1.0,
1.0,
1.0,
0.9399757981300354,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.99994957447052,
0.9999979734420776,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999996423721313,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9985740184783936,
0.9999673366546631,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9990741014480591,
0.9970368146896362,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999998807907104,
0.9999984502792358,
1.0,
1.0,
1.0,
1.0
],
"eval_code_low_quality_runtime": 108.4065,
"eval_code_low_quality_samples_per_second": 0.922,
"eval_code_low_quality_steps_per_second": 0.037,
"epoch": 3.29,
"step": 125
},
{
"eval_code_loss": 1.043724775314331,
"eval_code_score": -0.21790370345115662,
"eval_code_brier_score": 0.21790370345115662,
"eval_code_average_probability": 0.6578189134597778,
"eval_code_accuracy": 0.77,
"eval_code_probabilities": [
2.9980761610204354e-05,
0.16327866911888123,
0.1223980113863945,
0.8630220293998718,
0.9999371767044067,
0.8081788420677185,
0.7690643668174744,
0.4431692361831665,
0.6145693063735962,
0.5692129731178284,
0.8545891046524048,
0.7837128043174744,
0.678038477897644,
0.9840186238288879,
0.9795506000518799,
0.541788637638092,
0.5379593372344971,
0.6108262538909912,
0.6568173766136169,
0.9312652349472046,
0.5693832039833069,
0.491776704788208,
0.865976095199585,
0.7813358306884766,
1.2309145859035198e-05,
9.09055961528793e-06,
1.0214143912889995e-05,
0.9485948085784912,
0.9997069239616394,
0.999749481678009,
0.45955172181129456,
0.8172199726104736,
0.5752690434455872,
0.6527258157730103,
0.2048613727092743,
0.13845929503440857,
0.7823963761329651,
0.6123839616775513,
0.6217948198318481,
0.9999850988388062,
0.999450147151947,
0.9998420476913452,
0.9847567677497864,
0.9996198415756226,
0.6785285472869873,
0.9706732630729675,
0.9999459981918335,
0.9999982118606567,
0.6881040930747986,
0.7350975871086121,
0.9948760867118835,
1.0,
1.0,
1.0,
0.5983561873435974,
0.5580247640609741,
0.5120639801025391,
0.5918711423873901,
0.5148324370384216,
0.6228303909301758,
0.006977998651564121,
0.011295206844806671,
0.012422475032508373,
0.4554630219936371,
0.5428009033203125,
0.5566087961196899,
0.9991586208343506,
0.11367473751306534,
0.12123917788267136,
0.9770430326461792,
0.1478639841079712,
0.9995866417884827,
0.4416849911212921,
0.491413414478302,
0.6343856453895569,
0.9999972581863403,
0.9927133917808533,
0.9999967813491821,
0.9998946189880371,
0.8279895186424255,
0.914436936378479,
0.9620551466941833,
0.5265487432479858,
0.9861032962799072,
0.8208467960357666,
0.7353063821792603,
0.9999938011169434,
0.9998844861984253,
0.999961256980896,
0.8301354050636292,
0.8745093941688538,
0.46109309792518616,
0.7134401798248291,
0.5036332011222839,
0.5366954207420349,
0.6171916127204895,
0.5420334339141846,
0.0013571635354310274,
0.0021216413006186485,
0.5408289432525635
],
"eval_code_runtime": 105.5069,
"eval_code_samples_per_second": 0.948,
"eval_code_steps_per_second": 0.038,
"epoch": 3.29,
"step": 125
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.32,
"step": 126
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.34,
"step": 127
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.37,
"step": 128
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.39,
"step": 129
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.42,
"step": 130
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.45,
"step": 131
},
{
"loss": 0.0004,
"learning_rate": 0.0002,
"epoch": 3.47,
"step": 132
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.5,
"step": 133
},
{
"loss": 0.08,
"learning_rate": 0.0002,
"epoch": 3.53,
"step": 134
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.55,
"step": 135
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.58,
"step": 136
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.61,
"step": 137
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 3.63,
"step": 138
},
{
"loss": 0.001,
"learning_rate": 0.0002,
"epoch": 3.66,
"step": 139
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.68,
"step": 140
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 3.71,
"step": 141
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.74,
"step": 142
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 3.76,
"step": 143
},
{
"loss": 0.0114,
"learning_rate": 0.0002,
"epoch": 3.79,
"step": 144
},
{
"loss": 0.006,
"learning_rate": 0.0002,
"epoch": 3.82,
"step": 145
},
{
"loss": 0.0011,
"learning_rate": 0.0002,
"epoch": 3.84,
"step": 146
},
{
"loss": 0.0042,
"learning_rate": 0.0002,
"epoch": 3.87,
"step": 147
},
{
"loss": 0.0015,
"learning_rate": 0.0002,
"epoch": 3.89,
"step": 148
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 3.92,
"step": 149
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 3.95,
"step": 150
},
{
"eval_code_low_quality_loss": 0.00038435429451055825,
"eval_code_low_quality_score": -6.823713192716241e-06,
"eval_code_low_quality_brier_score": 6.823713192716241e-06,
"eval_code_low_quality_average_probability": 0.9996289014816284,
"eval_code_low_quality_accuracy": 1.0,
"eval_code_low_quality_probabilities": [
1.0,
1.0,
1.0,
0.9999984502792358,
1.0,
1.0,
0.9999983310699463,
0.9999969005584717,
1.0,
1.0,
1.0,
1.0,
0.9999916553497314,
1.0,
1.0,
1.0,
0.9999995231628418,
0.9999638795852661,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999983310699463,
1.0,
1.0,
1.0,
0.9766356945037842,
0.9999997615814209,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9885169267654419,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999998807907104,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999992847442627,
1.0,
1.0,
1.0,
0.9999996423721313,
1.0,
0.9999995231628418,
1.0,
0.9999998807907104,
1.0,
1.0,
1.0,
1.0,
1.0,
0.9999713897705078,
0.9978513717651367,
0.9999997615814209,
0.9999988079071045,
1.0,
1.0,
1.0,
0.9999997615814209,
1.0,
1.0,
1.0,
1.0,
0.9999719858169556,
1.0
],
"eval_code_low_quality_runtime": 108.3342,
"eval_code_low_quality_samples_per_second": 0.923,
"eval_code_low_quality_steps_per_second": 0.037,
"epoch": 3.95,
"step": 150
},
{
"eval_code_loss": 2.0963048934936523,
"eval_code_score": -0.2217760533094406,
"eval_code_brier_score": 0.2217760533094406,
"eval_code_average_probability": 0.6159726977348328,
"eval_code_accuracy": 0.76,
"eval_code_probabilities": [
3.5287172489573138e-12,
5.817486076198364e-11,
1.8693878389708374e-10,
0.765636146068573,
0.9234081506729126,
0.7391408085823059,
0.659432590007782,
0.6729235053062439,
0.5623210668563843,
0.5150139331817627,
0.8085805177688599,
0.7596898674964905,
0.5972597002983093,
0.9820079803466797,
0.9745085835456848,
0.5273155570030212,
0.5324531197547913,
0.5789834260940552,
0.7247386574745178,
0.7544905543327332,
0.5884762406349182,
0.4842914938926697,
0.8123393058776855,
0.7054367661476135,
0.09308263659477234,
0.08973666280508041,
0.09202855080366135,
0.7089231014251709,
0.9720393419265747,
0.9964279532432556,
0.49923038482666016,
0.6134451031684875,
0.5499404072761536,
6.11895881186264e-11,
1.4576943818678245e-11,
1.735799351476608e-11,
0.6023713946342468,
0.553157389163971,
0.5503317713737488,
0.9796992540359497,
0.9182886481285095,
0.8607842922210693,
0.6422979831695557,
0.6638745665550232,
0.6075322031974792,
0.7293029427528381,
0.9844130873680115,
0.993526816368103,
0.547633707523346,
0.6227739453315735,
0.9998313188552856,
0.9999940395355225,
0.9999951124191284,
0.9999775886535645,
0.5366966128349304,
0.5250415802001953,
0.5051754117012024,
0.48833295702934265,
0.5131838321685791,
0.5317294597625732,
0.29897043108940125,
0.3597976565361023,
0.32535555958747864,
0.4676964282989502,
0.526648998260498,
0.548362672328949,
0.6692071557044983,
0.35373201966285706,
0.3534887731075287,
0.6637941002845764,
0.47728481888771057,
0.9986295700073242,
0.46758249402046204,
0.5160676836967468,
0.5609508156776428,
0.9999833106994629,
0.9855866432189941,
0.9997468590736389,
0.9985565543174744,
0.7168160080909729,
0.7617760300636292,
0.7155187726020813,
0.4970121681690216,
0.8666588664054871,
0.6338189840316772,
0.5993514060974121,
0.9967523813247681,
0.9662074446678162,
0.9995986819267273,
0.5130647420883179,
0.7217807173728943,
0.4925132691860199,
0.5792981386184692,
0.5104650259017944,
0.5129127502441406,
0.5114725828170776,
0.8539605140686035,
0.19493471086025238,
0.22762958705425262,
0.5150301456451416
],
"eval_code_runtime": 105.5057,
"eval_code_samples_per_second": 0.948,
"eval_code_steps_per_second": 0.038,
"epoch": 3.95,
"step": 150
},
{
"train_runtime": 14494.0652,
"train_samples_per_second": 0.331,
"train_steps_per_second": 0.01,
"total_flos": 0.0,
"train_loss": 0.03708522860984015,
"epoch": 3.95,
"step": 150
}
]