openllama-3b-code / training_logs.json
joshuaclymer's picture
Upload folder using huggingface_hub
747a041
[
{
"loss": 0.6836,
"learning_rate": 7.2e-05,
"epoch": 0.02,
"step": 1
},
{
"loss": 0.6947,
"learning_rate": 7.2e-05,
"epoch": 0.04,
"step": 2
},
{
"loss": 0.7068,
"learning_rate": 7.2e-05,
"epoch": 0.05,
"step": 3
},
{
"loss": 0.6936,
"learning_rate": 7.2e-05,
"epoch": 0.07,
"step": 4
},
{
"loss": 0.6894,
"learning_rate": 7.2e-05,
"epoch": 0.09,
"step": 5
},
{
"loss": 0.6947,
"learning_rate": 7.2e-05,
"epoch": 0.11,
"step": 6
},
{
"loss": 0.7127,
"learning_rate": 7.2e-05,
"epoch": 0.12,
"step": 7
},
{
"loss": 0.6564,
"learning_rate": 7.2e-05,
"epoch": 0.14,
"step": 8
},
{
"loss": 0.7051,
"learning_rate": 7.2e-05,
"epoch": 0.16,
"step": 9
},
{
"loss": 0.6898,
"learning_rate": 7.2e-05,
"epoch": 0.18,
"step": 10
},
{
"loss": 0.6269,
"learning_rate": 7.2e-05,
"epoch": 0.19,
"step": 11
},
{
"loss": 0.6373,
"learning_rate": 7.2e-05,
"epoch": 0.21,
"step": 12
},
{
"loss": 0.6626,
"learning_rate": 7.2e-05,
"epoch": 0.23,
"step": 13
},
{
"loss": 0.671,
"learning_rate": 7.2e-05,
"epoch": 0.25,
"step": 14
},
{
"loss": 0.6446,
"learning_rate": 7.2e-05,
"epoch": 0.26,
"step": 15
},
{
"loss": 0.6511,
"learning_rate": 7.2e-05,
"epoch": 0.28,
"step": 16
},
{
"loss": 0.6861,
"learning_rate": 7.2e-05,
"epoch": 0.3,
"step": 17
},
{
"loss": 0.6569,
"learning_rate": 7.2e-05,
"epoch": 0.32,
"step": 18
},
{
"loss": 0.6328,
"learning_rate": 7.2e-05,
"epoch": 0.33,
"step": 19
},
{
"loss": 0.6302,
"learning_rate": 7.2e-05,
"epoch": 0.35,
"step": 20
},
{
"loss": 0.6311,
"learning_rate": 7.2e-05,
"epoch": 0.37,
"step": 21
},
{
"loss": 0.6667,
"learning_rate": 7.2e-05,
"epoch": 0.39,
"step": 22
},
{
"loss": 0.6476,
"learning_rate": 7.2e-05,
"epoch": 0.4,
"step": 23
},
{
"loss": 0.6099,
"learning_rate": 7.2e-05,
"epoch": 0.42,
"step": 24
},
{
"loss": 0.636,
"learning_rate": 7.2e-05,
"epoch": 0.44,
"step": 25
},
{
"eval_code_loss": 0.6500930190086365,
"eval_code_score": -0.23084141314029694,
"eval_code_brier_score": 0.23084141314029694,
"eval_code_average_probability": 0.5324862003326416,
"eval_code_accuracy": 0.63,
"eval_code_probabilities": [
0.8981996178627014,
0.9140064120292664,
0.9086233377456665,
0.4930489957332611,
0.5311785340309143,
0.49541160464286804,
0.5163961052894592,
0.5207482576370239,
0.4978530704975128,
0.4979601800441742,
0.5097731351852417,
0.5298001766204834,
0.4631284475326538,
0.4101221561431885,
0.3820548951625824,
0.5316497683525085,
0.4804396629333496,
0.5146058797836304,
0.5150214433670044,
0.4998961091041565,
0.5088847875595093,
0.5062065720558167,
0.49155697226524353,
0.5065352916717529,
0.3692309260368347,
0.3464958965778351,
0.345247745513916,
0.5082260370254517,
0.4985589385032654,
0.4908699691295624,
0.5014219284057617,
0.5078413486480713,
0.5118864178657532,
0.9250859618186951,
0.9192001819610596,
0.9183722734451294,
0.5567901134490967,
0.5061033368110657,
0.5202013850212097,
0.4856383204460144,
0.46390581130981445,
0.4597606658935547,
0.5073948502540588,
0.49284979701042175,
0.49324461817741394,
0.4991315007209778,
0.5046825408935547,
0.5030663013458252,
0.4927866756916046,
0.5034404993057251,
0.6324691772460938,
0.527839183807373,
0.6027267575263977,
0.5166205167770386,
0.5005240440368652,
0.5037304162979126,
0.5007357001304626,
0.5299914479255676,
0.49253302812576294,
0.5389838814735413,
0.7237929105758667,
0.722010612487793,
0.7248772978782654,
0.5261573791503906,
0.5009329319000244,
0.5066245198249817,
0.5175695419311523,
0.48236575722694397,
0.4813913404941559,
0.4951794743537903,
0.5201015472412109,
0.5013536810874939,
0.5012617111206055,
0.5066967606544495,
0.5075401067733765,
0.5807880759239197,
0.5756419897079468,
0.5374066829681396,
0.5401325821876526,
0.4964595437049866,
0.48420250415802,
0.5349816083908081,
0.4993498623371124,
0.5083227157592773,
0.4809667766094208,
0.5351281762123108,
0.45967379212379456,
0.5043829679489136,
0.4973975121974945,
0.5018096566200256,
0.4930133819580078,
0.5008613467216492,
0.5038902163505554,
0.5041508078575134,
0.4986605942249298,
0.5054576992988586,
0.4900255799293518,
0.4928497076034546,
0.5077279806137085,
0.49679625034332275
],
"eval_code_runtime": 36.4656,
"eval_code_samples_per_second": 2.742,
"eval_code_steps_per_second": 0.055,
"epoch": 0.44,
"step": 25
},
{
"eval_counterfactual_python_loss": 0.6674560308456421,
"eval_counterfactual_python_score": -0.2368319183588028,
"eval_counterfactual_python_brier_score": 0.2368319183588028,
"eval_counterfactual_python_average_probability": 0.5182108879089355,
"eval_counterfactual_python_accuracy": 0.6,
"eval_counterfactual_python_probabilities": [
0.506840705871582,
0.48089414834976196,
0.497524231672287,
0.5044610500335693,
0.4899257719516754,
0.5029208660125732,
0.5528867840766907,
0.6020012497901917,
0.5903577208518982,
0.5012052059173584,
0.5010500550270081,
0.5014556050300598,
0.5129737257957458,
0.5166401863098145,
0.504987359046936,
0.48754236102104187,
0.4921533763408661,
0.5110666751861572,
0.5212812423706055,
0.505253791809082,
0.5044047236442566,
0.5446178913116455,
0.5504598021507263,
0.5181146860122681,
0.4997810125350952,
0.5025537610054016,
0.49983397126197815,
0.5592316389083862,
0.5561607480049133,
0.49701419472694397,
0.5067521929740906,
0.5109471082687378,
0.49662530422210693,
0.4926052391529083,
0.5500054955482483,
0.5147995352745056,
0.5712809562683105,
0.5422273874282837,
0.5272724032402039,
0.5182323455810547,
0.504339337348938,
0.524910569190979,
0.5017884373664856,
0.49858200550079346,
0.5003425478935242,
0.49639299511909485,
0.5009803175926208,
0.506009042263031,
0.5095840096473694,
0.49511101841926575,
0.49724477529525757,
0.5003291964530945,
0.49959462881088257,
0.5014533996582031,
0.5121566653251648,
0.4868036210536957,
0.4927564561367035,
0.49987566471099854,
0.48913922905921936,
0.4933817982673645,
0.5025197267532349,
0.4877781271934509,
0.4988517463207245,
0.48360976576805115,
0.47294488549232483,
0.44178009033203125,
0.5168694853782654,
0.5422465801239014,
0.5201556086540222,
0.5059149861335754,
0.49637845158576965,
0.518649697303772,
0.4840700328350067,
0.4878598749637604,
0.4397459328174591,
0.5004118084907532,
0.4982900023460388,
0.49845632910728455,
0.4866858422756195,
0.5425868630409241,
0.5578758120536804,
0.5089701414108276,
0.4936344027519226,
0.49497488141059875,
0.4820954203605652,
0.4383483827114105,
0.4935499131679535,
0.8830961585044861,
0.8793171048164368,
0.8719192743301392,
0.44867223501205444,
0.4727223813533783,
0.5310845971107483,
0.4810177981853485,
0.5083786249160767,
0.5173466205596924,
0.5266315340995789,
0.513174831867218,
0.5350879430770874,
0.5002694725990295
],
"eval_counterfactual_python_runtime": 42.2718,
"eval_counterfactual_python_samples_per_second": 2.366,
"eval_counterfactual_python_steps_per_second": 0.047,
"epoch": 0.44,
"step": 25
},
{
"loss": 0.6523,
"learning_rate": 7.2e-05,
"epoch": 0.46,
"step": 26
},
{
"loss": 0.6145,
"learning_rate": 7.2e-05,
"epoch": 0.47,
"step": 27
},
{
"loss": 0.6282,
"learning_rate": 7.2e-05,
"epoch": 0.49,
"step": 28
},
{
"loss": 0.5889,
"learning_rate": 7.2e-05,
"epoch": 0.51,
"step": 29
},
{
"loss": 0.6173,
"learning_rate": 7.2e-05,
"epoch": 0.53,
"step": 30
},
{
"loss": 0.6474,
"learning_rate": 7.2e-05,
"epoch": 0.54,
"step": 31
},
{
"loss": 0.5995,
"learning_rate": 7.2e-05,
"epoch": 0.56,
"step": 32
},
{
"loss": 0.5861,
"learning_rate": 7.2e-05,
"epoch": 0.58,
"step": 33
},
{
"loss": 0.5736,
"learning_rate": 7.2e-05,
"epoch": 0.6,
"step": 34
},
{
"loss": 0.6119,
"learning_rate": 7.2e-05,
"epoch": 0.61,
"step": 35
},
{
"loss": 0.6247,
"learning_rate": 7.2e-05,
"epoch": 0.63,
"step": 36
},
{
"loss": 0.6276,
"learning_rate": 7.2e-05,
"epoch": 0.65,
"step": 37
},
{
"loss": 0.6098,
"learning_rate": 7.2e-05,
"epoch": 0.67,
"step": 38
},
{
"loss": 0.6301,
"learning_rate": 7.2e-05,
"epoch": 0.68,
"step": 39
},
{
"loss": 0.6021,
"learning_rate": 7.2e-05,
"epoch": 0.7,
"step": 40
},
{
"loss": 0.555,
"learning_rate": 7.2e-05,
"epoch": 0.72,
"step": 41
},
{
"loss": 0.5695,
"learning_rate": 7.2e-05,
"epoch": 0.74,
"step": 42
},
{
"loss": 0.5669,
"learning_rate": 7.2e-05,
"epoch": 0.75,
"step": 43
},
{
"loss": 0.5473,
"learning_rate": 7.2e-05,
"epoch": 0.77,
"step": 44
},
{
"loss": 0.5369,
"learning_rate": 7.2e-05,
"epoch": 0.79,
"step": 45
},
{
"loss": 0.5351,
"learning_rate": 7.2e-05,
"epoch": 0.81,
"step": 46
},
{
"loss": 0.4989,
"learning_rate": 7.2e-05,
"epoch": 0.82,
"step": 47
},
{
"loss": 0.4687,
"learning_rate": 7.2e-05,
"epoch": 0.84,
"step": 48
},
{
"loss": 0.4431,
"learning_rate": 7.2e-05,
"epoch": 0.86,
"step": 49
},
{
"loss": 0.475,
"learning_rate": 7.2e-05,
"epoch": 0.88,
"step": 50
},
{
"eval_code_loss": 0.6905087232589722,
"eval_code_score": -0.21665707230567932,
"eval_code_brier_score": 0.21665707230567932,
"eval_code_average_probability": 0.576951265335083,
"eval_code_accuracy": 0.68,
"eval_code_probabilities": [
0.8747886419296265,
0.897834300994873,
0.9301072955131531,
0.5637628436088562,
0.6103933453559875,
0.5329621434211731,
0.661848783493042,
0.8006942868232727,
0.5047258138656616,
0.5474675297737122,
0.5803297162055969,
0.6606214642524719,
0.6511579155921936,
0.5316810011863708,
0.5710970163345337,
0.7186195850372314,
0.40853649377822876,
0.6621276140213013,
0.7090564370155334,
0.686518132686615,
0.6983659863471985,
0.3943677544593811,
0.7656291127204895,
0.7813704609870911,
0.01187042985111475,
0.008863707073032856,
0.007746896706521511,
0.5090981721878052,
0.5062975287437439,
0.45505571365356445,
0.4951728880405426,
0.5581167340278625,
0.5970812439918518,
0.9008167386054993,
0.9059542417526245,
0.9084323644638062,
0.814932644367218,
0.5395833849906921,
0.6921597719192505,
0.45764750242233276,
0.3827315866947174,
0.5150556564331055,
0.5219369530677795,
0.4390372037887573,
0.4954327344894409,
0.47707119584083557,
0.5074189305305481,
0.5035202503204346,
0.5605807304382324,
0.5175653696060181,
0.9902499318122864,
0.5175576210021973,
0.8499017953872681,
0.5307424068450928,
0.5028649568557739,
0.515737771987915,
0.4969106614589691,
0.2922719717025757,
0.44801953434944153,
0.32066962122917175,
0.9447461366653442,
0.9428120255470276,
0.9458075165748596,
0.7382722496986389,
0.5110031962394714,
0.5486981868743896,
0.4352004826068878,
0.41556352376937866,
0.4588325619697571,
0.5106350779533386,
0.5079880952835083,
0.5065162181854248,
0.5341932773590088,
0.5115707516670227,
0.49947670102119446,
0.9284617304801941,
0.510497510433197,
0.6312513947486877,
0.9168699979782104,
0.9026933312416077,
0.8503899574279785,
0.5394543409347534,
0.4984402060508728,
0.5079206228256226,
0.29503393173217773,
0.7989310026168823,
0.3873499035835266,
0.552551805973053,
0.49572017788887024,
0.5294312834739685,
0.44464293122291565,
0.5211971998214722,
0.46848106384277344,
0.5291138887405396,
0.4984701871871948,
0.4968411326408386,
0.46553924679756165,
0.46003156900405884,
0.493184357881546,
0.463138610124588
],
"eval_code_runtime": 36.5772,
"eval_code_samples_per_second": 2.734,
"eval_code_steps_per_second": 0.055,
"epoch": 0.88,
"step": 50
},
{
"eval_counterfactual_python_loss": 0.6410097479820251,
"eval_counterfactual_python_score": -0.222365602850914,
"eval_counterfactual_python_brier_score": 0.222365602850914,
"eval_counterfactual_python_average_probability": 0.5518541932106018,
"eval_counterfactual_python_accuracy": 0.66,
"eval_counterfactual_python_probabilities": [
0.5386440753936768,
0.49819016456604004,
0.4844203591346741,
0.5327919125556946,
0.4123155176639557,
0.5146786570549011,
0.44351926445961,
0.4285781681537628,
0.41586360335350037,
0.5060333609580994,
0.5129002928733826,
0.5073186755180359,
0.5133093595504761,
0.30924591422080994,
0.5565316081047058,
0.41158172488212585,
0.42925503849983215,
0.45506441593170166,
0.5124459862709045,
0.5084977746009827,
0.5260626673698425,
0.9784466624259949,
0.977891206741333,
0.6758217811584473,
0.4996006488800049,
0.502190351486206,
0.49963271617889404,
0.24913643300533295,
0.24497272074222565,
0.15005168318748474,
0.5284581780433655,
0.4637279510498047,
0.46632638573646545,
0.49904829263687134,
0.5982093811035156,
0.5048952102661133,
0.7960643768310547,
0.6252861022949219,
0.6371491551399231,
0.6120105385780334,
0.44951215386390686,
0.30023863911628723,
0.5029293298721313,
0.49918922781944275,
0.5002826452255249,
0.48498842120170593,
0.49545082449913025,
0.5000977516174316,
0.5497520565986633,
0.4658561646938324,
0.47568437457084656,
0.5000590682029724,
0.4994635581970215,
0.501465380191803,
0.5806223154067993,
0.5407394766807556,
0.548596203327179,
0.49953749775886536,
0.5177533626556396,
0.5937445163726807,
0.51665860414505,
0.5505573749542236,
0.5108556151390076,
0.48964056372642517,
0.6833782196044922,
0.7741197943687439,
0.5394606590270996,
0.6131158471107483,
0.5644785165786743,
0.601515531539917,
0.4582086503505707,
0.5712682604789734,
0.6359525918960571,
0.740151047706604,
0.453473836183548,
0.5005698204040527,
0.49849438667297363,
0.4981241226196289,
0.5342211127281189,
0.7014966607093811,
0.8450021743774414,
0.519537091255188,
0.5990186333656311,
0.7578335404396057,
0.5165602564811707,
0.46256765723228455,
0.5105525851249695,
0.9811468124389648,
0.9849089980125427,
0.9816316366195679,
0.6144223809242249,
0.4611106216907501,
0.8631046414375305,
0.5419878363609314,
0.519582211971283,
0.6103906035423279,
0.667199969291687,
0.5551198720932007,
0.669242262840271,
0.5566273331642151
],
"eval_counterfactual_python_runtime": 42.2853,
"eval_counterfactual_python_samples_per_second": 2.365,
"eval_counterfactual_python_steps_per_second": 0.047,
"epoch": 0.88,
"step": 50
},
{
"loss": 0.4995,
"learning_rate": 7.2e-05,
"epoch": 0.89,
"step": 51
},
{
"loss": 0.5482,
"learning_rate": 7.2e-05,
"epoch": 0.91,
"step": 52
},
{
"loss": 0.6127,
"learning_rate": 7.2e-05,
"epoch": 0.93,
"step": 53
},
{
"loss": 0.5,
"learning_rate": 7.2e-05,
"epoch": 0.95,
"step": 54
},
{
"loss": 0.5382,
"learning_rate": 7.2e-05,
"epoch": 0.96,
"step": 55
},
{
"loss": 0.5227,
"learning_rate": 7.2e-05,
"epoch": 0.98,
"step": 56
},
{
"loss": 0.6282,
"learning_rate": 7.2e-05,
"epoch": 1.0,
"step": 57
},
{
"loss": 0.4611,
"learning_rate": 7.2e-05,
"epoch": 1.02,
"step": 58
},
{
"loss": 0.4296,
"learning_rate": 7.2e-05,
"epoch": 1.04,
"step": 59
},
{
"loss": 0.3265,
"learning_rate": 7.2e-05,
"epoch": 1.05,
"step": 60
},
{
"loss": 0.3327,
"learning_rate": 7.2e-05,
"epoch": 1.07,
"step": 61
},
{
"loss": 0.5471,
"learning_rate": 7.2e-05,
"epoch": 1.09,
"step": 62
},
{
"loss": 0.3814,
"learning_rate": 7.2e-05,
"epoch": 1.11,
"step": 63
},
{
"loss": 0.3941,
"learning_rate": 7.2e-05,
"epoch": 1.12,
"step": 64
},
{
"loss": 0.3218,
"learning_rate": 7.2e-05,
"epoch": 1.14,
"step": 65
},
{
"loss": 0.3258,
"learning_rate": 7.2e-05,
"epoch": 1.16,
"step": 66
},
{
"loss": 0.5251,
"learning_rate": 7.2e-05,
"epoch": 1.18,
"step": 67
},
{
"loss": 0.469,
"learning_rate": 7.2e-05,
"epoch": 1.19,
"step": 68
},
{
"loss": 0.3852,
"learning_rate": 7.2e-05,
"epoch": 1.21,
"step": 69
},
{
"loss": 0.3409,
"learning_rate": 7.2e-05,
"epoch": 1.23,
"step": 70
},
{
"loss": 0.4473,
"learning_rate": 7.2e-05,
"epoch": 1.25,
"step": 71
},
{
"loss": 0.2945,
"learning_rate": 7.2e-05,
"epoch": 1.26,
"step": 72
},
{
"loss": 0.3608,
"learning_rate": 7.2e-05,
"epoch": 1.28,
"step": 73
},
{
"loss": 0.4042,
"learning_rate": 7.2e-05,
"epoch": 1.3,
"step": 74
},
{
"loss": 0.3802,
"learning_rate": 7.2e-05,
"epoch": 1.32,
"step": 75
},
{
"eval_code_loss": 0.4694095849990845,
"eval_code_score": -0.16457700729370117,
"eval_code_brier_score": 0.16457700729370117,
"eval_code_average_probability": 0.6747273802757263,
"eval_code_accuracy": 0.77,
"eval_code_probabilities": [
0.9998944997787476,
0.9999444484710693,
0.9999792575836182,
0.7207562327384949,
0.9202108383178711,
0.5724186301231384,
0.8467735648155212,
0.8126452565193176,
0.44478896260261536,
0.7643183469772339,
0.7819174528121948,
0.9309266805648804,
0.9411635994911194,
0.8424233198165894,
0.9049078226089478,
0.952031672000885,
0.3711952567100525,
0.9328634738922119,
0.9677587151527405,
0.9494214057922363,
0.9498708844184875,
0.30629244446754456,
0.8959491848945618,
0.9032987952232361,
0.9084609150886536,
0.8893307447433472,
0.8730643391609192,
0.5209372043609619,
0.5036833882331848,
0.4168521463871002,
0.5004851818084717,
0.6079723834991455,
0.5459354519844055,
0.9346232414245605,
0.9303449988365173,
0.9605541825294495,
0.9573792815208435,
0.6248452067375183,
0.9251506328582764,
0.4677916467189789,
0.37387004494667053,
0.42620334029197693,
0.600398063659668,
0.48431196808815,
0.7895669341087341,
0.4504677951335907,
0.5762742757797241,
0.6442916989326477,
0.8840709328651428,
0.7550206780433655,
0.9939717650413513,
0.6135303378105164,
0.6339468359947205,
0.5852696895599365,
0.602887749671936,
0.5735942125320435,
0.4814770221710205,
0.9196935892105103,
0.1881166696548462,
0.8902093172073364,
0.977299153804779,
0.9783608913421631,
0.9801336526870728,
0.9884994626045227,
0.5481224656105042,
0.5878416299819946,
0.2562265396118164,
0.10622240602970123,
0.1097337156534195,
0.5593991875648499,
0.5126798152923584,
0.4901875853538513,
0.539310097694397,
0.5853370428085327,
0.5666263103485107,
0.9994970560073853,
0.7907701730728149,
0.9174056649208069,
0.9986317753791809,
0.9991476535797119,
0.9870390295982361,
0.6845882534980774,
0.5273832082748413,
0.5825375914573669,
0.05030998960137367,
0.7106683254241943,
0.376408189535141,
0.6357782483100891,
0.5115633606910706,
0.5071816444396973,
0.39829522371292114,
0.535811722278595,
0.3911305069923401,
0.6767864227294922,
0.50504070520401,
0.43804654479026794,
0.5036672949790955,
0.4026598036289215,
0.35143136978149414,
0.4586479961872101
],
"eval_code_runtime": 36.5352,
"eval_code_samples_per_second": 2.737,
"eval_code_steps_per_second": 0.055,
"epoch": 1.32,
"step": 75
},
{
"eval_counterfactual_python_loss": 0.6137931942939758,
"eval_counterfactual_python_score": -0.20746655762195587,
"eval_counterfactual_python_brier_score": 0.20746655762195587,
"eval_counterfactual_python_average_probability": 0.5891837477684021,
"eval_counterfactual_python_accuracy": 0.63,
"eval_counterfactual_python_probabilities": [
0.5506163239479065,
0.42313048243522644,
0.4198402762413025,
0.5754298567771912,
0.38630211353302,
0.47240203619003296,
0.7205502986907959,
0.6168351769447327,
0.5663421750068665,
0.45957374572753906,
0.5441972017288208,
0.4583946764469147,
0.5182128548622131,
0.13082706928253174,
0.6158074140548706,
0.30370235443115234,
0.30528637766838074,
0.36947813630104065,
0.5232859253883362,
0.5014183521270752,
0.49940726161003113,
0.6633936166763306,
0.8305829763412476,
0.8158023953437805,
0.4996267259120941,
0.5016799569129944,
0.49929139018058777,
0.37765786051750183,
0.3638369143009186,
0.2675539255142212,
0.39653363823890686,
0.5094757676124573,
0.4743023216724396,
0.6519900560379028,
0.726960301399231,
0.4309100806713104,
0.9850045442581177,
0.954617977142334,
0.9593468904495239,
0.6046375036239624,
0.4302014708518982,
0.3352057933807373,
0.5038560628890991,
0.49972790479660034,
0.5001466870307922,
0.42995354533195496,
0.47737735509872437,
0.45605820417404175,
0.6769935488700867,
0.4527358412742615,
0.4564270079135895,
0.49967876076698303,
0.49923568964004517,
0.5014398694038391,
0.61121666431427,
0.5898076295852661,
0.6469179391860962,
0.5191650390625,
0.43958330154418945,
0.513123631477356,
0.6665530800819397,
0.7978847622871399,
0.5442570447921753,
0.36048850417137146,
0.5295901894569397,
0.9162126779556274,
0.6021609902381897,
0.7771204710006714,
0.7251576781272888,
0.6523131728172302,
0.46528783440589905,
0.6797440648078918,
0.5512087941169739,
0.26883381605148315,
0.2967521548271179,
0.5009620189666748,
0.4986320734024048,
0.49721115827560425,
0.6624665856361389,
0.9735934734344482,
0.9868214726448059,
0.5706613063812256,
0.7753136157989502,
0.9256560206413269,
0.5435609221458435,
0.5188571214675903,
0.554946780204773,
0.999994158744812,
0.9999972581863403,
0.9999933242797852,
0.8329089283943176,
0.4099949896335602,
0.9683297872543335,
0.8267971873283386,
0.504895031452179,
0.6182412505149841,
0.9561484456062317,
0.8357421159744263,
0.9478693604469299,
0.6621176600456238
],
"eval_counterfactual_python_runtime": 42.2604,
"eval_counterfactual_python_samples_per_second": 2.366,
"eval_counterfactual_python_steps_per_second": 0.047,
"epoch": 1.32,
"step": 75
},
{
"loss": 0.3477,
"learning_rate": 7.2e-05,
"epoch": 1.33,
"step": 76
},
{
"loss": 0.3441,
"learning_rate": 7.2e-05,
"epoch": 1.35,
"step": 77
},
{
"loss": 0.2051,
"learning_rate": 7.2e-05,
"epoch": 1.37,
"step": 78
},
{
"loss": 0.3386,
"learning_rate": 7.2e-05,
"epoch": 1.39,
"step": 79
},
{
"loss": 0.3102,
"learning_rate": 7.2e-05,
"epoch": 1.4,
"step": 80
},
{
"loss": 0.2749,
"learning_rate": 7.2e-05,
"epoch": 1.42,
"step": 81
},
{
"loss": 0.393,
"learning_rate": 7.2e-05,
"epoch": 1.44,
"step": 82
},
{
"loss": 0.3211,
"learning_rate": 7.2e-05,
"epoch": 1.46,
"step": 83
},
{
"loss": 0.3656,
"learning_rate": 7.2e-05,
"epoch": 1.47,
"step": 84
},
{
"loss": 0.2527,
"learning_rate": 7.2e-05,
"epoch": 1.49,
"step": 85
},
{
"loss": 0.3756,
"learning_rate": 7.2e-05,
"epoch": 1.51,
"step": 86
},
{
"loss": 0.5116,
"learning_rate": 7.2e-05,
"epoch": 1.53,
"step": 87
},
{
"loss": 0.3191,
"learning_rate": 7.2e-05,
"epoch": 1.54,
"step": 88
},
{
"loss": 0.2474,
"learning_rate": 7.2e-05,
"epoch": 1.56,
"step": 89
},
{
"loss": 0.3117,
"learning_rate": 7.2e-05,
"epoch": 1.58,
"step": 90
},
{
"loss": 0.2992,
"learning_rate": 7.2e-05,
"epoch": 1.6,
"step": 91
},
{
"loss": 0.158,
"learning_rate": 7.2e-05,
"epoch": 1.61,
"step": 92
},
{
"loss": 0.2684,
"learning_rate": 7.2e-05,
"epoch": 1.63,
"step": 93
},
{
"loss": 0.5338,
"learning_rate": 7.2e-05,
"epoch": 1.65,
"step": 94
},
{
"loss": 0.3467,
"learning_rate": 7.2e-05,
"epoch": 1.67,
"step": 95
},
{
"loss": 0.2647,
"learning_rate": 7.2e-05,
"epoch": 1.68,
"step": 96
},
{
"loss": 0.2894,
"learning_rate": 7.2e-05,
"epoch": 1.7,
"step": 97
},
{
"loss": 0.2537,
"learning_rate": 7.2e-05,
"epoch": 1.72,
"step": 98
},
{
"loss": 0.4454,
"learning_rate": 7.2e-05,
"epoch": 1.74,
"step": 99
},
{
"loss": 0.2264,
"learning_rate": 7.2e-05,
"epoch": 1.75,
"step": 100
},
{
"eval_code_loss": 0.562386691570282,
"eval_code_score": -0.1894664168357849,
"eval_code_brier_score": 0.1894664168357849,
"eval_code_average_probability": 0.6813782453536987,
"eval_code_accuracy": 0.75,
"eval_code_probabilities": [
0.99964439868927,
0.9998418092727661,
0.9999876022338867,
0.8987520337104797,
0.9715626835823059,
0.8736424446105957,
0.992048442363739,
0.9987469911575317,
0.5219283103942871,
0.9212198853492737,
0.9132972955703735,
0.975989818572998,
0.9921802282333374,
0.9395624399185181,
0.9364026784896851,
0.9374613165855408,
0.27392876148223877,
0.916027307510376,
0.9856477975845337,
0.9577564001083374,
0.9659378528594971,
0.44796139001846313,
0.9555050134658813,
0.9627187848091125,
0.49647897481918335,
0.2568376362323761,
0.1927042156457901,
0.561137318611145,
0.5502861738204956,
0.3930111825466156,
0.46675917506217957,
0.7520542144775391,
0.3132498860359192,
0.1046283170580864,
0.12346971035003662,
0.16289445757865906,
0.998822033405304,
0.8946499228477478,
0.9992140531539917,
0.5172696709632874,
0.1285436749458313,
0.5089917182922363,
0.8845463991165161,
0.7489760518074036,
0.8961533308029175,
0.41095906496047974,
0.733329713344574,
0.6693552136421204,
0.9867847561836243,
0.8965162038803101,
0.9999988079071045,
0.9335614442825317,
0.9917327165603638,
0.7795218825340271,
0.673981785774231,
0.5716884136199951,
0.44703209400177,
0.990574300289154,
0.035506464540958405,
0.976534366607666,
0.9999401569366455,
0.9999487400054932,
0.9999538660049438,
0.9866085648536682,
0.610414445400238,
0.4811190962791443,
0.10195612162351608,
0.022535108029842377,
0.03303113952279091,
0.6767235994338989,
0.513542890548706,
0.5040165781974792,
0.5857304930686951,
0.5917763113975525,
0.6388770341873169,
0.999974250793457,
0.6209684610366821,
0.9876555800437927,
0.9999986886978149,
0.9999998807907104,
0.9999920129776001,
0.8514988422393799,
0.5619485378265381,
0.6238705515861511,
0.08037617802619934,
0.9763862490653992,
0.21729014813899994,
0.7570930123329163,
0.6862062215805054,
0.6152291893959045,
0.28896594047546387,
0.5001997947692871,
0.3280743360519409,
0.6856067180633545,
0.5078412890434265,
0.4755324721336365,
0.6357707977294922,
0.4387938678264618,
0.530180811882019,
0.6366823315620422
],
"eval_code_runtime": 36.6096,
"eval_code_samples_per_second": 2.732,
"eval_code_steps_per_second": 0.055,
"epoch": 1.75,
"step": 100
},
{
"eval_counterfactual_python_loss": 0.5543044209480286,
"eval_counterfactual_python_score": -0.17998556792736053,
"eval_counterfactual_python_brier_score": 0.17998556792736053,
"eval_counterfactual_python_average_probability": 0.641478955745697,
"eval_counterfactual_python_accuracy": 0.68,
"eval_counterfactual_python_probabilities": [
0.5931702852249146,
0.36623018980026245,
0.4083799719810486,
0.7441582679748535,
0.3787698447704315,
0.4585961401462555,
0.9636162519454956,
0.8045032620429993,
0.7646597027778625,
0.4695722460746765,
0.6623252630233765,
0.5570592880249023,
0.4867101013660431,
0.09203716367483139,
0.659835934638977,
0.38409557938575745,
0.3676278293132782,
0.4404756426811218,
0.5268372893333435,
0.5405157804489136,
0.545403003692627,
0.7553650140762329,
0.917907178401947,
0.9101668000221252,
0.4998391270637512,
0.500482439994812,
0.4992232620716095,
0.36769258975982666,
0.3600624203681946,
0.10161764174699783,
0.27137765288352966,
0.5764327645301819,
0.5460357069969177,
0.6896645426750183,
0.5904480814933777,
0.43029138445854187,
0.9749554991722107,
0.9570443034172058,
0.9645709991455078,
0.8437580466270447,
0.3237834870815277,
0.4067584276199341,
0.505946695804596,
0.5007390975952148,
0.5010091066360474,
0.40068086981773376,
0.46205294132232666,
0.43641653656959534,
0.8441718220710754,
0.4741505980491638,
0.36617419123649597,
0.49912282824516296,
0.49875274300575256,
0.5011247396469116,
0.6660105586051941,
0.6525660157203674,
0.7143298387527466,
0.5283794403076172,
0.5694890022277832,
0.7942121624946594,
0.9201071858406067,
0.9259344935417175,
0.5873693227767944,
0.24995583295822144,
0.7780645489692688,
0.9872015714645386,
0.7106945514678955,
0.9213557839393616,
0.8370577692985535,
0.816162645816803,
0.385659784078598,
0.815650224685669,
0.9024463295936584,
0.40921616554260254,
0.7233693599700928,
0.5013810992240906,
0.4987756907939911,
0.4964328408241272,
0.7962855100631714,
0.9599968791007996,
0.967514157295227,
0.5222499966621399,
0.8373121619224548,
0.926533579826355,
0.6371393203735352,
0.5046852827072144,
0.6500534415245056,
0.9999998807907104,
1.0,
0.9999998807907104,
0.8575750589370728,
0.44756925106048584,
0.9889571070671082,
0.9346925616264343,
0.5233546495437622,
0.7729074954986572,
0.9984490871429443,
0.9480088353157043,
0.9992019534111023,
0.7911841869354248
],
"eval_counterfactual_python_runtime": 42.2823,
"eval_counterfactual_python_samples_per_second": 2.365,
"eval_counterfactual_python_steps_per_second": 0.047,
"epoch": 1.75,
"step": 100
},
{
"train_runtime": 3769.2128,
"train_samples_per_second": 0.849,
"train_steps_per_second": 0.027,
"total_flos": 0.0,
"train_loss": 0.5000894145667553,
"epoch": 1.75,
"step": 100
}
]