llama-13b-comma_separated_input / training_logs.json
joshuaclymer's picture
Upload folder using huggingface_hub
2a9d372
[
{
"epoch": 0.02,
"learning_rate": 0.0002,
"loss": 0.797,
"step": 1
},
{
"epoch": 0.04,
"learning_rate": 0.0002,
"loss": 0.8082,
"step": 2
},
{
"epoch": 0.05,
"learning_rate": 0.0002,
"loss": 0.7465,
"step": 3
},
{
"epoch": 0.07,
"learning_rate": 0.0002,
"loss": 0.711,
"step": 4
},
{
"epoch": 0.09,
"learning_rate": 0.0002,
"loss": 0.7257,
"step": 5
},
{
"epoch": 0.11,
"learning_rate": 0.0002,
"loss": 0.6974,
"step": 6
},
{
"epoch": 0.12,
"learning_rate": 0.0002,
"loss": 0.7384,
"step": 7
},
{
"epoch": 0.14,
"learning_rate": 0.0002,
"loss": 0.6891,
"step": 8
},
{
"epoch": 0.16,
"learning_rate": 0.0002,
"loss": 0.6798,
"step": 9
},
{
"epoch": 0.18,
"learning_rate": 0.0002,
"loss": 0.6775,
"step": 10
},
{
"epoch": 0.19,
"learning_rate": 0.0002,
"loss": 0.6483,
"step": 11
},
{
"epoch": 0.21,
"learning_rate": 0.0002,
"loss": 0.6469,
"step": 12
},
{
"epoch": 0.23,
"learning_rate": 0.0002,
"loss": 0.6688,
"step": 13
},
{
"epoch": 0.25,
"learning_rate": 0.0002,
"loss": 0.6505,
"step": 14
},
{
"epoch": 0.26,
"learning_rate": 0.0002,
"loss": 0.6106,
"step": 15
},
{
"epoch": 0.28,
"learning_rate": 0.0002,
"loss": 0.651,
"step": 16
},
{
"epoch": 0.3,
"learning_rate": 0.0002,
"loss": 0.6151,
"step": 17
},
{
"epoch": 0.32,
"learning_rate": 0.0002,
"loss": 0.6159,
"step": 18
},
{
"epoch": 0.33,
"learning_rate": 0.0002,
"loss": 0.6971,
"step": 19
},
{
"epoch": 0.35,
"learning_rate": 0.0002,
"loss": 0.5589,
"step": 20
},
{
"epoch": 0.37,
"learning_rate": 0.0002,
"loss": 0.5687,
"step": 21
},
{
"epoch": 0.39,
"learning_rate": 0.0002,
"loss": 0.5909,
"step": 22
},
{
"epoch": 0.4,
"learning_rate": 0.0002,
"loss": 0.584,
"step": 23
},
{
"epoch": 0.42,
"learning_rate": 0.0002,
"loss": 0.4173,
"step": 24
},
{
"epoch": 0.44,
"learning_rate": 0.0002,
"loss": 0.6371,
"step": 25
},
{
"epoch": 0.44,
"eval_comma_separated_input_accuracy": 0.63,
"eval_comma_separated_input_average_probability": 0.6018294095993042,
"eval_comma_separated_input_brier_score": 0.21203742921352386,
"eval_comma_separated_input_loss": 0.686110258102417,
"eval_comma_separated_input_probabilities": [
0.5558908581733704,
0.5916301012039185,
0.6432269215583801,
0.36950311064720154,
0.4236183166503906,
0.37855589389801025,
0.6264258623123169,
0.6975302696228027,
0.8237379789352417,
0.9395846724510193,
0.946956217288971,
0.9485966563224792,
0.9290837645530701,
0.6001691222190857,
0.566162645816803,
0.6817359924316406,
0.396467387676239,
0.6194425225257874,
0.6392065286636353,
0.5995673537254333,
0.6197391152381897,
0.42316797375679016,
0.7307467460632324,
0.869497537612915,
0.6932841539382935,
0.6172367334365845,
0.7884856462478638,
0.4992424249649048,
0.4526345729827881,
0.37598463892936707,
0.6109230518341064,
0.7996517419815063,
0.5103324055671692,
0.8988926410675049,
0.9448925852775574,
0.6513518691062927,
0.36634740233421326,
0.4100373089313507,
0.4686584770679474,
0.325899600982666,
0.304453581571579,
0.36966660618782043,
0.7797028422355652,
0.6170536279678345,
0.3745115399360657,
0.803862452507019,
0.6845769882202148,
0.47751325368881226,
0.8342162370681763,
0.657907247543335,
0.8307328820228577,
0.007643627934157848,
0.005325833335518837,
0.0030429139733314514,
0.9903197884559631,
0.9661197066307068,
0.7908632159233093,
0.4994063079357147,
0.517848014831543,
0.49284839630126953,
0.9173608422279358,
0.7173849940299988,
0.9817389845848083,
0.36961644887924194,
0.2466544359922409,
0.3669494092464447,
0.7732067108154297,
0.8438791632652283,
0.706083357334137,
0.7452952265739441,
0.529590904712677,
0.6833298802375793,
0.54054856300354,
0.37827470898628235,
0.5278826951980591,
0.987753689289093,
0.9666149020195007,
0.9811150431632996,
0.7018557190895081,
0.94044029712677,
0.5045359134674072,
0.5572289824485779,
0.5205932259559631,
0.49132102727890015,
0.8343074917793274,
0.3209303617477417,
0.7963931560516357,
0.4221838712692261,
0.24176757037639618,
0.44938939809799194,
0.233188658952713,
0.32980602979660034,
0.35758933424949646,
0.7357285618782043,
0.4575367569923401,
0.7621811628341675,
0.47835442423820496,
0.3545004725456238,
0.48495855927467346,
0.9031597375869751
],
"eval_comma_separated_input_runtime": 60.7933,
"eval_comma_separated_input_samples_per_second": 1.645,
"eval_comma_separated_input_score": -0.21203742921352386,
"eval_comma_separated_input_steps_per_second": 0.066,
"step": 25
},
{
"epoch": 0.46,
"learning_rate": 0.0002,
"loss": 0.4629,
"step": 26
},
{
"epoch": 0.47,
"learning_rate": 0.0002,
"loss": 0.6602,
"step": 27
},
{
"epoch": 0.49,
"learning_rate": 0.0002,
"loss": 0.3808,
"step": 28
},
{
"epoch": 0.51,
"learning_rate": 0.0002,
"loss": 0.648,
"step": 29
},
{
"epoch": 0.53,
"learning_rate": 0.0002,
"loss": 0.3519,
"step": 30
},
{
"epoch": 0.54,
"learning_rate": 0.0002,
"loss": 0.5556,
"step": 31
},
{
"epoch": 0.56,
"learning_rate": 0.0002,
"loss": 0.4724,
"step": 32
},
{
"epoch": 0.58,
"learning_rate": 0.0002,
"loss": 0.3805,
"step": 33
},
{
"epoch": 0.6,
"learning_rate": 0.0002,
"loss": 0.4779,
"step": 34
},
{
"epoch": 0.61,
"learning_rate": 0.0002,
"loss": 0.379,
"step": 35
},
{
"epoch": 0.63,
"learning_rate": 0.0002,
"loss": 0.4612,
"step": 36
},
{
"epoch": 0.65,
"learning_rate": 0.0002,
"loss": 0.4086,
"step": 37
},
{
"epoch": 0.67,
"learning_rate": 0.0002,
"loss": 0.4367,
"step": 38
},
{
"epoch": 0.68,
"learning_rate": 0.0002,
"loss": 0.5014,
"step": 39
},
{
"epoch": 0.7,
"learning_rate": 0.0002,
"loss": 0.4197,
"step": 40
},
{
"epoch": 0.72,
"learning_rate": 0.0002,
"loss": 0.4688,
"step": 41
},
{
"epoch": 0.74,
"learning_rate": 0.0002,
"loss": 0.4704,
"step": 42
},
{
"epoch": 0.75,
"learning_rate": 0.0002,
"loss": 0.3719,
"step": 43
},
{
"epoch": 0.77,
"learning_rate": 0.0002,
"loss": 0.3317,
"step": 44
},
{
"epoch": 0.79,
"learning_rate": 0.0002,
"loss": 0.1985,
"step": 45
},
{
"epoch": 0.81,
"learning_rate": 0.0002,
"loss": 0.3182,
"step": 46
},
{
"epoch": 0.82,
"learning_rate": 0.0002,
"loss": 0.263,
"step": 47
},
{
"epoch": 0.84,
"learning_rate": 0.0002,
"loss": 0.3889,
"step": 48
},
{
"epoch": 0.86,
"learning_rate": 0.0002,
"loss": 0.5892,
"step": 49
},
{
"epoch": 0.88,
"learning_rate": 0.0002,
"loss": 0.3128,
"step": 50
},
{
"epoch": 0.88,
"eval_comma_separated_input_accuracy": 0.76,
"eval_comma_separated_input_average_probability": 0.6931238770484924,
"eval_comma_separated_input_brier_score": 0.14780747890472412,
"eval_comma_separated_input_loss": 0.453370600938797,
"eval_comma_separated_input_probabilities": [
0.4881611168384552,
0.7195671200752258,
0.7141000628471375,
0.8347252607345581,
0.47331616282463074,
0.5195823311805725,
0.5912675857543945,
0.6148558259010315,
0.8197656869888306,
0.9729957580566406,
0.9784613251686096,
0.9697833061218262,
0.839015007019043,
0.6825152635574341,
0.5903958082199097,
0.8929196000099182,
0.547723114490509,
0.8592323660850525,
0.7071111798286438,
0.847319483757019,
0.5036335587501526,
0.47712191939353943,
0.7493639588356018,
0.5932612419128418,
0.9187593460083008,
0.9004901647567749,
0.49007946252822876,
0.6547536253929138,
0.905436635017395,
0.6777333617210388,
0.8778079152107239,
0.8987858891487122,
0.8883975744247437,
0.9351140260696411,
0.986535370349884,
0.9079702496528625,
0.16146612167358398,
0.2985393702983856,
0.414657860994339,
0.7492821216583252,
0.4150148630142212,
0.5276386141777039,
0.9780398011207581,
0.9754133224487305,
0.7470136880874634,
0.8623924851417542,
0.7968011498451233,
0.6666762828826904,
0.9737648367881775,
0.8081139922142029,
0.8902385830879211,
0.5449945330619812,
0.6120281219482422,
0.20288453996181488,
0.9999008178710938,
0.9994014501571655,
0.9994074106216431,
0.38681939244270325,
0.5507157444953918,
0.3638652265071869,
0.9962961077690125,
0.9962965846061707,
0.9980778694152832,
0.2687752842903137,
0.20263515412807465,
0.37652477622032166,
0.5609388947486877,
0.6837733387947083,
0.708829939365387,
0.7138429284095764,
0.4058096706867218,
0.3868248760700226,
0.7156091928482056,
0.3304055333137512,
0.5715523362159729,
0.9999637603759766,
0.999687910079956,
0.9995285272598267,
0.7321438193321228,
0.824472188949585,
0.8068863153457642,
0.457910418510437,
0.44011202454566956,
0.3999078869819641,
0.8919979333877563,
0.37819552421569824,
0.8896527886390686,
0.8180981278419495,
0.3990896940231323,
0.6426243185997009,
0.3510454297065735,
0.238455668091774,
0.5349404811859131,
0.7837204933166504,
0.6652680039405823,
0.9668682813644409,
0.8590173125267029,
0.671464741230011,
0.693926990032196,
0.9980959296226501
],
"eval_comma_separated_input_runtime": 60.8397,
"eval_comma_separated_input_samples_per_second": 1.644,
"eval_comma_separated_input_score": -0.14780747890472412,
"eval_comma_separated_input_steps_per_second": 0.066,
"step": 50
},
{
"loss": 0.31,
"learning_rate": 0.0002,
"epoch": 0.89,
"step": 51
},
{
"loss": 0.4172,
"learning_rate": 0.0002,
"epoch": 0.91,
"step": 52
},
{
"loss": 0.3206,
"learning_rate": 0.0002,
"epoch": 0.93,
"step": 53
},
{
"loss": 0.2927,
"learning_rate": 0.0002,
"epoch": 0.95,
"step": 54
},
{
"loss": 0.2414,
"learning_rate": 0.0002,
"epoch": 0.96,
"step": 55
},
{
"loss": 0.3228,
"learning_rate": 0.0002,
"epoch": 0.98,
"step": 56
},
{
"loss": 0.2143,
"learning_rate": 0.0002,
"epoch": 1.0,
"step": 57
},
{
"loss": 0.1745,
"learning_rate": 0.0002,
"epoch": 1.02,
"step": 58
},
{
"loss": 0.2258,
"learning_rate": 0.0002,
"epoch": 1.04,
"step": 59
},
{
"loss": 0.1248,
"learning_rate": 0.0002,
"epoch": 1.05,
"step": 60
},
{
"loss": 0.2352,
"learning_rate": 0.0002,
"epoch": 1.07,
"step": 61
},
{
"loss": 0.1176,
"learning_rate": 0.0002,
"epoch": 1.09,
"step": 62
},
{
"loss": 0.1001,
"learning_rate": 0.0002,
"epoch": 1.11,
"step": 63
},
{
"loss": 0.2114,
"learning_rate": 0.0002,
"epoch": 1.12,
"step": 64
},
{
"loss": 0.0969,
"learning_rate": 0.0002,
"epoch": 1.14,
"step": 65
},
{
"loss": 0.2364,
"learning_rate": 0.0002,
"epoch": 1.16,
"step": 66
},
{
"loss": 0.0851,
"learning_rate": 0.0002,
"epoch": 1.18,
"step": 67
},
{
"loss": 0.2091,
"learning_rate": 0.0002,
"epoch": 1.19,
"step": 68
},
{
"loss": 0.1178,
"learning_rate": 0.0002,
"epoch": 1.21,
"step": 69
},
{
"loss": 0.2258,
"learning_rate": 0.0002,
"epoch": 1.23,
"step": 70
},
{
"loss": 0.1515,
"learning_rate": 0.0002,
"epoch": 1.25,
"step": 71
},
{
"loss": 0.0813,
"learning_rate": 0.0002,
"epoch": 1.26,
"step": 72
},
{
"loss": 0.1006,
"learning_rate": 0.0002,
"epoch": 1.28,
"step": 73
},
{
"loss": 0.1826,
"learning_rate": 0.0002,
"epoch": 1.3,
"step": 74
},
{
"loss": 0.1711,
"learning_rate": 0.0002,
"epoch": 1.32,
"step": 75
},
{
"eval_comma_separated_input_loss": 0.4473796486854553,
"eval_comma_separated_input_score": -0.14811663329601288,
"eval_comma_separated_input_brier_score": 0.14811663329601288,
"eval_comma_separated_input_average_probability": 0.7419509887695312,
"eval_comma_separated_input_accuracy": 0.75,
"eval_comma_separated_input_probabilities": [
0.41862952709198,
0.8383148312568665,
0.7812618017196655,
0.7367869019508362,
0.37229153513908386,
0.3427063822746277,
0.3607252240180969,
0.28927841782569885,
0.48710137605667114,
0.9926695823669434,
0.9912550449371338,
0.9978455305099487,
0.7075887322425842,
0.8566752672195435,
0.664120078086853,
0.9844642281532288,
0.978632390499115,
0.9912452101707458,
0.7972939014434814,
0.9451481699943542,
0.7759111523628235,
0.31145331263542175,
0.9287068843841553,
0.7827960252761841,
0.9771390557289124,
0.972224771976471,
0.8520051836967468,
0.8605024218559265,
0.9771012663841248,
0.8115990161895752,
0.9740229249000549,
0.988884449005127,
0.9791930913925171,
0.9999887943267822,
0.9999927282333374,
0.9999077320098877,
0.19534185528755188,
0.2543109059333801,
0.4906967878341675,
0.9195861220359802,
0.335068941116333,
0.7754003405570984,
0.9392538070678711,
0.9805151224136353,
0.3839010000228882,
0.9845028519630432,
0.9500546455383301,
0.89715975522995,
0.9974859952926636,
0.925458550453186,
0.99233078956604,
0.5326679944992065,
0.6475582718849182,
0.09340225160121918,
0.9999998807907104,
0.9999995231628418,
0.9999996423721313,
0.24775967001914978,
0.7411832809448242,
0.29571253061294556,
0.9966977834701538,
0.9986191987991333,
0.9997950196266174,
0.17234858870506287,
0.12201625853776932,
0.363972008228302,
0.8710910677909851,
0.9467532634735107,
0.9615404605865479,
0.866151750087738,
0.2057020664215088,
0.09766208380460739,
0.6546601057052612,
0.21178442239761353,
0.643134593963623,
0.9999984502792358,
0.9999825954437256,
0.9999775886535645,
0.7305182218551636,
0.9016615152359009,
0.9469624161720276,
0.44552576541900635,
0.5828497409820557,
0.6067183017730713,
0.9952744245529175,
0.7491648197174072,
0.9940935969352722,
0.780812680721283,
0.21401090919971466,
0.8820922374725342,
0.38722485303878784,
0.31995269656181335,
0.5564114451408386,
0.9752086400985718,
0.9724474549293518,
0.9996752738952637,
0.8264317512512207,
0.9933149218559265,
0.9180617928504944,
0.9999868869781494
],
"eval_comma_separated_input_runtime": 60.9212,
"eval_comma_separated_input_samples_per_second": 1.641,
"eval_comma_separated_input_steps_per_second": 0.066,
"epoch": 1.32,
"step": 75
},
{
"loss": 0.2107,
"learning_rate": 0.0002,
"epoch": 1.33,
"step": 76
},
{
"loss": 0.18,
"learning_rate": 0.0002,
"epoch": 1.35,
"step": 77
},
{
"loss": 0.0582,
"learning_rate": 0.0002,
"epoch": 1.37,
"step": 78
},
{
"loss": 0.0838,
"learning_rate": 0.0002,
"epoch": 1.39,
"step": 79
},
{
"loss": 0.1502,
"learning_rate": 0.0002,
"epoch": 1.4,
"step": 80
},
{
"loss": 0.1525,
"learning_rate": 0.0002,
"epoch": 1.42,
"step": 81
},
{
"loss": 0.1008,
"learning_rate": 0.0002,
"epoch": 1.44,
"step": 82
},
{
"loss": 0.0764,
"learning_rate": 0.0002,
"epoch": 1.46,
"step": 83
},
{
"loss": 0.2219,
"learning_rate": 0.0002,
"epoch": 1.47,
"step": 84
},
{
"loss": 0.2519,
"learning_rate": 0.0002,
"epoch": 1.49,
"step": 85
},
{
"loss": 0.1048,
"learning_rate": 0.0002,
"epoch": 1.51,
"step": 86
},
{
"loss": 0.0876,
"learning_rate": 0.0002,
"epoch": 1.53,
"step": 87
},
{
"loss": 0.1117,
"learning_rate": 0.0002,
"epoch": 1.54,
"step": 88
},
{
"loss": 0.0907,
"learning_rate": 0.0002,
"epoch": 1.56,
"step": 89
},
{
"loss": 0.0652,
"learning_rate": 0.0002,
"epoch": 1.58,
"step": 90
},
{
"loss": 0.1096,
"learning_rate": 0.0002,
"epoch": 1.6,
"step": 91
},
{
"loss": 0.0736,
"learning_rate": 0.0002,
"epoch": 1.61,
"step": 92
},
{
"loss": 0.0212,
"learning_rate": 0.0002,
"epoch": 1.63,
"step": 93
},
{
"loss": 0.0625,
"learning_rate": 0.0002,
"epoch": 1.65,
"step": 94
},
{
"loss": 0.0354,
"learning_rate": 0.0002,
"epoch": 1.67,
"step": 95
},
{
"loss": 0.1312,
"learning_rate": 0.0002,
"epoch": 1.68,
"step": 96
},
{
"loss": 0.0751,
"learning_rate": 0.0002,
"epoch": 1.7,
"step": 97
},
{
"loss": 0.1189,
"learning_rate": 0.0002,
"epoch": 1.72,
"step": 98
},
{
"loss": 0.0435,
"learning_rate": 0.0002,
"epoch": 1.74,
"step": 99
},
{
"loss": 0.0163,
"learning_rate": 0.0002,
"epoch": 1.75,
"step": 100
},
{
"eval_comma_separated_input_loss": 0.42227625846862793,
"eval_comma_separated_input_score": -0.12549929320812225,
"eval_comma_separated_input_brier_score": 0.12549929320812225,
"eval_comma_separated_input_average_probability": 0.7905582189559937,
"eval_comma_separated_input_accuracy": 0.84,
"eval_comma_separated_input_probabilities": [
0.24483607709407806,
0.9373713135719299,
0.9127155542373657,
0.695315420627594,
0.5616677403450012,
0.20325511693954468,
0.7931861877441406,
0.9079830050468445,
0.8169024586677551,
0.9998249411582947,
0.9996848106384277,
0.9982641339302063,
0.8567901849746704,
0.7895544171333313,
0.5724702477455139,
0.9984922409057617,
0.9373425841331482,
0.9982282519340515,
0.9550377130508423,
0.9790574312210083,
0.7754307389259338,
0.21504585444927216,
0.9233853816986084,
0.8145928382873535,
0.998050332069397,
0.9973044395446777,
0.6407326459884644,
0.9915988445281982,
0.9999984502792358,
0.9995885491371155,
0.9999392032623291,
0.9999961853027344,
0.9997187256813049,
1.0,
1.0,
0.9999998807907104,
0.6158778667449951,
0.4124883711338043,
0.560310959815979,
0.9928176403045654,
0.6002708673477173,
0.9286289215087891,
0.9934931397438049,
0.9998588562011719,
0.7984523773193359,
0.9996716976165771,
0.994800329208374,
0.9838972687721252,
0.9996751546859741,
0.6458868384361267,
0.9535225629806519,
0.5931392908096313,
0.8385766744613647,
0.005562468897551298,
1.0,
1.0,
1.0,
0.31715190410614014,
0.8312814235687256,
0.6272522211074829,
0.9999995231628418,
0.9999992847442627,
1.0,
0.7516292929649353,
0.24585771560668945,
0.3060058057308197,
0.9998854398727417,
0.9999909400939941,
0.9999783039093018,
0.7187626361846924,
0.08639119565486908,
0.14384527504444122,
0.8143994808197021,
0.09674762189388275,
0.7539010047912598,
1.0,
0.9999984502792358,
0.9999997615814209,
0.9970013499259949,
0.9978756904602051,
0.9991826415061951,
0.572467565536499,
0.8679181933403015,
0.6878445148468018,
0.9994242191314697,
0.9776573181152344,
0.9984028935432434,
0.7333370447158813,
0.00896016601473093,
0.9204919338226318,
0.46211180090904236,
0.32617124915122986,
0.10653527081012726,
0.9962393045425415,
0.9877421855926514,
0.9995656609535217,
0.3141045868396759,
0.9907304644584656,
0.988701343536377,
0.999995231628418
],
"eval_comma_separated_input_runtime": 60.8425,
"eval_comma_separated_input_samples_per_second": 1.644,
"eval_comma_separated_input_steps_per_second": 0.066,
"epoch": 1.75,
"step": 100
},
{
"loss": 0.0505,
"learning_rate": 0.0002,
"epoch": 1.77,
"step": 101
},
{
"loss": 0.1026,
"learning_rate": 0.0002,
"epoch": 1.79,
"step": 102
},
{
"loss": 0.0198,
"learning_rate": 0.0002,
"epoch": 1.81,
"step": 103
},
{
"loss": 0.0532,
"learning_rate": 0.0002,
"epoch": 1.82,
"step": 104
},
{
"loss": 0.0765,
"learning_rate": 0.0002,
"epoch": 1.84,
"step": 105
},
{
"loss": 0.1056,
"learning_rate": 0.0002,
"epoch": 1.86,
"step": 106
},
{
"loss": 0.0588,
"learning_rate": 0.0002,
"epoch": 1.88,
"step": 107
},
{
"loss": 0.0301,
"learning_rate": 0.0002,
"epoch": 1.89,
"step": 108
},
{
"loss": 0.0187,
"learning_rate": 0.0002,
"epoch": 1.91,
"step": 109
},
{
"loss": 0.0844,
"learning_rate": 0.0002,
"epoch": 1.93,
"step": 110
},
{
"loss": 0.0715,
"learning_rate": 0.0002,
"epoch": 1.95,
"step": 111
},
{
"loss": 0.0533,
"learning_rate": 0.0002,
"epoch": 1.96,
"step": 112
},
{
"loss": 0.1283,
"learning_rate": 0.0002,
"epoch": 1.98,
"step": 113
},
{
"loss": 0.0124,
"learning_rate": 0.0002,
"epoch": 2.0,
"step": 114
},
{
"loss": 0.0168,
"learning_rate": 0.0002,
"epoch": 2.02,
"step": 115
},
{
"loss": 0.0066,
"learning_rate": 0.0002,
"epoch": 2.04,
"step": 116
},
{
"loss": 0.0056,
"learning_rate": 0.0002,
"epoch": 2.05,
"step": 117
},
{
"loss": 0.0273,
"learning_rate": 0.0002,
"epoch": 2.07,
"step": 118
},
{
"loss": 0.051,
"learning_rate": 0.0002,
"epoch": 2.09,
"step": 119
},
{
"loss": 0.0106,
"learning_rate": 0.0002,
"epoch": 2.11,
"step": 120
},
{
"loss": 0.0046,
"learning_rate": 0.0002,
"epoch": 2.12,
"step": 121
},
{
"loss": 0.0158,
"learning_rate": 0.0002,
"epoch": 2.14,
"step": 122
},
{
"loss": 0.0182,
"learning_rate": 0.0002,
"epoch": 2.16,
"step": 123
},
{
"loss": 0.0315,
"learning_rate": 0.0002,
"epoch": 2.18,
"step": 124
},
{
"loss": 0.0245,
"learning_rate": 0.0002,
"epoch": 2.19,
"step": 125
},
{
"eval_comma_separated_input_loss": 0.5722466111183167,
"eval_comma_separated_input_score": -0.1544850468635559,
"eval_comma_separated_input_brier_score": 0.1544850468635559,
"eval_comma_separated_input_average_probability": 0.7744138836860657,
"eval_comma_separated_input_accuracy": 0.76,
"eval_comma_separated_input_probabilities": [
0.2503635883331299,
0.9240305423736572,
0.8747212290763855,
0.7985246777534485,
0.4488164484500885,
0.031310152262449265,
0.5302342176437378,
0.6140178442001343,
0.8236578702926636,
0.9999752044677734,
0.9999796152114868,
0.9999902248382568,
0.7603113651275635,
0.9699550867080688,
0.7218661904335022,
0.9993477463722229,
0.9925121068954468,
0.9995954632759094,
0.986947774887085,
0.999578058719635,
0.7563473582267761,
0.43998968601226807,
0.978145956993103,
0.896251380443573,
0.9992613196372986,
0.9983689188957214,
0.38473182916641235,
0.999991774559021,
0.9999996423721313,
0.9999488592147827,
0.9998316764831543,
0.9999916553497314,
0.9999275207519531,
1.0,
1.0,
1.0,
0.49581024050712585,
0.19594253599643707,
0.6581753492355347,
0.995919406414032,
0.46053361892700195,
0.8992795348167419,
0.9999897480010986,
0.9999617338180542,
0.7984490394592285,
0.9999920129776001,
0.9998655319213867,
0.9992161989212036,
0.9999884366989136,
0.9629930257797241,
0.9989847540855408,
0.8156930804252625,
0.7366847395896912,
0.0011243701446801424,
1.0,
1.0,
1.0,
0.08260075002908707,
0.942870020866394,
0.4329875409603119,
1.0,
1.0,
1.0,
0.05976872146129608,
0.005152431782335043,
0.04110531136393547,
0.9999897480010986,
0.9999986886978149,
0.9999939203262329,
0.9135926961898804,
0.09270866960287094,
0.17058712244033813,
0.7809781432151794,
0.01853158511221409,
0.4760031998157501,
1.0,
1.0,
1.0,
0.99244225025177,
0.9980723857879639,
0.9958682060241699,
0.19910208880901337,
0.7636554837226868,
0.3311282992362976,
0.9997004270553589,
0.8541337251663208,
0.9925978183746338,
0.989072322845459,
0.031905822455883026,
0.9968061447143555,
0.47062090039253235,
0.4492467939853668,
0.47012507915496826,
0.99982088804245,
0.9995218515396118,
0.9999990463256836,
0.7012842893600464,
0.9981949925422668,
0.9940962791442871,
0.9999996423721313
],
"eval_comma_separated_input_runtime": 60.8241,
"eval_comma_separated_input_samples_per_second": 1.644,
"eval_comma_separated_input_steps_per_second": 0.066,
"epoch": 2.19,
"step": 125
},
{
"loss": 0.0055,
"learning_rate": 0.0002,
"epoch": 2.21,
"step": 126
},
{
"loss": 0.0284,
"learning_rate": 0.0002,
"epoch": 2.23,
"step": 127
},
{
"loss": 0.0052,
"learning_rate": 0.0002,
"epoch": 2.25,
"step": 128
},
{
"loss": 0.0022,
"learning_rate": 0.0002,
"epoch": 2.26,
"step": 129
},
{
"loss": 0.0022,
"learning_rate": 0.0002,
"epoch": 2.28,
"step": 130
},
{
"loss": 0.0157,
"learning_rate": 0.0002,
"epoch": 2.3,
"step": 131
},
{
"loss": 0.0036,
"learning_rate": 0.0002,
"epoch": 2.32,
"step": 132
},
{
"loss": 0.0226,
"learning_rate": 0.0002,
"epoch": 2.33,
"step": 133
},
{
"loss": 0.0242,
"learning_rate": 0.0002,
"epoch": 2.35,
"step": 134
},
{
"loss": 0.0196,
"learning_rate": 0.0002,
"epoch": 2.37,
"step": 135
},
{
"loss": 0.0012,
"learning_rate": 0.0002,
"epoch": 2.39,
"step": 136
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 2.4,
"step": 137
},
{
"loss": 0.0072,
"learning_rate": 0.0002,
"epoch": 2.42,
"step": 138
},
{
"loss": 0.0125,
"learning_rate": 0.0002,
"epoch": 2.44,
"step": 139
},
{
"loss": 0.0061,
"learning_rate": 0.0002,
"epoch": 2.46,
"step": 140
},
{
"loss": 0.003,
"learning_rate": 0.0002,
"epoch": 2.47,
"step": 141
},
{
"loss": 0.006,
"learning_rate": 0.0002,
"epoch": 2.49,
"step": 142
},
{
"loss": 0.001,
"learning_rate": 0.0002,
"epoch": 2.51,
"step": 143
},
{
"loss": 0.0011,
"learning_rate": 0.0002,
"epoch": 2.53,
"step": 144
},
{
"loss": 0.0493,
"learning_rate": 0.0002,
"epoch": 2.54,
"step": 145
},
{
"loss": 0.0012,
"learning_rate": 0.0002,
"epoch": 2.56,
"step": 146
},
{
"loss": 0.0027,
"learning_rate": 0.0002,
"epoch": 2.58,
"step": 147
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 2.6,
"step": 148
},
{
"loss": 0.1281,
"learning_rate": 0.0002,
"epoch": 2.61,
"step": 149
},
{
"loss": 0.001,
"learning_rate": 0.0002,
"epoch": 2.63,
"step": 150
},
{
"eval_comma_separated_input_loss": 0.8693166971206665,
"eval_comma_separated_input_score": -0.19275860488414764,
"eval_comma_separated_input_brier_score": 0.19275860488414764,
"eval_comma_separated_input_average_probability": 0.757495105266571,
"eval_comma_separated_input_accuracy": 0.76,
"eval_comma_separated_input_probabilities": [
0.13190123438835144,
0.9918695688247681,
0.9828689694404602,
0.9848847389221191,
0.7346028685569763,
0.003163250396028161,
0.999812662601471,
0.9998378753662109,
0.999977707862854,
0.9999912977218628,
0.9999881982803345,
0.9999995231628418,
0.681171715259552,
0.9439078569412231,
0.654923141002655,
0.9999362230300903,
0.9993796348571777,
0.9999890327453613,
0.9994239807128906,
0.9999834299087524,
0.6320100426673889,
0.551685094833374,
0.9921031594276428,
0.9178003668785095,
0.9997648596763611,
0.9996930360794067,
0.018658915534615517,
0.9999997615814209,
1.0,
0.9999947547912598,
0.9999914169311523,
0.9999997615814209,
0.9999982118606567,
1.0,
1.0,
1.0,
0.16114874184131622,
0.11440837383270264,
0.38666167855262756,
0.9899235367774963,
0.7749587893486023,
0.9868499040603638,
0.9999899864196777,
0.9999432563781738,
0.3350386321544647,
0.9999998807907104,
0.9999978542327881,
0.9999830722808838,
0.9999971389770508,
0.9891533255577087,
0.9995243549346924,
0.35080164670944214,
0.690878689289093,
8.349389099748805e-05,
1.0,
1.0,
1.0,
0.018209535628557205,
0.815947949886322,
0.06643610447645187,
1.0,
1.0,
1.0,
0.032206106930971146,
0.001175067969597876,
0.003918609581887722,
1.0,
1.0,
1.0,
0.9634184837341309,
0.16264604032039642,
0.13007192313671112,
0.9627270698547363,
0.011178754270076752,
0.3427962362766266,
1.0,
1.0,
1.0,
0.9999997615814209,
1.0,
0.9999998807907104,
0.0033358922228217125,
0.8806586265563965,
0.32572072744369507,
0.9999881982803345,
0.9842215776443481,
0.9999381303787231,
0.5839999318122864,
0.00014188152272254229,
0.9629126191139221,
0.29315897822380066,
0.2594333291053772,
0.18982450664043427,
0.9999868869781494,
0.9999876022338867,
1.0,
0.7872719764709473,
0.997302770614624,
0.9722517132759094,
0.9999998807907104
],
"eval_comma_separated_input_runtime": 60.8067,
"eval_comma_separated_input_samples_per_second": 1.645,
"eval_comma_separated_input_steps_per_second": 0.066,
"epoch": 2.63,
"step": 150
},
{
"loss": 0.0148,
"learning_rate": 0.0002,
"epoch": 2.65,
"step": 151
},
{
"loss": 0.0036,
"learning_rate": 0.0002,
"epoch": 2.67,
"step": 152
},
{
"loss": 0.0319,
"learning_rate": 0.0002,
"epoch": 2.68,
"step": 153
},
{
"loss": 0.0014,
"learning_rate": 0.0002,
"epoch": 2.7,
"step": 154
},
{
"loss": 0.2958,
"learning_rate": 0.0002,
"epoch": 2.72,
"step": 155
},
{
"loss": 0.005,
"learning_rate": 0.0002,
"epoch": 2.74,
"step": 156
},
{
"loss": 0.004,
"learning_rate": 0.0002,
"epoch": 2.75,
"step": 157
},
{
"loss": 0.0034,
"learning_rate": 0.0002,
"epoch": 2.77,
"step": 158
},
{
"loss": 0.0268,
"learning_rate": 0.0002,
"epoch": 2.79,
"step": 159
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 2.81,
"step": 160
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 2.82,
"step": 161
},
{
"loss": 0.0121,
"learning_rate": 0.0002,
"epoch": 2.84,
"step": 162
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 2.86,
"step": 163
},
{
"loss": 0.0017,
"learning_rate": 0.0002,
"epoch": 2.88,
"step": 164
},
{
"loss": 0.0019,
"learning_rate": 0.0002,
"epoch": 2.89,
"step": 165
},
{
"loss": 0.0025,
"learning_rate": 0.0002,
"epoch": 2.91,
"step": 166
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 2.93,
"step": 167
},
{
"loss": 0.0212,
"learning_rate": 0.0002,
"epoch": 2.95,
"step": 168
},
{
"loss": 0.0009,
"learning_rate": 0.0002,
"epoch": 2.96,
"step": 169
},
{
"loss": 0.0213,
"learning_rate": 0.0002,
"epoch": 2.98,
"step": 170
},
{
"loss": 0.0022,
"learning_rate": 0.0002,
"epoch": 3.0,
"step": 171
},
{
"loss": 0.0017,
"learning_rate": 0.0002,
"epoch": 3.02,
"step": 172
},
{
"loss": 0.001,
"learning_rate": 0.0002,
"epoch": 3.04,
"step": 173
},
{
"loss": 0.004,
"learning_rate": 0.0002,
"epoch": 3.05,
"step": 174
},
{
"loss": 0.0044,
"learning_rate": 0.0002,
"epoch": 3.07,
"step": 175
},
{
"eval_comma_separated_input_loss": 0.8060197234153748,
"eval_comma_separated_input_score": -0.1822451800107956,
"eval_comma_separated_input_brier_score": 0.1822451800107956,
"eval_comma_separated_input_average_probability": 0.7699721455574036,
"eval_comma_separated_input_accuracy": 0.78,
"eval_comma_separated_input_probabilities": [
0.17016573250293732,
0.997651994228363,
0.9846643805503845,
0.9527844786643982,
0.6087873578071594,
0.049850910902023315,
0.9972535967826843,
0.9988195300102234,
0.9995121955871582,
0.9999998807907104,
0.9999997615814209,
1.0,
0.8714950680732727,
0.7293234467506409,
0.8327075839042664,
0.9999344348907471,
0.9996497631072998,
0.999994158744812,
0.9998268485069275,
0.9999881982803345,
0.8997599482536316,
0.5459089875221252,
0.999037504196167,
0.9530684351921082,
0.9999831914901733,
0.9999550580978394,
0.6756637096405029,
0.9999977350234985,
0.9999998807907104,
0.9994704127311707,
0.9999986886978149,
0.9999997615814209,
0.9999988079071045,
1.0,
1.0,
1.0,
0.405244380235672,
0.14750726521015167,
0.3550819754600525,
0.9999498128890991,
0.8734256625175476,
0.9983735084533691,
0.9999432563781738,
0.9983869791030884,
0.07085894793272018,
1.0,
1.0,
0.9999973773956299,
1.0,
0.9918185472488403,
0.9993517994880676,
0.022607209160923958,
0.8718477487564087,
0.00019601006351877004,
1.0,
1.0,
1.0,
0.045121096074581146,
0.7114633917808533,
0.19008778035640717,
1.0,
1.0,
1.0,
0.017528729513287544,
0.003795832861214876,
0.005920866504311562,
1.0,
1.0,
1.0,
0.9790542125701904,
0.011330204084515572,
0.023379497230052948,
0.4797717332839966,
0.0017255247803404927,
0.15586982667446136,
1.0,
0.9999998807907104,
1.0,
0.9999995231628418,
1.0,
1.0,
0.14338074624538422,
0.9458649754524231,
0.5068089365959167,
0.9999911785125732,
0.9953752756118774,
0.9999755620956421,
0.783764660358429,
6.794904766138643e-05,
0.971418559551239,
0.6962472200393677,
0.44212785363197327,
0.17592112720012665,
0.9999672174453735,
0.9995967745780945,
1.0,
0.7349942326545715,
0.9991052746772766,
0.9777160286903381,
0.9999994039535522
],
"eval_comma_separated_input_runtime": 60.8107,
"eval_comma_separated_input_samples_per_second": 1.644,
"eval_comma_separated_input_steps_per_second": 0.066,
"epoch": 3.07,
"step": 175
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 3.09,
"step": 176
},
{
"loss": 0.0008,
"learning_rate": 0.0002,
"epoch": 3.11,
"step": 177
},
{
"loss": 0.0012,
"learning_rate": 0.0002,
"epoch": 3.12,
"step": 178
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 3.14,
"step": 179
},
{
"loss": 0.0046,
"learning_rate": 0.0002,
"epoch": 3.16,
"step": 180
},
{
"loss": 0.0009,
"learning_rate": 0.0002,
"epoch": 3.18,
"step": 181
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 3.19,
"step": 182
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 3.21,
"step": 183
},
{
"loss": 0.2814,
"learning_rate": 0.0002,
"epoch": 3.23,
"step": 184
},
{
"loss": 0.0028,
"learning_rate": 0.0002,
"epoch": 3.25,
"step": 185
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 3.26,
"step": 186
},
{
"loss": 0.0116,
"learning_rate": 0.0002,
"epoch": 3.28,
"step": 187
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 3.3,
"step": 188
},
{
"loss": 0.0009,
"learning_rate": 0.0002,
"epoch": 3.32,
"step": 189
},
{
"loss": 0.0004,
"learning_rate": 0.0002,
"epoch": 3.33,
"step": 190
},
{
"loss": 0.0011,
"learning_rate": 0.0002,
"epoch": 3.35,
"step": 191
},
{
"loss": 0.0014,
"learning_rate": 0.0002,
"epoch": 3.37,
"step": 192
},
{
"loss": 0.0012,
"learning_rate": 0.0002,
"epoch": 3.39,
"step": 193
},
{
"loss": 0.0011,
"learning_rate": 0.0002,
"epoch": 3.4,
"step": 194
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 3.42,
"step": 195
},
{
"loss": 0.0013,
"learning_rate": 0.0002,
"epoch": 3.44,
"step": 196
},
{
"loss": 0.002,
"learning_rate": 0.0002,
"epoch": 3.46,
"step": 197
},
{
"loss": 0.0032,
"learning_rate": 0.0002,
"epoch": 3.47,
"step": 198
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 3.49,
"step": 199
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 3.51,
"step": 200
},
{
"eval_comma_separated_input_loss": 0.8059910535812378,
"eval_comma_separated_input_score": -0.20177654922008514,
"eval_comma_separated_input_brier_score": 0.20177654922008514,
"eval_comma_separated_input_average_probability": 0.7506393194198608,
"eval_comma_separated_input_accuracy": 0.74,
"eval_comma_separated_input_probabilities": [
0.06566958874464035,
0.9585626721382141,
0.9394274353981018,
0.8206621408462524,
0.12451951205730438,
0.040482982993125916,
0.9904934763908386,
0.9912689924240112,
0.9971289038658142,
0.9999997615814209,
0.9999979734420776,
1.0,
0.9467275142669678,
0.9138575196266174,
0.8370740413665771,
0.999994158744812,
0.9998130202293396,
0.9999973773956299,
0.9990767240524292,
0.9999643564224243,
0.6109173893928528,
0.4885546863079071,
0.9974848031997681,
0.9322636127471924,
0.9842928051948547,
0.9836403727531433,
0.2748430073261261,
0.9999836683273315,
0.9999990463256836,
0.9978179931640625,
0.9999943971633911,
0.9999996423721313,
0.9999982118606567,
1.0,
1.0,
1.0,
0.16236703097820282,
0.1479361355304718,
0.43488311767578125,
0.9998273849487305,
0.4517606198787689,
0.9986383318901062,
0.9998272061347961,
0.9975333213806152,
0.03569738566875458,
1.0,
0.9999977350234985,
0.999956488609314,
1.0,
0.9964632391929626,
0.9999812841415405,
0.05186959356069565,
0.51998370885849,
0.00010708211630117148,
1.0,
1.0,
1.0,
0.025064213201403618,
0.6244286298751831,
0.08103948831558228,
1.0,
1.0,
1.0,
0.021069664508104324,
0.0017033411422744393,
0.00984130334109068,
0.9999998807907104,
1.0,
0.9999998807907104,
0.9361790418624878,
0.0564756765961647,
0.06753901392221451,
0.7943969964981079,
0.014756478369235992,
0.346853643655777,
1.0,
1.0,
1.0,
0.9999464750289917,
0.9999768733978271,
0.9999878406524658,
0.03871014341711998,
0.9028144478797913,
0.3946305811405182,
0.9999914169311523,
0.9812803864479065,
0.9999563694000244,
0.9456529021263123,
0.00591609813272953,
0.9831116795539856,
0.7037330269813538,
0.4673255980014801,
0.1429651826620102,
0.9999947547912598,
0.9999731779098511,
1.0,
0.9651234745979309,
0.9989381432533264,
0.8632209897041321,
0.9999992847442627
],
"eval_comma_separated_input_runtime": 60.8443,
"eval_comma_separated_input_samples_per_second": 1.644,
"eval_comma_separated_input_steps_per_second": 0.066,
"epoch": 3.51,
"step": 200
},
{
"loss": 0.0009,
"learning_rate": 0.0002,
"epoch": 3.53,
"step": 201
},
{
"loss": 0.0023,
"learning_rate": 0.0002,
"epoch": 3.54,
"step": 202
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 3.56,
"step": 203
},
{
"loss": 0.0038,
"learning_rate": 0.0002,
"epoch": 3.58,
"step": 204
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 3.6,
"step": 205
},
{
"loss": 0.0043,
"learning_rate": 0.0002,
"epoch": 3.61,
"step": 206
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 3.63,
"step": 207
},
{
"loss": 0.0011,
"learning_rate": 0.0002,
"epoch": 3.65,
"step": 208
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 3.67,
"step": 209
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 3.68,
"step": 210
},
{
"loss": 0.002,
"learning_rate": 0.0002,
"epoch": 3.7,
"step": 211
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 3.72,
"step": 212
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 3.74,
"step": 213
},
{
"loss": 0.0025,
"learning_rate": 0.0002,
"epoch": 3.75,
"step": 214
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 3.77,
"step": 215
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.79,
"step": 216
},
{
"loss": 0.0009,
"learning_rate": 0.0002,
"epoch": 3.81,
"step": 217
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 3.82,
"step": 218
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 3.84,
"step": 219
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 3.86,
"step": 220
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 3.88,
"step": 221
},
{
"loss": 0.0176,
"learning_rate": 0.0002,
"epoch": 3.89,
"step": 222
},
{
"loss": 0.0004,
"learning_rate": 0.0002,
"epoch": 3.91,
"step": 223
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 3.93,
"step": 224
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 3.95,
"step": 225
},
{
"eval_comma_separated_input_loss": 0.8140801787376404,
"eval_comma_separated_input_score": -0.19773535430431366,
"eval_comma_separated_input_brier_score": 0.19773535430431366,
"eval_comma_separated_input_average_probability": 0.7513535022735596,
"eval_comma_separated_input_accuracy": 0.76,
"eval_comma_separated_input_probabilities": [
0.22258329391479492,
0.8945773243904114,
0.8501845598220825,
0.8527124524116516,
0.03487842530012131,
0.01711283065378666,
0.9863246083259583,
0.9590144753456116,
0.9920028448104858,
0.9999997615814209,
0.9999995231628418,
1.0,
0.9526478052139282,
0.9809058904647827,
0.8694186210632324,
0.9999806880950928,
0.9974191188812256,
0.999987006187439,
0.999245285987854,
0.9999618530273438,
0.6627137660980225,
0.4775846302509308,
0.996702253818512,
0.9411417245864868,
0.9944807291030884,
0.994421660900116,
0.5666745901107788,
0.9999892711639404,
1.0,
0.999574601650238,
0.9999991655349731,
1.0,
0.9999994039535522,
1.0,
1.0,
1.0,
0.10747275501489639,
0.16027887165546417,
0.2641609013080597,
0.9999372959136963,
0.13817612826824188,
0.9935786724090576,
0.9999450445175171,
0.9994520545005798,
0.028673408553004265,
0.9999998807907104,
0.999971866607666,
0.999848484992981,
1.0,
0.9994340538978577,
0.9999979734420776,
0.24372412264347076,
0.5508822798728943,
1.4898204426572192e-05,
1.0,
1.0,
1.0,
0.03361180052161217,
0.6426296234130859,
0.03325112536549568,
1.0,
1.0,
1.0,
0.04148618504405022,
0.0027587187942117453,
0.053798858076334,
0.9999998807907104,
1.0,
0.9999998807907104,
0.8596720099449158,
0.21878379583358765,
0.042546361684799194,
0.9275063872337341,
0.013146678917109966,
0.48001381754875183,
1.0,
1.0,
1.0,
0.9988648891448975,
0.9997988343238831,
0.9998394250869751,
0.11482413113117218,
0.8641303181648254,
0.39572393894195557,
0.9999958276748657,
0.9666105508804321,
0.9998986721038818,
0.6588249206542969,
0.001494898577220738,
0.9814879894256592,
0.6038728356361389,
0.531840443611145,
0.0851021260023117,
0.9999924898147583,
0.9999542236328125,
1.0,
0.9888311624526978,
0.9993833303451538,
0.8678873181343079,
1.0
],
"eval_comma_separated_input_runtime": 60.844,
"eval_comma_separated_input_samples_per_second": 1.644,
"eval_comma_separated_input_steps_per_second": 0.066,
"epoch": 3.95,
"step": 225
},
{
"loss": 0.0013,
"learning_rate": 0.0002,
"epoch": 3.96,
"step": 226
},
{
"loss": 0.0007,
"learning_rate": 0.0002,
"epoch": 3.98,
"step": 227
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 4.0,
"step": 228
},
{
"loss": 0.001,
"learning_rate": 0.0002,
"epoch": 4.02,
"step": 229
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 4.04,
"step": 230
},
{
"loss": 0.0006,
"learning_rate": 0.0002,
"epoch": 4.05,
"step": 231
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 4.07,
"step": 232
},
{
"loss": 0.0011,
"learning_rate": 0.0002,
"epoch": 4.09,
"step": 233
},
{
"loss": 0.0004,
"learning_rate": 0.0002,
"epoch": 4.11,
"step": 234
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 4.12,
"step": 235
},
{
"loss": 0.0011,
"learning_rate": 0.0002,
"epoch": 4.14,
"step": 236
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 4.16,
"step": 237
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 4.18,
"step": 238
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 4.19,
"step": 239
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 4.21,
"step": 240
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 4.23,
"step": 241
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 4.25,
"step": 242
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 4.26,
"step": 243
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 4.28,
"step": 244
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 4.3,
"step": 245
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 4.32,
"step": 246
},
{
"loss": 0.0014,
"learning_rate": 0.0002,
"epoch": 4.33,
"step": 247
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 4.35,
"step": 248
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 4.37,
"step": 249
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 4.39,
"step": 250
},
{
"eval_comma_separated_input_loss": 0.9106535911560059,
"eval_comma_separated_input_score": -0.1935185194015503,
"eval_comma_separated_input_brier_score": 0.1935185194015503,
"eval_comma_separated_input_average_probability": 0.7665128111839294,
"eval_comma_separated_input_accuracy": 0.77,
"eval_comma_separated_input_probabilities": [
0.2728930115699768,
0.9469594359397888,
0.8848450183868408,
0.8785555362701416,
0.029993413016200066,
0.007177337538450956,
0.9855479598045349,
0.9428337812423706,
0.993122398853302,
1.0,
1.0,
1.0,
0.9487782716751099,
0.9103474617004395,
0.864179790019989,
0.9999915361404419,
0.9981993436813354,
0.9999955892562866,
0.9999821186065674,
0.9999998807907104,
0.8975170254707336,
0.7700925469398499,
0.9997153878211975,
0.9832716584205627,
0.9999701976776123,
0.9999456405639648,
0.9836558103561401,
0.9999995231628418,
1.0,
0.9999876022338867,
0.9999973773956299,
0.9999998807907104,
0.9999988079071045,
1.0,
1.0,
1.0,
0.1258680671453476,
0.10203563421964645,
0.2846693992614746,
0.9999909400939941,
0.009883570484817028,
0.9930781722068787,
0.9999970197677612,
0.9974396228790283,
0.03485842049121857,
1.0,
1.0,
0.9999988079071045,
1.0,
0.99978107213974,
0.9999992847442627,
0.1023230031132698,
0.5425301194190979,
3.283157070654852e-07,
1.0,
1.0,
1.0,
0.05294087529182434,
0.6476093530654907,
0.07671771198511124,
1.0,
1.0,
1.0,
0.022929130122065544,
0.005274801980704069,
0.023588120937347412,
1.0,
1.0,
1.0,
0.952028751373291,
0.036792971193790436,
0.03128356859087944,
0.8878331184387207,
0.003912873566150665,
0.2811466157436371,
1.0,
1.0,
1.0,
0.9998561143875122,
0.9999986886978149,
0.9999990463256836,
0.48471319675445557,
0.9485659599304199,
0.4733659625053406,
0.9999998807907104,
0.9934183359146118,
0.9999899864196777,
0.8549415469169617,
0.00029748474480584264,
0.9937552213668823,
0.7311030030250549,
0.8455090522766113,
0.04774446040391922,
0.9999973773956299,
0.9999880790710449,
1.0,
0.9333745837211609,
0.9922415018081665,
0.8403644561767578,
1.0
],
"eval_comma_separated_input_runtime": 60.8337,
"eval_comma_separated_input_samples_per_second": 1.644,
"eval_comma_separated_input_steps_per_second": 0.066,
"epoch": 4.39,
"step": 250
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 4.4,
"step": 251
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 4.42,
"step": 252
},
{
"loss": 0.0004,
"learning_rate": 0.0002,
"epoch": 4.44,
"step": 253
},
{
"loss": 0.1126,
"learning_rate": 0.0002,
"epoch": 4.46,
"step": 254
},
{
"loss": 0.0542,
"learning_rate": 0.0002,
"epoch": 4.47,
"step": 255
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 4.49,
"step": 256
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 4.51,
"step": 257
},
{
"loss": 0.0013,
"learning_rate": 0.0002,
"epoch": 4.53,
"step": 258
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 4.54,
"step": 259
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 4.56,
"step": 260
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 4.58,
"step": 261
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 4.6,
"step": 262
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 4.61,
"step": 263
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 4.63,
"step": 264
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 4.65,
"step": 265
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 4.67,
"step": 266
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 4.68,
"step": 267
},
{
"loss": 0.0009,
"learning_rate": 0.0002,
"epoch": 4.7,
"step": 268
},
{
"loss": 0.1635,
"learning_rate": 0.0002,
"epoch": 4.72,
"step": 269
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 4.74,
"step": 270
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 4.75,
"step": 271
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 4.77,
"step": 272
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 4.79,
"step": 273
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 4.81,
"step": 274
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 4.82,
"step": 275
},
{
"eval_comma_separated_input_loss": 0.8824217319488525,
"eval_comma_separated_input_score": -0.1915234625339508,
"eval_comma_separated_input_brier_score": 0.1915234625339508,
"eval_comma_separated_input_average_probability": 0.7647359371185303,
"eval_comma_separated_input_accuracy": 0.78,
"eval_comma_separated_input_probabilities": [
0.17700964212417603,
0.9443680644035339,
0.8949386477470398,
0.8994792103767395,
0.09919517487287521,
0.02042502351105213,
0.9990639090538025,
0.9949172735214233,
0.9998217225074768,
1.0,
0.9999998807907104,
1.0,
0.9620996117591858,
0.7182826399803162,
0.8756901621818542,
0.9999833106994629,
0.9989676475524902,
0.9999984502792358,
0.9997939467430115,
0.9999970197677612,
0.7869197726249695,
0.8293550610542297,
0.9994563460350037,
0.9630100131034851,
0.9998747110366821,
0.9997860789299011,
0.8105039596557617,
0.9999991655349731,
1.0,
0.9999337196350098,
0.9999945163726807,
0.9999994039535522,
0.9999970197677612,
1.0,
1.0,
1.0,
0.24032439291477203,
0.09160152822732925,
0.43234387040138245,
0.9999988079071045,
0.555743932723999,
0.9985541701316833,
0.9999995231628418,
0.9993353486061096,
0.030032478272914886,
1.0,
1.0,
0.9999998807907104,
1.0,
0.9980515241622925,
0.9998434782028198,
0.11535391211509705,
0.9261205196380615,
9.263377432944253e-05,
1.0,
1.0,
1.0,
0.005190456286072731,
0.875157356262207,
0.008245637640357018,
1.0,
1.0,
1.0,
0.009847317822277546,
0.0009901360608637333,
0.0015817125095054507,
1.0,
1.0,
1.0,
0.9482873678207397,
0.07986213266849518,
0.029558109119534492,
0.7666759490966797,
0.01563183218240738,
0.06916328519582748,
1.0,
1.0,
1.0,
0.9999926090240479,
1.0,
1.0,
0.25362130999565125,
0.8666785955429077,
0.41505590081214905,
0.9999986886978149,
0.9921476244926453,
0.9999239444732666,
0.8314580917358398,
0.00014172305236570537,
0.9725655913352966,
0.5495027303695679,
0.5102577209472656,
0.13406023383140564,
0.9999912977218628,
0.9999866485595703,
1.0,
0.8086404800415039,
0.9980117082595825,
0.9711244702339172,
1.0
],
"eval_comma_separated_input_runtime": 60.7951,
"eval_comma_separated_input_samples_per_second": 1.645,
"eval_comma_separated_input_steps_per_second": 0.066,
"epoch": 4.82,
"step": 275
},
{
"loss": 0.0009,
"learning_rate": 0.0002,
"epoch": 4.84,
"step": 276
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 4.86,
"step": 277
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 4.88,
"step": 278
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 4.89,
"step": 279
},
{
"loss": 0.001,
"learning_rate": 0.0002,
"epoch": 4.91,
"step": 280
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 4.93,
"step": 281
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 4.95,
"step": 282
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 4.96,
"step": 283
},
{
"loss": 0.0118,
"learning_rate": 0.0002,
"epoch": 4.98,
"step": 284
},
{
"loss": 0.0006,
"learning_rate": 0.0002,
"epoch": 5.0,
"step": 285
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 5.02,
"step": 286
},
{
"loss": 0.0004,
"learning_rate": 0.0002,
"epoch": 5.04,
"step": 287
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 5.05,
"step": 288
},
{
"loss": 0.0002,
"learning_rate": 0.0002,
"epoch": 5.07,
"step": 289
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 5.09,
"step": 290
},
{
"loss": 0.0003,
"learning_rate": 0.0002,
"epoch": 5.11,
"step": 291
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 5.12,
"step": 292
},
{
"loss": 0.0005,
"learning_rate": 0.0002,
"epoch": 5.14,
"step": 293
},
{
"loss": 0.0185,
"learning_rate": 0.0002,
"epoch": 5.16,
"step": 294
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 5.18,
"step": 295
},
{
"loss": 0.0025,
"learning_rate": 0.0002,
"epoch": 5.19,
"step": 296
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 5.21,
"step": 297
},
{
"loss": 0.0001,
"learning_rate": 0.0002,
"epoch": 5.23,
"step": 298
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 5.25,
"step": 299
},
{
"loss": 0.0,
"learning_rate": 0.0002,
"epoch": 5.26,
"step": 300
},
{
"eval_comma_separated_input_loss": 0.9788962006568909,
"eval_comma_separated_input_score": -0.1985594928264618,
"eval_comma_separated_input_brier_score": 0.1985594928264618,
"eval_comma_separated_input_average_probability": 0.7571226358413696,
"eval_comma_separated_input_accuracy": 0.74,
"eval_comma_separated_input_probabilities": [
0.11606291681528091,
0.9386220574378967,
0.9379924535751343,
0.9480657577514648,
0.04834440350532532,
0.0034359267447143793,
0.9999555349349976,
0.9991539716720581,
0.9999765157699585,
1.0,
1.0,
1.0,
0.1777171939611435,
0.9681243896484375,
0.48616573214530945,
0.9998947381973267,
0.9996563196182251,
0.9999998807907104,
0.9999697208404541,
0.9999966621398926,
0.4451545476913452,
0.9019927382469177,
0.9998874664306641,
0.9697437286376953,
0.9999775886535645,
0.999945878982544,
0.9111950397491455,
0.9999935626983643,
1.0,
0.9999667406082153,
0.9999997615814209,
1.0,
0.9999997615814209,
1.0,
1.0,
1.0,
0.18022431433200836,
0.145154669880867,
0.22917520999908447,
0.9999998807907104,
0.055321019142866135,
0.9997361302375793,
0.9999943971633911,
0.999987006187439,
0.08495688438415527,
1.0,
1.0,
0.9999969005584717,
1.0,
0.9998794794082642,
0.9999998807907104,
0.4748004376888275,
0.8358895182609558,
7.689167205171543e-07,
1.0,
1.0,
1.0,
0.07946918904781342,
0.5861244797706604,
0.1789407581090927,
1.0,
1.0,
1.0,
0.010717565193772316,
0.0002632127143442631,
0.002087321598082781,
1.0,
1.0,
1.0,
0.959753155708313,
0.16682252287864685,
0.02568635530769825,
0.9226422309875488,
0.012998680584132671,
0.449643075466156,
1.0,
1.0,
1.0,
0.9999961853027344,
0.9999998807907104,
0.9999997615814209,
0.0019698706455528736,
0.898077130317688,
0.5507052540779114,
0.9999996423721313,
0.9896161556243896,
0.9999481439590454,
0.4249381422996521,
3.702771573443897e-05,
0.9964827299118042,
0.6545241475105286,
0.6706126928329468,
0.2881947159767151,
0.999995231628418,
0.9999750852584839,
1.0,
0.9933151602745056,
0.9998393058776855,
0.9927732348442078,
1.0
],
"eval_comma_separated_input_runtime": 60.8274,
"eval_comma_separated_input_samples_per_second": 1.644,
"eval_comma_separated_input_steps_per_second": 0.066,
"epoch": 5.26,
"step": 300
},
{
"train_runtime": 10652.3457,
"train_samples_per_second": 0.901,
"train_steps_per_second": 0.028,
"total_flos": 0.0,
"train_loss": 0.03411568186510522,
"epoch": 5.26,
"step": 300
}
]