penfever's picture
End of training
7d4ce6b verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4585,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.007639419404125287,
"grad_norm": 8.56353259226621,
"learning_rate": 3.4858387799564276e-07,
"loss": 0.9853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.485528826713562,
"step": 5,
"valid_targets_mean": 3401.8,
"valid_targets_min": 1382
},
{
"epoch": 0.015278838808250574,
"grad_norm": 8.131404212301335,
"learning_rate": 7.843137254901962e-07,
"loss": 1.0071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47187474370002747,
"step": 10,
"valid_targets_mean": 2919.4,
"valid_targets_min": 1116
},
{
"epoch": 0.02291825821237586,
"grad_norm": 7.290663279109773,
"learning_rate": 1.2200435729847495e-06,
"loss": 1.0029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3917523920536041,
"step": 15,
"valid_targets_mean": 2336.1,
"valid_targets_min": 884
},
{
"epoch": 0.030557677616501147,
"grad_norm": 6.253781799061595,
"learning_rate": 1.655773420479303e-06,
"loss": 0.959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6743544936180115,
"step": 20,
"valid_targets_mean": 3415.9,
"valid_targets_min": 703
},
{
"epoch": 0.03819709702062643,
"grad_norm": 4.392892259108477,
"learning_rate": 2.0915032679738565e-06,
"loss": 0.9939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3614335358142853,
"step": 25,
"valid_targets_mean": 2495.8,
"valid_targets_min": 735
},
{
"epoch": 0.04583651642475172,
"grad_norm": 3.431018980960601,
"learning_rate": 2.5272331154684097e-06,
"loss": 0.922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5053595304489136,
"step": 30,
"valid_targets_mean": 4036.6,
"valid_targets_min": 1478
},
{
"epoch": 0.053475935828877004,
"grad_norm": 3.153409826158592,
"learning_rate": 2.962962962962963e-06,
"loss": 0.9547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3868003785610199,
"step": 35,
"valid_targets_mean": 2478.8,
"valid_targets_min": 1093
},
{
"epoch": 0.061115355233002294,
"grad_norm": 2.0831272022034146,
"learning_rate": 3.398692810457517e-06,
"loss": 0.8596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4014698266983032,
"step": 40,
"valid_targets_mean": 4233.2,
"valid_targets_min": 990
},
{
"epoch": 0.06875477463712758,
"grad_norm": 1.6667591827402235,
"learning_rate": 3.83442265795207e-06,
"loss": 0.8571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4750503897666931,
"step": 45,
"valid_targets_mean": 3809.9,
"valid_targets_min": 953
},
{
"epoch": 0.07639419404125286,
"grad_norm": 1.3493811705230785,
"learning_rate": 4.270152505446624e-06,
"loss": 0.8804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3598395884037018,
"step": 50,
"valid_targets_mean": 2505.9,
"valid_targets_min": 919
},
{
"epoch": 0.08403361344537816,
"grad_norm": 1.5469719000738422,
"learning_rate": 4.705882352941177e-06,
"loss": 0.8181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3857227563858032,
"step": 55,
"valid_targets_mean": 2302.5,
"valid_targets_min": 487
},
{
"epoch": 0.09167303284950344,
"grad_norm": 1.2108296473201847,
"learning_rate": 5.14161220043573e-06,
"loss": 0.8229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6197760105133057,
"step": 60,
"valid_targets_mean": 3091.4,
"valid_targets_min": 868
},
{
"epoch": 0.09931245225362872,
"grad_norm": 0.9602992602617543,
"learning_rate": 5.577342047930284e-06,
"loss": 0.7262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3339218497276306,
"step": 65,
"valid_targets_mean": 3060.6,
"valid_targets_min": 778
},
{
"epoch": 0.10695187165775401,
"grad_norm": 0.987631773029606,
"learning_rate": 6.0130718954248365e-06,
"loss": 0.8129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4006999731063843,
"step": 70,
"valid_targets_mean": 3960.8,
"valid_targets_min": 455
},
{
"epoch": 0.11459129106187929,
"grad_norm": 0.9293072024847869,
"learning_rate": 6.4488017429193905e-06,
"loss": 0.7625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.42446625232696533,
"step": 75,
"valid_targets_mean": 3102.1,
"valid_targets_min": 1431
},
{
"epoch": 0.12223071046600459,
"grad_norm": 0.8519810844732746,
"learning_rate": 6.8845315904139445e-06,
"loss": 0.7621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34469449520111084,
"step": 80,
"valid_targets_mean": 3108.2,
"valid_targets_min": 1559
},
{
"epoch": 0.12987012987012986,
"grad_norm": 0.7340258302490502,
"learning_rate": 7.320261437908497e-06,
"loss": 0.7235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3129647672176361,
"step": 85,
"valid_targets_mean": 3680.9,
"valid_targets_min": 2358
},
{
"epoch": 0.13750954927425516,
"grad_norm": 0.7217579014723088,
"learning_rate": 7.755991285403051e-06,
"loss": 0.7184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22861731052398682,
"step": 90,
"valid_targets_mean": 2556.1,
"valid_targets_min": 1149
},
{
"epoch": 0.14514896867838045,
"grad_norm": 0.7843685287405917,
"learning_rate": 8.191721132897605e-06,
"loss": 0.714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2588593661785126,
"step": 95,
"valid_targets_mean": 2526.9,
"valid_targets_min": 1296
},
{
"epoch": 0.15278838808250572,
"grad_norm": 0.835309959958566,
"learning_rate": 8.627450980392157e-06,
"loss": 0.7336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29795417189598083,
"step": 100,
"valid_targets_mean": 2311.1,
"valid_targets_min": 962
},
{
"epoch": 0.16042780748663102,
"grad_norm": 0.8939656344358561,
"learning_rate": 9.063180827886711e-06,
"loss": 0.6585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.355358362197876,
"step": 105,
"valid_targets_mean": 2767.4,
"valid_targets_min": 1885
},
{
"epoch": 0.16806722689075632,
"grad_norm": 0.7765567561351433,
"learning_rate": 9.498910675381264e-06,
"loss": 0.7021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3594488501548767,
"step": 110,
"valid_targets_mean": 3382.8,
"valid_targets_min": 812
},
{
"epoch": 0.17570664629488159,
"grad_norm": 0.699526469363576,
"learning_rate": 9.934640522875818e-06,
"loss": 0.6992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4037782847881317,
"step": 115,
"valid_targets_mean": 4486.2,
"valid_targets_min": 746
},
{
"epoch": 0.18334606569900688,
"grad_norm": 0.8794463842026947,
"learning_rate": 1.037037037037037e-05,
"loss": 0.7356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3373746871948242,
"step": 120,
"valid_targets_mean": 2458.4,
"valid_targets_min": 946
},
{
"epoch": 0.19098548510313215,
"grad_norm": 0.676206262993347,
"learning_rate": 1.0806100217864926e-05,
"loss": 0.6595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30680835247039795,
"step": 125,
"valid_targets_mean": 3827.6,
"valid_targets_min": 987
},
{
"epoch": 0.19862490450725745,
"grad_norm": 0.7688052056049358,
"learning_rate": 1.1241830065359478e-05,
"loss": 0.698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26999378204345703,
"step": 130,
"valid_targets_mean": 2575.5,
"valid_targets_min": 1042
},
{
"epoch": 0.20626432391138275,
"grad_norm": 0.7755987352317165,
"learning_rate": 1.167755991285403e-05,
"loss": 0.6742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.330909788608551,
"step": 135,
"valid_targets_mean": 3124.4,
"valid_targets_min": 902
},
{
"epoch": 0.21390374331550802,
"grad_norm": 0.7903556123351976,
"learning_rate": 1.2113289760348586e-05,
"loss": 0.6659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38125163316726685,
"step": 140,
"valid_targets_mean": 3087.4,
"valid_targets_min": 759
},
{
"epoch": 0.2215431627196333,
"grad_norm": 0.7589506946645384,
"learning_rate": 1.2549019607843138e-05,
"loss": 0.6921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36488616466522217,
"step": 145,
"valid_targets_mean": 4247.0,
"valid_targets_min": 1868
},
{
"epoch": 0.22918258212375858,
"grad_norm": 0.6894437269697314,
"learning_rate": 1.298474945533769e-05,
"loss": 0.6682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2953642010688782,
"step": 150,
"valid_targets_mean": 3034.4,
"valid_targets_min": 1694
},
{
"epoch": 0.23682200152788388,
"grad_norm": 0.9478585705238028,
"learning_rate": 1.3420479302832245e-05,
"loss": 0.6625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3361087143421173,
"step": 155,
"valid_targets_mean": 1931.2,
"valid_targets_min": 1081
},
{
"epoch": 0.24446142093200918,
"grad_norm": 0.6983921245328072,
"learning_rate": 1.3856209150326799e-05,
"loss": 0.6769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39449670910835266,
"step": 160,
"valid_targets_mean": 4291.1,
"valid_targets_min": 976
},
{
"epoch": 0.25210084033613445,
"grad_norm": 0.7642774492217729,
"learning_rate": 1.4291938997821353e-05,
"loss": 0.6664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3134499788284302,
"step": 165,
"valid_targets_mean": 2839.6,
"valid_targets_min": 1146
},
{
"epoch": 0.2597402597402597,
"grad_norm": 0.7000875293679036,
"learning_rate": 1.4727668845315905e-05,
"loss": 0.635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41188955307006836,
"step": 170,
"valid_targets_mean": 3929.6,
"valid_targets_min": 1889
},
{
"epoch": 0.26737967914438504,
"grad_norm": 0.860459609848493,
"learning_rate": 1.5163398692810458e-05,
"loss": 0.6856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4588810205459595,
"step": 175,
"valid_targets_mean": 3703.8,
"valid_targets_min": 1237
},
{
"epoch": 0.2750190985485103,
"grad_norm": 1.9304398390219022,
"learning_rate": 1.559912854030501e-05,
"loss": 0.6345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32375526428222656,
"step": 180,
"valid_targets_mean": 3939.1,
"valid_targets_min": 783
},
{
"epoch": 0.2826585179526356,
"grad_norm": 0.8170199929994688,
"learning_rate": 1.6034858387799567e-05,
"loss": 0.6095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33352822065353394,
"step": 185,
"valid_targets_mean": 3359.6,
"valid_targets_min": 773
},
{
"epoch": 0.2902979373567609,
"grad_norm": 0.6978579891276123,
"learning_rate": 1.647058823529412e-05,
"loss": 0.6729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40702342987060547,
"step": 190,
"valid_targets_mean": 3593.4,
"valid_targets_min": 957
},
{
"epoch": 0.2979373567608862,
"grad_norm": 1.0173308675163864,
"learning_rate": 1.6906318082788672e-05,
"loss": 0.6387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4305134415626526,
"step": 195,
"valid_targets_mean": 2495.9,
"valid_targets_min": 808
},
{
"epoch": 0.30557677616501144,
"grad_norm": 0.6720245226873705,
"learning_rate": 1.7342047930283224e-05,
"loss": 0.631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26800355315208435,
"step": 200,
"valid_targets_mean": 2775.8,
"valid_targets_min": 842
},
{
"epoch": 0.31321619556913677,
"grad_norm": 0.7925807789036575,
"learning_rate": 1.7777777777777777e-05,
"loss": 0.6251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26368221640586853,
"step": 205,
"valid_targets_mean": 3823.2,
"valid_targets_min": 1121
},
{
"epoch": 0.32085561497326204,
"grad_norm": 0.8482490987351864,
"learning_rate": 1.8213507625272332e-05,
"loss": 0.6464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3924250304698944,
"step": 210,
"valid_targets_mean": 3340.0,
"valid_targets_min": 1014
},
{
"epoch": 0.3284950343773873,
"grad_norm": 0.7587944111803762,
"learning_rate": 1.8649237472766885e-05,
"loss": 0.6271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2620357275009155,
"step": 215,
"valid_targets_mean": 2859.0,
"valid_targets_min": 642
},
{
"epoch": 0.33613445378151263,
"grad_norm": 0.7364341217962659,
"learning_rate": 1.908496732026144e-05,
"loss": 0.6122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3173060417175293,
"step": 220,
"valid_targets_mean": 3238.9,
"valid_targets_min": 1378
},
{
"epoch": 0.3437738731856379,
"grad_norm": 0.6987727914802906,
"learning_rate": 1.9520697167755993e-05,
"loss": 0.6125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30513855814933777,
"step": 225,
"valid_targets_mean": 3986.5,
"valid_targets_min": 1460
},
{
"epoch": 0.35141329258976317,
"grad_norm": 0.7226588989043562,
"learning_rate": 1.9956427015250545e-05,
"loss": 0.6279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33299773931503296,
"step": 230,
"valid_targets_mean": 3696.0,
"valid_targets_min": 1234
},
{
"epoch": 0.35905271199388844,
"grad_norm": 0.8158650358729972,
"learning_rate": 2.0392156862745097e-05,
"loss": 0.6654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32044363021850586,
"step": 235,
"valid_targets_mean": 3097.4,
"valid_targets_min": 943
},
{
"epoch": 0.36669213139801377,
"grad_norm": 0.7088614261293413,
"learning_rate": 2.0827886710239653e-05,
"loss": 0.6017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2543582618236542,
"step": 240,
"valid_targets_mean": 2256.9,
"valid_targets_min": 1559
},
{
"epoch": 0.37433155080213903,
"grad_norm": 0.6151357812054147,
"learning_rate": 2.126361655773421e-05,
"loss": 0.6515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1985795795917511,
"step": 245,
"valid_targets_mean": 3318.6,
"valid_targets_min": 1227
},
{
"epoch": 0.3819709702062643,
"grad_norm": 0.7937566667562097,
"learning_rate": 2.1699346405228758e-05,
"loss": 0.6187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3406463861465454,
"step": 250,
"valid_targets_mean": 3448.1,
"valid_targets_min": 2067
},
{
"epoch": 0.38961038961038963,
"grad_norm": 0.6298445900787324,
"learning_rate": 2.2135076252723313e-05,
"loss": 0.5786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29489225149154663,
"step": 255,
"valid_targets_mean": 3681.2,
"valid_targets_min": 1220
},
{
"epoch": 0.3972498090145149,
"grad_norm": 0.8201725710279596,
"learning_rate": 2.257080610021787e-05,
"loss": 0.6133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3263534903526306,
"step": 260,
"valid_targets_mean": 3468.8,
"valid_targets_min": 466
},
{
"epoch": 0.40488922841864017,
"grad_norm": 0.7501412935238757,
"learning_rate": 2.3006535947712418e-05,
"loss": 0.6471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30918407440185547,
"step": 265,
"valid_targets_mean": 4111.1,
"valid_targets_min": 1461
},
{
"epoch": 0.4125286478227655,
"grad_norm": 0.7932880947679686,
"learning_rate": 2.3442265795206974e-05,
"loss": 0.635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38556236028671265,
"step": 270,
"valid_targets_mean": 3402.2,
"valid_targets_min": 679
},
{
"epoch": 0.42016806722689076,
"grad_norm": 0.7336631307032824,
"learning_rate": 2.387799564270153e-05,
"loss": 0.6027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2884320020675659,
"step": 275,
"valid_targets_mean": 3283.2,
"valid_targets_min": 825
},
{
"epoch": 0.42780748663101603,
"grad_norm": 0.7987572249200825,
"learning_rate": 2.431372549019608e-05,
"loss": 0.5793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.303595632314682,
"step": 280,
"valid_targets_mean": 3274.4,
"valid_targets_min": 1782
},
{
"epoch": 0.43544690603514136,
"grad_norm": 0.7921872393026232,
"learning_rate": 2.4749455337690634e-05,
"loss": 0.6192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34139686822891235,
"step": 285,
"valid_targets_mean": 3101.2,
"valid_targets_min": 800
},
{
"epoch": 0.4430863254392666,
"grad_norm": 0.745571535038673,
"learning_rate": 2.5185185185185187e-05,
"loss": 0.628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32645875215530396,
"step": 290,
"valid_targets_mean": 3515.2,
"valid_targets_min": 608
},
{
"epoch": 0.4507257448433919,
"grad_norm": 0.7733455760458197,
"learning_rate": 2.562091503267974e-05,
"loss": 0.6153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41803407669067383,
"step": 295,
"valid_targets_mean": 3754.2,
"valid_targets_min": 1141
},
{
"epoch": 0.45836516424751717,
"grad_norm": 0.8925987187590559,
"learning_rate": 2.6056644880174295e-05,
"loss": 0.6203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3707024157047272,
"step": 300,
"valid_targets_mean": 2850.6,
"valid_targets_min": 1689
},
{
"epoch": 0.4660045836516425,
"grad_norm": 0.8036647475977927,
"learning_rate": 2.6492374727668847e-05,
"loss": 0.6258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2339508831501007,
"step": 305,
"valid_targets_mean": 2463.9,
"valid_targets_min": 874
},
{
"epoch": 0.47364400305576776,
"grad_norm": 0.7031610335825725,
"learning_rate": 2.6928104575163403e-05,
"loss": 0.6027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25344857573509216,
"step": 310,
"valid_targets_mean": 2872.8,
"valid_targets_min": 1174
},
{
"epoch": 0.48128342245989303,
"grad_norm": 0.7480718215833951,
"learning_rate": 2.736383442265795e-05,
"loss": 0.6064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21547476947307587,
"step": 315,
"valid_targets_mean": 2392.2,
"valid_targets_min": 794
},
{
"epoch": 0.48892284186401835,
"grad_norm": 0.8331408619239437,
"learning_rate": 2.7799564270152507e-05,
"loss": 0.6047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2768464684486389,
"step": 320,
"valid_targets_mean": 2553.5,
"valid_targets_min": 1043
},
{
"epoch": 0.4965622612681436,
"grad_norm": 0.8087367473209722,
"learning_rate": 2.8235294117647063e-05,
"loss": 0.6213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26989734172821045,
"step": 325,
"valid_targets_mean": 3067.9,
"valid_targets_min": 1005
},
{
"epoch": 0.5042016806722689,
"grad_norm": 0.7776781031068692,
"learning_rate": 2.8671023965141612e-05,
"loss": 0.5847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27393457293510437,
"step": 330,
"valid_targets_mean": 2845.4,
"valid_targets_min": 1012
},
{
"epoch": 0.5118411000763942,
"grad_norm": 0.8248214347980428,
"learning_rate": 2.9106753812636168e-05,
"loss": 0.6142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2886251211166382,
"step": 335,
"valid_targets_mean": 3156.9,
"valid_targets_min": 1121
},
{
"epoch": 0.5194805194805194,
"grad_norm": 0.7871145452467468,
"learning_rate": 2.9542483660130724e-05,
"loss": 0.6064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22021612524986267,
"step": 340,
"valid_targets_mean": 1920.1,
"valid_targets_min": 1098
},
{
"epoch": 0.5271199388846448,
"grad_norm": 0.6598524132491371,
"learning_rate": 2.9978213507625272e-05,
"loss": 0.5969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3316832184791565,
"step": 345,
"valid_targets_mean": 4670.0,
"valid_targets_min": 1362
},
{
"epoch": 0.5347593582887701,
"grad_norm": 0.7714969570983577,
"learning_rate": 3.0413943355119828e-05,
"loss": 0.5802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3330127000808716,
"step": 350,
"valid_targets_mean": 3081.5,
"valid_targets_min": 1703
},
{
"epoch": 0.5423987776928954,
"grad_norm": 0.7754477862247269,
"learning_rate": 3.0849673202614384e-05,
"loss": 0.6115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28545576333999634,
"step": 355,
"valid_targets_mean": 2166.5,
"valid_targets_min": 1009
},
{
"epoch": 0.5500381970970206,
"grad_norm": 0.9165516616675281,
"learning_rate": 3.1285403050108936e-05,
"loss": 0.5981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3413655459880829,
"step": 360,
"valid_targets_mean": 2802.4,
"valid_targets_min": 641
},
{
"epoch": 0.5576776165011459,
"grad_norm": 0.7628767779169452,
"learning_rate": 3.172113289760349e-05,
"loss": 0.5909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37848758697509766,
"step": 365,
"valid_targets_mean": 3536.0,
"valid_targets_min": 778
},
{
"epoch": 0.5653170359052712,
"grad_norm": 0.6456443237893429,
"learning_rate": 3.215686274509804e-05,
"loss": 0.5739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23117348551750183,
"step": 370,
"valid_targets_mean": 3513.4,
"valid_targets_min": 1334
},
{
"epoch": 0.5729564553093965,
"grad_norm": 0.7131390860118433,
"learning_rate": 3.259259259259259e-05,
"loss": 0.5903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28896501660346985,
"step": 375,
"valid_targets_mean": 3813.5,
"valid_targets_min": 1767
},
{
"epoch": 0.5805958747135218,
"grad_norm": 0.7059247357677485,
"learning_rate": 3.3028322440087146e-05,
"loss": 0.5981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2769196033477783,
"step": 380,
"valid_targets_mean": 3733.4,
"valid_targets_min": 991
},
{
"epoch": 0.5882352941176471,
"grad_norm": 0.7099487325643025,
"learning_rate": 3.3464052287581705e-05,
"loss": 0.574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2509758472442627,
"step": 385,
"valid_targets_mean": 3110.4,
"valid_targets_min": 1557
},
{
"epoch": 0.5958747135217723,
"grad_norm": 0.73751067378954,
"learning_rate": 3.389978213507625e-05,
"loss": 0.5929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2418426275253296,
"step": 390,
"valid_targets_mean": 2331.1,
"valid_targets_min": 907
},
{
"epoch": 0.6035141329258976,
"grad_norm": 0.6947985101021568,
"learning_rate": 3.433551198257081e-05,
"loss": 0.6145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24075086414813995,
"step": 395,
"valid_targets_mean": 3555.6,
"valid_targets_min": 1443
},
{
"epoch": 0.6111535523300229,
"grad_norm": 0.6913463347195935,
"learning_rate": 3.477124183006536e-05,
"loss": 0.5987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3037499189376831,
"step": 400,
"valid_targets_mean": 4055.1,
"valid_targets_min": 888
},
{
"epoch": 0.6187929717341482,
"grad_norm": 0.790293928960079,
"learning_rate": 3.5206971677559914e-05,
"loss": 0.572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2849627733230591,
"step": 405,
"valid_targets_mean": 3600.0,
"valid_targets_min": 2347
},
{
"epoch": 0.6264323911382735,
"grad_norm": 0.7315439623965397,
"learning_rate": 3.5642701525054466e-05,
"loss": 0.5668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3170517086982727,
"step": 410,
"valid_targets_mean": 3977.9,
"valid_targets_min": 1021
},
{
"epoch": 0.6340718105423988,
"grad_norm": 0.7687583162677026,
"learning_rate": 3.6078431372549025e-05,
"loss": 0.6283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3087868094444275,
"step": 415,
"valid_targets_mean": 2945.9,
"valid_targets_min": 1360
},
{
"epoch": 0.6417112299465241,
"grad_norm": 0.7628238951175478,
"learning_rate": 3.651416122004358e-05,
"loss": 0.5964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33389556407928467,
"step": 420,
"valid_targets_mean": 3730.8,
"valid_targets_min": 1417
},
{
"epoch": 0.6493506493506493,
"grad_norm": 0.6695423107998377,
"learning_rate": 3.694989106753813e-05,
"loss": 0.5885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22009310126304626,
"step": 425,
"valid_targets_mean": 3358.6,
"valid_targets_min": 605
},
{
"epoch": 0.6569900687547746,
"grad_norm": 0.82620661841163,
"learning_rate": 3.738562091503268e-05,
"loss": 0.5811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26666954159736633,
"step": 430,
"valid_targets_mean": 2360.4,
"valid_targets_min": 821
},
{
"epoch": 0.6646294881588999,
"grad_norm": 0.6929939957736985,
"learning_rate": 3.7821350762527235e-05,
"loss": 0.5774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22594678401947021,
"step": 435,
"valid_targets_mean": 2447.9,
"valid_targets_min": 1251
},
{
"epoch": 0.6722689075630253,
"grad_norm": 0.7019484401785123,
"learning_rate": 3.825708061002179e-05,
"loss": 0.5808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3131728768348694,
"step": 440,
"valid_targets_mean": 3665.8,
"valid_targets_min": 253
},
{
"epoch": 0.6799083269671505,
"grad_norm": 0.6685256141352108,
"learning_rate": 3.8692810457516346e-05,
"loss": 0.5552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2552865147590637,
"step": 445,
"valid_targets_mean": 3354.5,
"valid_targets_min": 910
},
{
"epoch": 0.6875477463712758,
"grad_norm": 0.7265392876508043,
"learning_rate": 3.91285403050109e-05,
"loss": 0.5729,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2652282118797302,
"step": 450,
"valid_targets_mean": 2713.8,
"valid_targets_min": 985
},
{
"epoch": 0.6951871657754011,
"grad_norm": 0.6360107272199381,
"learning_rate": 3.956427015250545e-05,
"loss": 0.6083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2762466073036194,
"step": 455,
"valid_targets_mean": 4311.1,
"valid_targets_min": 1273
},
{
"epoch": 0.7028265851795263,
"grad_norm": 0.671880392414106,
"learning_rate": 4e-05,
"loss": 0.5937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2647872865200043,
"step": 460,
"valid_targets_mean": 3698.0,
"valid_targets_min": 1609
},
{
"epoch": 0.7104660045836516,
"grad_norm": 0.6591072439688226,
"learning_rate": 3.999985506249457e-05,
"loss": 0.5958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27107876539230347,
"step": 465,
"valid_targets_mean": 3154.5,
"valid_targets_min": 1080
},
{
"epoch": 0.7181054239877769,
"grad_norm": 0.779690577173135,
"learning_rate": 3.9999420252078994e-05,
"loss": 0.5721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27595773339271545,
"step": 470,
"valid_targets_mean": 3683.6,
"valid_targets_min": 657
},
{
"epoch": 0.7257448433919023,
"grad_norm": 0.6772343189565297,
"learning_rate": 3.9998695575055276e-05,
"loss": 0.5944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38341811299324036,
"step": 475,
"valid_targets_mean": 4689.9,
"valid_targets_min": 1562
},
{
"epoch": 0.7333842627960275,
"grad_norm": 0.8079543845936882,
"learning_rate": 3.9997681041926714e-05,
"loss": 0.5551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.338105171918869,
"step": 480,
"valid_targets_mean": 2228.9,
"valid_targets_min": 692
},
{
"epoch": 0.7410236822001528,
"grad_norm": 0.6586142611830866,
"learning_rate": 3.99963766673977e-05,
"loss": 0.5536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2373753786087036,
"step": 485,
"valid_targets_mean": 3322.0,
"valid_targets_min": 648
},
{
"epoch": 0.7486631016042781,
"grad_norm": 0.7147237521146843,
"learning_rate": 3.999478247037352e-05,
"loss": 0.5756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3543473482131958,
"step": 490,
"valid_targets_mean": 4644.6,
"valid_targets_min": 1033
},
{
"epoch": 0.7563025210084033,
"grad_norm": 0.7867926605712047,
"learning_rate": 3.999289847396006e-05,
"loss": 0.6146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33008497953414917,
"step": 495,
"valid_targets_mean": 3087.8,
"valid_targets_min": 1208
},
{
"epoch": 0.7639419404125286,
"grad_norm": 0.6172355973475613,
"learning_rate": 3.9990724705463495e-05,
"loss": 0.5805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37864190340042114,
"step": 500,
"valid_targets_mean": 5465.1,
"valid_targets_min": 1357
},
{
"epoch": 0.771581359816654,
"grad_norm": 0.7480683025973461,
"learning_rate": 3.998826119638989e-05,
"loss": 0.5759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2788500487804413,
"step": 505,
"valid_targets_mean": 3069.6,
"valid_targets_min": 1494
},
{
"epoch": 0.7792207792207793,
"grad_norm": 0.7137435243602375,
"learning_rate": 3.998550798244472e-05,
"loss": 0.5894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3722362518310547,
"step": 510,
"valid_targets_mean": 3935.2,
"valid_targets_min": 1150
},
{
"epoch": 0.7868601986249045,
"grad_norm": 0.7133729047894137,
"learning_rate": 3.9982465103532386e-05,
"loss": 0.5479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29172253608703613,
"step": 515,
"valid_targets_mean": 3255.4,
"valid_targets_min": 1224
},
{
"epoch": 0.7944996180290298,
"grad_norm": 0.8123949372956061,
"learning_rate": 3.997913260375562e-05,
"loss": 0.5928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29111629724502563,
"step": 520,
"valid_targets_mean": 2608.0,
"valid_targets_min": 1413
},
{
"epoch": 0.8021390374331551,
"grad_norm": 0.7607753286866613,
"learning_rate": 3.9975510531414835e-05,
"loss": 0.5838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3003314435482025,
"step": 525,
"valid_targets_mean": 3636.6,
"valid_targets_min": 886
},
{
"epoch": 0.8097784568372803,
"grad_norm": 0.7593775820169156,
"learning_rate": 3.997159893900745e-05,
"loss": 0.5411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2764055132865906,
"step": 530,
"valid_targets_mean": 2633.2,
"valid_targets_min": 1343
},
{
"epoch": 0.8174178762414056,
"grad_norm": 0.7550291803600192,
"learning_rate": 3.9967397883227104e-05,
"loss": 0.5935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2789875566959381,
"step": 535,
"valid_targets_mean": 2900.9,
"valid_targets_min": 748
},
{
"epoch": 0.825057295645531,
"grad_norm": 0.6099292035548061,
"learning_rate": 3.9962907424962856e-05,
"loss": 0.5777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2896302044391632,
"step": 540,
"valid_targets_mean": 4579.8,
"valid_targets_min": 926
},
{
"epoch": 0.8326967150496563,
"grad_norm": 0.6670417720845128,
"learning_rate": 3.995812762929829e-05,
"loss": 0.6051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20029598474502563,
"step": 545,
"valid_targets_mean": 2811.9,
"valid_targets_min": 1070
},
{
"epoch": 0.8403361344537815,
"grad_norm": 0.9488128832161037,
"learning_rate": 3.995305856551057e-05,
"loss": 0.5861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22825755178928375,
"step": 550,
"valid_targets_mean": 2501.6,
"valid_targets_min": 798
},
{
"epoch": 0.8479755538579068,
"grad_norm": 0.6086366642647173,
"learning_rate": 3.994770030706944e-05,
"loss": 0.5494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3427432179450989,
"step": 555,
"valid_targets_mean": 5665.4,
"valid_targets_min": 741
},
{
"epoch": 0.8556149732620321,
"grad_norm": 0.70513202037968,
"learning_rate": 3.994205293163616e-05,
"loss": 0.5937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29944777488708496,
"step": 560,
"valid_targets_mean": 3229.2,
"valid_targets_min": 1980
},
{
"epoch": 0.8632543926661573,
"grad_norm": 0.9851639022765896,
"learning_rate": 3.9936116521062376e-05,
"loss": 0.5482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28550928831100464,
"step": 565,
"valid_targets_mean": 3211.6,
"valid_targets_min": 811
},
{
"epoch": 0.8708938120702827,
"grad_norm": 0.7534779579928215,
"learning_rate": 3.992989116138895e-05,
"loss": 0.5766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2996383011341095,
"step": 570,
"valid_targets_mean": 3115.0,
"valid_targets_min": 1197
},
{
"epoch": 0.878533231474408,
"grad_norm": 0.7458527629855309,
"learning_rate": 3.99233769428447e-05,
"loss": 0.5918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23829689621925354,
"step": 575,
"valid_targets_mean": 2372.4,
"valid_targets_min": 949
},
{
"epoch": 0.8861726508785333,
"grad_norm": 0.7068928044009853,
"learning_rate": 3.991657395984507e-05,
"loss": 0.5691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30755138397216797,
"step": 580,
"valid_targets_mean": 3072.1,
"valid_targets_min": 1216
},
{
"epoch": 0.8938120702826585,
"grad_norm": 0.7004756487633861,
"learning_rate": 3.99094823109908e-05,
"loss": 0.602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21224084496498108,
"step": 585,
"valid_targets_mean": 2138.5,
"valid_targets_min": 663
},
{
"epoch": 0.9014514896867838,
"grad_norm": 0.681477572048519,
"learning_rate": 3.990210209906649e-05,
"loss": 0.5667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23268462717533112,
"step": 590,
"valid_targets_mean": 3107.2,
"valid_targets_min": 2053
},
{
"epoch": 0.9090909090909091,
"grad_norm": 1.0438675359941987,
"learning_rate": 3.989443343103908e-05,
"loss": 0.5745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3275293707847595,
"step": 595,
"valid_targets_mean": 3463.5,
"valid_targets_min": 1444
},
{
"epoch": 0.9167303284950343,
"grad_norm": 0.7400160340371931,
"learning_rate": 3.9886476418056336e-05,
"loss": 0.5671,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3153223991394043,
"step": 600,
"valid_targets_mean": 3044.6,
"valid_targets_min": 722
},
{
"epoch": 0.9243697478991597,
"grad_norm": 0.6652294370667957,
"learning_rate": 3.987823117544522e-05,
"loss": 0.5372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.389309823513031,
"step": 605,
"valid_targets_mean": 4362.6,
"valid_targets_min": 946
},
{
"epoch": 0.932009167303285,
"grad_norm": 0.6212675682208829,
"learning_rate": 3.986969782271022e-05,
"loss": 0.5665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21082836389541626,
"step": 610,
"valid_targets_mean": 3255.6,
"valid_targets_min": 1697
},
{
"epoch": 0.9396485867074102,
"grad_norm": 0.6862137461635358,
"learning_rate": 3.986087648353162e-05,
"loss": 0.6083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2789027988910675,
"step": 615,
"valid_targets_mean": 2877.1,
"valid_targets_min": 469
},
{
"epoch": 0.9472880061115355,
"grad_norm": 0.6028470891869618,
"learning_rate": 3.985176728576371e-05,
"loss": 0.5559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2874605655670166,
"step": 620,
"valid_targets_mean": 4492.4,
"valid_targets_min": 2143
},
{
"epoch": 0.9549274255156608,
"grad_norm": 0.7101556487572386,
"learning_rate": 3.984237036143293e-05,
"loss": 0.5598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23973211646080017,
"step": 625,
"valid_targets_mean": 2781.4,
"valid_targets_min": 1607
},
{
"epoch": 0.9625668449197861,
"grad_norm": 0.6406876645725995,
"learning_rate": 3.9832685846735965e-05,
"loss": 0.5471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23441874980926514,
"step": 630,
"valid_targets_mean": 3437.4,
"valid_targets_min": 795
},
{
"epoch": 0.9702062643239114,
"grad_norm": 0.8179086861154274,
"learning_rate": 3.982271388203775e-05,
"loss": 0.601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24605703353881836,
"step": 635,
"valid_targets_mean": 2201.5,
"valid_targets_min": 870
},
{
"epoch": 0.9778456837280367,
"grad_norm": 0.7379654548504041,
"learning_rate": 3.981245461186945e-05,
"loss": 0.5831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2373408079147339,
"step": 640,
"valid_targets_mean": 1922.5,
"valid_targets_min": 507
},
{
"epoch": 0.985485103132162,
"grad_norm": 0.6325975201384703,
"learning_rate": 3.980190818492637e-05,
"loss": 0.563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22413653135299683,
"step": 645,
"valid_targets_mean": 2914.0,
"valid_targets_min": 816
},
{
"epoch": 0.9931245225362872,
"grad_norm": 0.7202033071183617,
"learning_rate": 3.979107475406579e-05,
"loss": 0.6126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4340353012084961,
"step": 650,
"valid_targets_mean": 3802.1,
"valid_targets_min": 1421
},
{
"epoch": 1.0,
"grad_norm": 1.1116558746504048,
"learning_rate": 3.977995447630475e-05,
"loss": 0.5592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5354721546173096,
"step": 655,
"valid_targets_mean": 2106.2,
"valid_targets_min": 858
},
{
"epoch": 1.0076394194041254,
"grad_norm": 0.6522118231154711,
"learning_rate": 3.9768547512817794e-05,
"loss": 0.5855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2696242332458496,
"step": 660,
"valid_targets_mean": 2601.8,
"valid_targets_min": 841
},
{
"epoch": 1.0152788388082505,
"grad_norm": 0.7282006050891634,
"learning_rate": 3.9756854028934604e-05,
"loss": 0.5707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30138200521469116,
"step": 665,
"valid_targets_mean": 3397.9,
"valid_targets_min": 933
},
{
"epoch": 1.022918258212376,
"grad_norm": 0.6705684638682171,
"learning_rate": 3.974487419413761e-05,
"loss": 0.5371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26151737570762634,
"step": 670,
"valid_targets_mean": 3653.8,
"valid_targets_min": 550
},
{
"epoch": 1.030557677616501,
"grad_norm": 0.723948374365064,
"learning_rate": 3.973260818205955e-05,
"loss": 0.5463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3313744366168976,
"step": 675,
"valid_targets_mean": 3186.4,
"valid_targets_min": 1538
},
{
"epoch": 1.0381970970206265,
"grad_norm": 0.7836642368648493,
"learning_rate": 3.972005617048094e-05,
"loss": 0.5226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37249183654785156,
"step": 680,
"valid_targets_mean": 3745.6,
"valid_targets_min": 1744
},
{
"epoch": 1.0458365164247516,
"grad_norm": 0.6689920597254674,
"learning_rate": 3.970721834132751e-05,
"loss": 0.5186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.237932026386261,
"step": 685,
"valid_targets_mean": 2938.4,
"valid_targets_min": 925
},
{
"epoch": 1.053475935828877,
"grad_norm": 0.6766713408339188,
"learning_rate": 3.969409488066756e-05,
"loss": 0.5645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27513009309768677,
"step": 690,
"valid_targets_mean": 3106.2,
"valid_targets_min": 796
},
{
"epoch": 1.0611153552330024,
"grad_norm": 0.7249242616575575,
"learning_rate": 3.9680685978709254e-05,
"loss": 0.5285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3080906271934509,
"step": 695,
"valid_targets_mean": 3352.1,
"valid_targets_min": 801
},
{
"epoch": 1.0687547746371275,
"grad_norm": 0.6371623942622592,
"learning_rate": 3.966699182979785e-05,
"loss": 0.5529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2962953448295593,
"step": 700,
"valid_targets_mean": 4250.9,
"valid_targets_min": 1290
},
{
"epoch": 1.076394194041253,
"grad_norm": 0.7676470422260585,
"learning_rate": 3.965301263241296e-05,
"loss": 0.5641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2619950473308563,
"step": 705,
"valid_targets_mean": 2716.8,
"valid_targets_min": 1882
},
{
"epoch": 1.084033613445378,
"grad_norm": 0.6587402474304499,
"learning_rate": 3.963874858916556e-05,
"loss": 0.5408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28987687826156616,
"step": 710,
"valid_targets_mean": 3787.6,
"valid_targets_min": 1143
},
{
"epoch": 1.0916730328495035,
"grad_norm": 0.6913158304836163,
"learning_rate": 3.9624199906795136e-05,
"loss": 0.5436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28918856382369995,
"step": 715,
"valid_targets_mean": 4839.6,
"valid_targets_min": 1376
},
{
"epoch": 1.0993124522536286,
"grad_norm": 0.703709027064511,
"learning_rate": 3.960936679616667e-05,
"loss": 0.5102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26379460096359253,
"step": 720,
"valid_targets_mean": 3043.2,
"valid_targets_min": 641
},
{
"epoch": 1.106951871657754,
"grad_norm": 0.5380096123166979,
"learning_rate": 3.959424947226756e-05,
"loss": 0.5143,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24659261107444763,
"step": 725,
"valid_targets_mean": 4539.6,
"valid_targets_min": 596
},
{
"epoch": 1.1145912910618794,
"grad_norm": 0.6464956071511203,
"learning_rate": 3.957884815420453e-05,
"loss": 0.5857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19127747416496277,
"step": 730,
"valid_targets_mean": 2436.2,
"valid_targets_min": 600
},
{
"epoch": 1.1222307104660045,
"grad_norm": 0.7029816183033232,
"learning_rate": 3.956316306520044e-05,
"loss": 0.5619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28624215722084045,
"step": 735,
"valid_targets_mean": 3306.8,
"valid_targets_min": 1178
},
{
"epoch": 1.12987012987013,
"grad_norm": 0.6838882183908288,
"learning_rate": 3.9547194432591066e-05,
"loss": 0.5111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3031734824180603,
"step": 740,
"valid_targets_mean": 3253.0,
"valid_targets_min": 1106
},
{
"epoch": 1.137509549274255,
"grad_norm": 0.6539220963516174,
"learning_rate": 3.9530942487821785e-05,
"loss": 0.5282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22544610500335693,
"step": 745,
"valid_targets_mean": 2679.9,
"valid_targets_min": 825
},
{
"epoch": 1.1451489686783805,
"grad_norm": 0.6232994419948458,
"learning_rate": 3.951440746644422e-05,
"loss": 0.5659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22838760912418365,
"step": 750,
"valid_targets_mean": 3408.6,
"valid_targets_min": 1703
},
{
"epoch": 1.1527883880825058,
"grad_norm": 0.7040726919722308,
"learning_rate": 3.949758960811284e-05,
"loss": 0.5475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23174643516540527,
"step": 755,
"valid_targets_mean": 2185.2,
"valid_targets_min": 430
},
{
"epoch": 1.160427807486631,
"grad_norm": 0.6789214431654883,
"learning_rate": 3.9480489156581514e-05,
"loss": 0.521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28578507900238037,
"step": 760,
"valid_targets_mean": 3754.8,
"valid_targets_min": 568
},
{
"epoch": 1.1680672268907564,
"grad_norm": 0.7733782691321108,
"learning_rate": 3.94631063596999e-05,
"loss": 0.5316,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2440919578075409,
"step": 765,
"valid_targets_mean": 2929.8,
"valid_targets_min": 928
},
{
"epoch": 1.1757066462948815,
"grad_norm": 0.6473357152162962,
"learning_rate": 3.9445441469409924e-05,
"loss": 0.5058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3352232277393341,
"step": 770,
"valid_targets_mean": 4502.8,
"valid_targets_min": 950
},
{
"epoch": 1.183346065699007,
"grad_norm": 0.7669883434486255,
"learning_rate": 3.94274947417421e-05,
"loss": 0.5436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27057844400405884,
"step": 775,
"valid_targets_mean": 3110.5,
"valid_targets_min": 812
},
{
"epoch": 1.190985485103132,
"grad_norm": 0.7542936395101697,
"learning_rate": 3.9409266436811824e-05,
"loss": 0.5254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21778935194015503,
"step": 780,
"valid_targets_mean": 4820.9,
"valid_targets_min": 2305
},
{
"epoch": 1.1986249045072574,
"grad_norm": 0.7606927697328497,
"learning_rate": 3.9390756818815605e-05,
"loss": 0.5343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33282411098480225,
"step": 785,
"valid_targets_mean": 2609.5,
"valid_targets_min": 826
},
{
"epoch": 1.2062643239113828,
"grad_norm": 0.7384013328069043,
"learning_rate": 3.937196615602722e-05,
"loss": 0.5432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34026217460632324,
"step": 790,
"valid_targets_mean": 3617.6,
"valid_targets_min": 682
},
{
"epoch": 1.213903743315508,
"grad_norm": 0.7436645557686744,
"learning_rate": 3.9352894720793844e-05,
"loss": 0.5174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2270776778459549,
"step": 795,
"valid_targets_mean": 2522.6,
"valid_targets_min": 1883
},
{
"epoch": 1.2215431627196334,
"grad_norm": 0.7123365313732616,
"learning_rate": 3.9333542789532116e-05,
"loss": 0.5672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3193785548210144,
"step": 800,
"valid_targets_mean": 3023.6,
"valid_targets_min": 1119
},
{
"epoch": 1.2291825821237585,
"grad_norm": 0.7643663765177652,
"learning_rate": 3.9313910642724084e-05,
"loss": 0.518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1887185126543045,
"step": 805,
"valid_targets_mean": 1951.9,
"valid_targets_min": 978
},
{
"epoch": 1.236822001527884,
"grad_norm": 0.6346468679822354,
"learning_rate": 3.92939985649132e-05,
"loss": 0.5205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29271286725997925,
"step": 810,
"valid_targets_mean": 4557.6,
"valid_targets_min": 919
},
{
"epoch": 1.244461420932009,
"grad_norm": 0.6343394889103051,
"learning_rate": 3.927380684470016e-05,
"loss": 0.5072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1973128616809845,
"step": 815,
"valid_targets_mean": 2726.2,
"valid_targets_min": 842
},
{
"epoch": 1.2521008403361344,
"grad_norm": 0.6630789556378238,
"learning_rate": 3.9253335774738693e-05,
"loss": 0.5256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32815930247306824,
"step": 820,
"valid_targets_mean": 3497.5,
"valid_targets_min": 698
},
{
"epoch": 1.2597402597402598,
"grad_norm": 0.6526796753186936,
"learning_rate": 3.92325856517314e-05,
"loss": 0.5265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2999138832092285,
"step": 825,
"valid_targets_mean": 3903.5,
"valid_targets_min": 1335
},
{
"epoch": 1.267379679144385,
"grad_norm": 0.7827981591665036,
"learning_rate": 3.9211556776425374e-05,
"loss": 0.5689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3150915205478668,
"step": 830,
"valid_targets_mean": 2640.9,
"valid_targets_min": 1350
},
{
"epoch": 1.2750190985485104,
"grad_norm": 0.7247020902846159,
"learning_rate": 3.919024945360791e-05,
"loss": 0.5661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33880436420440674,
"step": 835,
"valid_targets_mean": 3613.6,
"valid_targets_min": 859
},
{
"epoch": 1.2826585179526355,
"grad_norm": 0.6163344529726824,
"learning_rate": 3.916866399210201e-05,
"loss": 0.5022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2479287087917328,
"step": 840,
"valid_targets_mean": 3889.8,
"valid_targets_min": 748
},
{
"epoch": 1.290297937356761,
"grad_norm": 0.5806538155279558,
"learning_rate": 3.9146800704761976e-05,
"loss": 0.5273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31038084626197815,
"step": 845,
"valid_targets_mean": 4618.4,
"valid_targets_min": 1615
},
{
"epoch": 1.2979373567608863,
"grad_norm": 0.6961922232392995,
"learning_rate": 3.912465990846884e-05,
"loss": 0.539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.347188800573349,
"step": 850,
"valid_targets_mean": 3624.2,
"valid_targets_min": 1515
},
{
"epoch": 1.3055767761650114,
"grad_norm": 0.710377247785307,
"learning_rate": 3.910224192412578e-05,
"loss": 0.542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3642812967300415,
"step": 855,
"valid_targets_mean": 3940.1,
"valid_targets_min": 1113
},
{
"epoch": 1.3132161955691368,
"grad_norm": 0.7270203911442068,
"learning_rate": 3.9079547076653466e-05,
"loss": 0.5641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16767947375774384,
"step": 860,
"valid_targets_mean": 1617.4,
"valid_targets_min": 843
},
{
"epoch": 1.320855614973262,
"grad_norm": 0.6324169969165148,
"learning_rate": 3.9056575694985356e-05,
"loss": 0.5432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20532405376434326,
"step": 865,
"valid_targets_mean": 3589.0,
"valid_targets_min": 1289
},
{
"epoch": 1.3284950343773874,
"grad_norm": 0.8074126717640064,
"learning_rate": 3.903332811206293e-05,
"loss": 0.5787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3212442398071289,
"step": 870,
"valid_targets_mean": 3137.5,
"valid_targets_min": 1116
},
{
"epoch": 1.3361344537815127,
"grad_norm": 0.6871709684384119,
"learning_rate": 3.900980466483085e-05,
"loss": 0.5364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2149738073348999,
"step": 875,
"valid_targets_mean": 2576.8,
"valid_targets_min": 716
},
{
"epoch": 1.343773873185638,
"grad_norm": 0.6932421836403329,
"learning_rate": 3.89860056942321e-05,
"loss": 0.5189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2367231249809265,
"step": 880,
"valid_targets_mean": 2527.0,
"valid_targets_min": 1013
},
{
"epoch": 1.351413292589763,
"grad_norm": 0.6497125710859505,
"learning_rate": 3.896193154520302e-05,
"loss": 0.5318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3200853168964386,
"step": 885,
"valid_targets_mean": 4165.2,
"valid_targets_min": 1149
},
{
"epoch": 1.3590527119938884,
"grad_norm": 0.7278203456258373,
"learning_rate": 3.8937582566668324e-05,
"loss": 0.515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1707996428012848,
"step": 890,
"valid_targets_mean": 2198.4,
"valid_targets_min": 1103
},
{
"epoch": 1.3666921313980138,
"grad_norm": 0.6901081116464821,
"learning_rate": 3.891295911153601e-05,
"loss": 0.5303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2586451470851898,
"step": 895,
"valid_targets_mean": 3480.6,
"valid_targets_min": 496
},
{
"epoch": 1.374331550802139,
"grad_norm": 0.75802472802529,
"learning_rate": 3.888806153669233e-05,
"loss": 0.5403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3226444125175476,
"step": 900,
"valid_targets_mean": 3047.5,
"valid_targets_min": 1296
},
{
"epoch": 1.3819709702062644,
"grad_norm": 0.7026070572178644,
"learning_rate": 3.88628902029965e-05,
"loss": 0.5463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2279137670993805,
"step": 905,
"valid_targets_mean": 2393.0,
"valid_targets_min": 970
},
{
"epoch": 1.3896103896103895,
"grad_norm": 0.7385335795568237,
"learning_rate": 3.883744547527555e-05,
"loss": 0.5348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23169125616550446,
"step": 910,
"valid_targets_mean": 2278.2,
"valid_targets_min": 852
},
{
"epoch": 1.397249809014515,
"grad_norm": 0.6321022169220797,
"learning_rate": 3.881172772231903e-05,
"loss": 0.5418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22475971281528473,
"step": 915,
"valid_targets_mean": 3198.1,
"valid_targets_min": 1456
},
{
"epoch": 1.4048892284186403,
"grad_norm": 0.61696149669697,
"learning_rate": 3.878573731687362e-05,
"loss": 0.572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22539305686950684,
"step": 920,
"valid_targets_mean": 3476.6,
"valid_targets_min": 597
},
{
"epoch": 1.4125286478227654,
"grad_norm": 0.7842361184386845,
"learning_rate": 3.8759474635637785e-05,
"loss": 0.529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2607775926589966,
"step": 925,
"valid_targets_mean": 2646.8,
"valid_targets_min": 469
},
{
"epoch": 1.4201680672268908,
"grad_norm": 0.7454444565263518,
"learning_rate": 3.8732940059256276e-05,
"loss": 0.5537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2992340326309204,
"step": 930,
"valid_targets_mean": 2702.8,
"valid_targets_min": 1111
},
{
"epoch": 1.427807486631016,
"grad_norm": 0.6734402228717832,
"learning_rate": 3.870613397231462e-05,
"loss": 0.5306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26427602767944336,
"step": 935,
"valid_targets_mean": 3468.4,
"valid_targets_min": 825
},
{
"epoch": 1.4354469060351414,
"grad_norm": 0.6807817371217704,
"learning_rate": 3.867905676333354e-05,
"loss": 0.5311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2101900577545166,
"step": 940,
"valid_targets_mean": 2051.8,
"valid_targets_min": 1237
},
{
"epoch": 1.4430863254392667,
"grad_norm": 0.7057342976825963,
"learning_rate": 3.8651708824763384e-05,
"loss": 0.5346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1674555391073227,
"step": 945,
"valid_targets_mean": 2166.4,
"valid_targets_min": 982
},
{
"epoch": 1.450725744843392,
"grad_norm": 0.7101649627528165,
"learning_rate": 3.862409055297831e-05,
"loss": 0.5648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19412991404533386,
"step": 950,
"valid_targets_mean": 2372.6,
"valid_targets_min": 1010
},
{
"epoch": 1.458365164247517,
"grad_norm": 0.7124796816451234,
"learning_rate": 3.8596202348270695e-05,
"loss": 0.525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34211790561676025,
"step": 955,
"valid_targets_mean": 3600.6,
"valid_targets_min": 1749
},
{
"epoch": 1.4660045836516424,
"grad_norm": 0.6495231524844639,
"learning_rate": 3.85680446148452e-05,
"loss": 0.5238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2449973225593567,
"step": 960,
"valid_targets_mean": 3596.6,
"valid_targets_min": 1903
},
{
"epoch": 1.4736440030557678,
"grad_norm": 0.7385068351743556,
"learning_rate": 3.853961776081299e-05,
"loss": 0.558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2591915726661682,
"step": 965,
"valid_targets_mean": 2599.1,
"valid_targets_min": 746
},
{
"epoch": 1.481283422459893,
"grad_norm": 0.6640970141796577,
"learning_rate": 3.8510922198185805e-05,
"loss": 0.5318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2822009325027466,
"step": 970,
"valid_targets_mean": 3411.0,
"valid_targets_min": 945
},
{
"epoch": 1.4889228418640184,
"grad_norm": 0.728614551507354,
"learning_rate": 3.8481958342869966e-05,
"loss": 0.5603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.47605425119400024,
"step": 975,
"valid_targets_mean": 4951.6,
"valid_targets_min": 921
},
{
"epoch": 1.4965622612681435,
"grad_norm": 0.5670458089086574,
"learning_rate": 3.8452726614660364e-05,
"loss": 0.4938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.246848464012146,
"step": 980,
"valid_targets_mean": 3967.6,
"valid_targets_min": 1739
},
{
"epoch": 1.504201680672269,
"grad_norm": 0.5967985021594041,
"learning_rate": 3.8423227437234385e-05,
"loss": 0.5159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21474456787109375,
"step": 985,
"valid_targets_mean": 3238.4,
"valid_targets_min": 1693
},
{
"epoch": 1.5118411000763943,
"grad_norm": 0.5896858060191866,
"learning_rate": 3.8393461238145737e-05,
"loss": 0.5241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27799534797668457,
"step": 990,
"valid_targets_mean": 3818.8,
"valid_targets_min": 1460
},
{
"epoch": 1.5194805194805194,
"grad_norm": 0.6403716120248297,
"learning_rate": 3.83634284488183e-05,
"loss": 0.5646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.310907781124115,
"step": 995,
"valid_targets_mean": 4377.5,
"valid_targets_min": 1251
},
{
"epoch": 1.5271199388846448,
"grad_norm": 0.6576858777363869,
"learning_rate": 3.833312950453981e-05,
"loss": 0.558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18086987733840942,
"step": 1000,
"valid_targets_mean": 2679.1,
"valid_targets_min": 980
},
{
"epoch": 1.53475935828877,
"grad_norm": 0.6264938830245572,
"learning_rate": 3.830256484445562e-05,
"loss": 0.5231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24808485805988312,
"step": 1005,
"valid_targets_mean": 3809.2,
"valid_targets_min": 1573
},
{
"epoch": 1.5423987776928954,
"grad_norm": 0.6947851643347049,
"learning_rate": 3.827173491156228e-05,
"loss": 0.5597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3576025068759918,
"step": 1010,
"valid_targets_mean": 3728.4,
"valid_targets_min": 1797
},
{
"epoch": 1.5500381970970207,
"grad_norm": 0.6065532261217823,
"learning_rate": 3.824064015270116e-05,
"loss": 0.5225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29614564776420593,
"step": 1015,
"valid_targets_mean": 3743.4,
"valid_targets_min": 605
},
{
"epoch": 1.557677616501146,
"grad_norm": 0.737923563809332,
"learning_rate": 3.820928101855193e-05,
"loss": 0.5736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3168005049228668,
"step": 1020,
"valid_targets_mean": 2394.5,
"valid_targets_min": 817
},
{
"epoch": 1.565317035905271,
"grad_norm": 0.692425445994189,
"learning_rate": 3.817765796362606e-05,
"loss": 0.518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30288469791412354,
"step": 1025,
"valid_targets_mean": 3822.5,
"valid_targets_min": 1556
},
{
"epoch": 1.5729564553093964,
"grad_norm": 0.7094886326492358,
"learning_rate": 3.814577144626021e-05,
"loss": 0.5404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22933900356292725,
"step": 1030,
"valid_targets_mean": 2317.1,
"valid_targets_min": 966
},
{
"epoch": 1.5805958747135218,
"grad_norm": 0.7336132414342458,
"learning_rate": 3.811362192860962e-05,
"loss": 0.5613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.260783851146698,
"step": 1035,
"valid_targets_mean": 2234.9,
"valid_targets_min": 994
},
{
"epoch": 1.5882352941176472,
"grad_norm": 0.6472450868846049,
"learning_rate": 3.808120987664137e-05,
"loss": 0.5421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3125843405723572,
"step": 1040,
"valid_targets_mean": 3125.6,
"valid_targets_min": 1001
},
{
"epoch": 1.5958747135217723,
"grad_norm": 0.6464488415033857,
"learning_rate": 3.804853576012767e-05,
"loss": 0.5357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17949353158473969,
"step": 1045,
"valid_targets_mean": 2726.9,
"valid_targets_min": 772
},
{
"epoch": 1.6035141329258975,
"grad_norm": 0.6816461927909948,
"learning_rate": 3.8015600052638994e-05,
"loss": 0.5328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2890270948410034,
"step": 1050,
"valid_targets_mean": 2916.8,
"valid_targets_min": 1128
},
{
"epoch": 1.6111535523300229,
"grad_norm": 0.7078659804169987,
"learning_rate": 3.798240323153729e-05,
"loss": 0.5186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2691645324230194,
"step": 1055,
"valid_targets_mean": 2478.0,
"valid_targets_min": 1475
},
{
"epoch": 1.6187929717341483,
"grad_norm": 0.5989882393105532,
"learning_rate": 3.7948945777968986e-05,
"loss": 0.5433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26992538571357727,
"step": 1060,
"valid_targets_mean": 3086.0,
"valid_targets_min": 1187
},
{
"epoch": 1.6264323911382736,
"grad_norm": 0.7037135548541353,
"learning_rate": 3.7915228176858076e-05,
"loss": 0.5291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1986842006444931,
"step": 1065,
"valid_targets_mean": 2687.5,
"valid_targets_min": 949
},
{
"epoch": 1.6340718105423988,
"grad_norm": 0.6048821928261803,
"learning_rate": 3.788125091689906e-05,
"loss": 0.5656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23728778958320618,
"step": 1070,
"valid_targets_mean": 3255.9,
"valid_targets_min": 761
},
{
"epoch": 1.641711229946524,
"grad_norm": 0.5355816192539666,
"learning_rate": 3.7847014490549865e-05,
"loss": 0.5188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24673610925674438,
"step": 1075,
"valid_targets_mean": 4140.5,
"valid_targets_min": 1148
},
{
"epoch": 1.6493506493506493,
"grad_norm": 0.636731420373111,
"learning_rate": 3.7812519394024714e-05,
"loss": 0.5173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28254377841949463,
"step": 1080,
"valid_targets_mean": 4065.0,
"valid_targets_min": 1622
},
{
"epoch": 1.6569900687547747,
"grad_norm": 0.584619470678609,
"learning_rate": 3.777776612728693e-05,
"loss": 0.5399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24916572868824005,
"step": 1085,
"valid_targets_mean": 3729.6,
"valid_targets_min": 1112
},
{
"epoch": 1.6646294881588999,
"grad_norm": 0.6309053969396224,
"learning_rate": 3.77427551940417e-05,
"loss": 0.5159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24699068069458008,
"step": 1090,
"valid_targets_mean": 3228.4,
"valid_targets_min": 1303
},
{
"epoch": 1.6722689075630253,
"grad_norm": 0.6306346754741646,
"learning_rate": 3.770748710172874e-05,
"loss": 0.5214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23530437052249908,
"step": 1095,
"valid_targets_mean": 3177.8,
"valid_targets_min": 1167
},
{
"epoch": 1.6799083269671504,
"grad_norm": 0.6802201791843018,
"learning_rate": 3.7671962361515e-05,
"loss": 0.5302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31233322620391846,
"step": 1100,
"valid_targets_mean": 3288.9,
"valid_targets_min": 856
},
{
"epoch": 1.6875477463712758,
"grad_norm": 0.7477194331243122,
"learning_rate": 3.76361814882872e-05,
"loss": 0.516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23209503293037415,
"step": 1105,
"valid_targets_mean": 2395.2,
"valid_targets_min": 911
},
{
"epoch": 1.6951871657754012,
"grad_norm": 0.6286405393933542,
"learning_rate": 3.760014500064437e-05,
"loss": 0.5525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3077746331691742,
"step": 1110,
"valid_targets_mean": 4294.1,
"valid_targets_min": 797
},
{
"epoch": 1.7028265851795263,
"grad_norm": 0.6815312970337704,
"learning_rate": 3.75638534208904e-05,
"loss": 0.5417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21405085921287537,
"step": 1115,
"valid_targets_mean": 2392.6,
"valid_targets_min": 849
},
{
"epoch": 1.7104660045836515,
"grad_norm": 0.5689062532951552,
"learning_rate": 3.7527307275026375e-05,
"loss": 0.4856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.196921706199646,
"step": 1120,
"valid_targets_mean": 3016.2,
"valid_targets_min": 705
},
{
"epoch": 1.7181054239877769,
"grad_norm": 0.4857698883011697,
"learning_rate": 3.749050709274303e-05,
"loss": 0.5104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22700002789497375,
"step": 1125,
"valid_targets_mean": 4638.6,
"valid_targets_min": 1595
},
{
"epoch": 1.7257448433919023,
"grad_norm": 0.6172079732872118,
"learning_rate": 3.7453453407413017e-05,
"loss": 0.5307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24322380125522614,
"step": 1130,
"valid_targets_mean": 2821.2,
"valid_targets_min": 1323
},
{
"epoch": 1.7333842627960276,
"grad_norm": 0.6090536328384808,
"learning_rate": 3.7416146756083206e-05,
"loss": 0.5621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2388569712638855,
"step": 1135,
"valid_targets_mean": 3844.5,
"valid_targets_min": 1783
},
{
"epoch": 1.7410236822001528,
"grad_norm": 0.5783456560647274,
"learning_rate": 3.7378587679466905e-05,
"loss": 0.5091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17862531542778015,
"step": 1140,
"valid_targets_mean": 3060.9,
"valid_targets_min": 906
},
{
"epoch": 1.748663101604278,
"grad_norm": 0.5769716592236767,
"learning_rate": 3.7340776721936e-05,
"loss": 0.5564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37400296330451965,
"step": 1145,
"valid_targets_mean": 4793.1,
"valid_targets_min": 2782
},
{
"epoch": 1.7563025210084033,
"grad_norm": 0.5706577300432857,
"learning_rate": 3.730271443151307e-05,
"loss": 0.5301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25871527194976807,
"step": 1150,
"valid_targets_mean": 3715.6,
"valid_targets_min": 1506
},
{
"epoch": 1.7639419404125287,
"grad_norm": 0.7272691515910408,
"learning_rate": 3.726440135986346e-05,
"loss": 0.5295,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2796229422092438,
"step": 1155,
"valid_targets_mean": 2538.6,
"valid_targets_min": 1183
},
{
"epoch": 1.771581359816654,
"grad_norm": 0.6317299325267872,
"learning_rate": 3.722583806228727e-05,
"loss": 0.5332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30438125133514404,
"step": 1160,
"valid_targets_mean": 3455.2,
"valid_targets_min": 1715
},
{
"epoch": 1.7792207792207793,
"grad_norm": 0.6091979304515164,
"learning_rate": 3.7187025097711325e-05,
"loss": 0.5465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19755399227142334,
"step": 1165,
"valid_targets_mean": 2997.4,
"valid_targets_min": 1016
},
{
"epoch": 1.7868601986249044,
"grad_norm": 0.7220416396847499,
"learning_rate": 3.714796302868105e-05,
"loss": 0.5383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3491123914718628,
"step": 1170,
"valid_targets_mean": 3392.4,
"valid_targets_min": 1653
},
{
"epoch": 1.7944996180290298,
"grad_norm": 0.5964619045278258,
"learning_rate": 3.710865242135231e-05,
"loss": 0.5371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24358564615249634,
"step": 1175,
"valid_targets_mean": 3734.4,
"valid_targets_min": 748
},
{
"epoch": 1.8021390374331552,
"grad_norm": 0.5873635920467295,
"learning_rate": 3.7069093845483265e-05,
"loss": 0.5058,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24197137355804443,
"step": 1180,
"valid_targets_mean": 3604.4,
"valid_targets_min": 1006
},
{
"epoch": 1.8097784568372803,
"grad_norm": 0.6984507077197806,
"learning_rate": 3.702928787442603e-05,
"loss": 0.506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37548327445983887,
"step": 1185,
"valid_targets_mean": 3504.6,
"valid_targets_min": 711
},
{
"epoch": 1.8174178762414055,
"grad_norm": 0.7830323580644593,
"learning_rate": 3.698923508511843e-05,
"loss": 0.5523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2729473412036896,
"step": 1190,
"valid_targets_mean": 2126.0,
"valid_targets_min": 651
},
{
"epoch": 1.8250572956455309,
"grad_norm": 0.5967750220721146,
"learning_rate": 3.69489360580756e-05,
"loss": 0.509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21153341233730316,
"step": 1195,
"valid_targets_mean": 3077.9,
"valid_targets_min": 253
},
{
"epoch": 1.8326967150496563,
"grad_norm": 0.5605236353838795,
"learning_rate": 3.690839137738159e-05,
"loss": 0.4913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2955290675163269,
"step": 1200,
"valid_targets_mean": 4730.1,
"valid_targets_min": 1271
},
{
"epoch": 1.8403361344537816,
"grad_norm": 0.6085256947878469,
"learning_rate": 3.6867601630680866e-05,
"loss": 0.555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29254335165023804,
"step": 1205,
"valid_targets_mean": 4159.6,
"valid_targets_min": 1517
},
{
"epoch": 1.8479755538579068,
"grad_norm": 0.7044349997653415,
"learning_rate": 3.682656740916986e-05,
"loss": 0.5505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3043631911277771,
"step": 1210,
"valid_targets_mean": 3770.8,
"valid_targets_min": 1189
},
{
"epoch": 1.855614973262032,
"grad_norm": 0.6550764600527469,
"learning_rate": 3.678528930758834e-05,
"loss": 0.5594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3247641623020172,
"step": 1215,
"valid_targets_mean": 3556.6,
"valid_targets_min": 1037
},
{
"epoch": 1.8632543926661573,
"grad_norm": 0.7190327175451237,
"learning_rate": 3.674376792421081e-05,
"loss": 0.5401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3061503469944,
"step": 1220,
"valid_targets_mean": 2849.2,
"valid_targets_min": 701
},
{
"epoch": 1.8708938120702827,
"grad_norm": 0.6887939667732077,
"learning_rate": 3.670200386083784e-05,
"loss": 0.5286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3267863392829895,
"step": 1225,
"valid_targets_mean": 3191.8,
"valid_targets_min": 719
},
{
"epoch": 1.878533231474408,
"grad_norm": 0.6379586545313669,
"learning_rate": 3.665999772278736e-05,
"loss": 0.5662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.39808523654937744,
"step": 1230,
"valid_targets_mean": 4236.0,
"valid_targets_min": 925
},
{
"epoch": 1.8861726508785333,
"grad_norm": 0.6902444540079928,
"learning_rate": 3.661775011888584e-05,
"loss": 0.5345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24210360646247864,
"step": 1235,
"valid_targets_mean": 3590.6,
"valid_targets_min": 2191
},
{
"epoch": 1.8938120702826584,
"grad_norm": 0.6622678829508013,
"learning_rate": 3.657526166145952e-05,
"loss": 0.4882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25689786672592163,
"step": 1240,
"valid_targets_mean": 2681.5,
"valid_targets_min": 1016
},
{
"epoch": 1.9014514896867838,
"grad_norm": 0.6762001298834552,
"learning_rate": 3.65325329663255e-05,
"loss": 0.5019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23240089416503906,
"step": 1245,
"valid_targets_mean": 3059.0,
"valid_targets_min": 943
},
{
"epoch": 1.9090909090909092,
"grad_norm": 0.7264235125054589,
"learning_rate": 3.648956465278284e-05,
"loss": 0.5196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22812113165855408,
"step": 1250,
"valid_targets_mean": 2430.2,
"valid_targets_min": 515
},
{
"epoch": 1.9167303284950343,
"grad_norm": 0.6846670975363754,
"learning_rate": 3.6446357343603536e-05,
"loss": 0.5425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2963109612464905,
"step": 1255,
"valid_targets_mean": 3483.8,
"valid_targets_min": 958
},
{
"epoch": 1.9243697478991597,
"grad_norm": 0.727888807975606,
"learning_rate": 3.6402911665023565e-05,
"loss": 0.5057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29520994424819946,
"step": 1260,
"valid_targets_mean": 3465.0,
"valid_targets_min": 1320
},
{
"epoch": 1.9320091673032849,
"grad_norm": 0.6640837422377913,
"learning_rate": 3.6359228246733744e-05,
"loss": 0.5472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34408777952194214,
"step": 1265,
"valid_targets_mean": 4042.9,
"valid_targets_min": 1297
},
{
"epoch": 1.9396485867074102,
"grad_norm": 0.6476482043969682,
"learning_rate": 3.631530772187065e-05,
"loss": 0.5313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2760136127471924,
"step": 1270,
"valid_targets_mean": 3540.1,
"valid_targets_min": 1170
},
{
"epoch": 1.9472880061115356,
"grad_norm": 0.6467092573010441,
"learning_rate": 3.627115072700741e-05,
"loss": 0.4999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32210585474967957,
"step": 1275,
"valid_targets_mean": 3878.0,
"valid_targets_min": 1552
},
{
"epoch": 1.9549274255156608,
"grad_norm": 0.5803166137506185,
"learning_rate": 3.6226757902144495e-05,
"loss": 0.5491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33720919489860535,
"step": 1280,
"valid_targets_mean": 4619.9,
"valid_targets_min": 919
},
{
"epoch": 1.962566844919786,
"grad_norm": 0.5328390011256504,
"learning_rate": 3.618212989070043e-05,
"loss": 0.513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18014609813690186,
"step": 1285,
"valid_targets_mean": 3435.1,
"valid_targets_min": 2096
},
{
"epoch": 1.9702062643239113,
"grad_norm": 0.6854626615968217,
"learning_rate": 3.613726733950248e-05,
"loss": 0.5191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34878984093666077,
"step": 1290,
"valid_targets_mean": 3824.2,
"valid_targets_min": 806
},
{
"epoch": 1.9778456837280367,
"grad_norm": 0.5949832136294794,
"learning_rate": 3.609217089877728e-05,
"loss": 0.5531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1724492311477661,
"step": 1295,
"valid_targets_mean": 2781.6,
"valid_targets_min": 820
},
{
"epoch": 1.985485103132162,
"grad_norm": 0.8455545653427853,
"learning_rate": 3.604684122214138e-05,
"loss": 0.5478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2157420665025711,
"step": 1300,
"valid_targets_mean": 1768.0,
"valid_targets_min": 847
},
{
"epoch": 1.9931245225362872,
"grad_norm": 0.6959760784864205,
"learning_rate": 3.600127896659181e-05,
"loss": 0.5442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2532881200313568,
"step": 1305,
"valid_targets_mean": 2938.0,
"valid_targets_min": 1062
},
{
"epoch": 2.0,
"grad_norm": 0.9358773564606009,
"learning_rate": 3.5955484792496536e-05,
"loss": 0.4938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5185206532478333,
"step": 1310,
"valid_targets_mean": 3101.2,
"valid_targets_min": 1261
},
{
"epoch": 2.0076394194041254,
"grad_norm": 0.5317421829410245,
"learning_rate": 3.5909459363584895e-05,
"loss": 0.4783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2319856882095337,
"step": 1315,
"valid_targets_mean": 4424.4,
"valid_targets_min": 1783
},
{
"epoch": 2.0152788388082508,
"grad_norm": 0.7259614209577792,
"learning_rate": 3.5863203346937974e-05,
"loss": 0.4646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2661840319633484,
"step": 1320,
"valid_targets_mean": 3145.4,
"valid_targets_min": 882
},
{
"epoch": 2.0229182582123757,
"grad_norm": 0.6866135582932625,
"learning_rate": 3.5816717412978935e-05,
"loss": 0.4872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.274208664894104,
"step": 1325,
"valid_targets_mean": 4005.1,
"valid_targets_min": 1327
},
{
"epoch": 2.030557677616501,
"grad_norm": 0.6107569519174747,
"learning_rate": 3.577000223546331e-05,
"loss": 0.4855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2812064290046692,
"step": 1330,
"valid_targets_mean": 4395.8,
"valid_targets_min": 926
},
{
"epoch": 2.0381970970206265,
"grad_norm": 0.5841200969185655,
"learning_rate": 3.5723058491469226e-05,
"loss": 0.4616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18964403867721558,
"step": 1335,
"valid_targets_mean": 2951.0,
"valid_targets_min": 821
},
{
"epoch": 2.045836516424752,
"grad_norm": 0.7731622386210697,
"learning_rate": 3.56758868613876e-05,
"loss": 0.5099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22586776316165924,
"step": 1340,
"valid_targets_mean": 2463.9,
"valid_targets_min": 455
},
{
"epoch": 2.053475935828877,
"grad_norm": 0.8201482091316316,
"learning_rate": 3.5628488028912284e-05,
"loss": 0.5191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2765929102897644,
"step": 1345,
"valid_targets_mean": 2273.8,
"valid_targets_min": 976
},
{
"epoch": 2.061115355233002,
"grad_norm": 0.7559956865117078,
"learning_rate": 3.558086268103011e-05,
"loss": 0.4767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2768942713737488,
"step": 1350,
"valid_targets_mean": 3333.4,
"valid_targets_min": 1265
},
{
"epoch": 2.0687547746371275,
"grad_norm": 0.7010684764079771,
"learning_rate": 3.5533011508011e-05,
"loss": 0.4833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20257258415222168,
"step": 1355,
"valid_targets_mean": 3312.2,
"valid_targets_min": 407
},
{
"epoch": 2.076394194041253,
"grad_norm": 0.660599060190917,
"learning_rate": 3.548493520339792e-05,
"loss": 0.5111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21439898014068604,
"step": 1360,
"valid_targets_mean": 2463.9,
"valid_targets_min": 769
},
{
"epoch": 2.0840336134453783,
"grad_norm": 0.7722765277601109,
"learning_rate": 3.5436634463996834e-05,
"loss": 0.507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2662246823310852,
"step": 1365,
"valid_targets_mean": 2362.0,
"valid_targets_min": 1098
},
{
"epoch": 2.0916730328495032,
"grad_norm": 0.6657604945302164,
"learning_rate": 3.538810998986661e-05,
"loss": 0.5495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2910098731517792,
"step": 1370,
"valid_targets_mean": 3378.8,
"valid_targets_min": 565
},
{
"epoch": 2.0993124522536286,
"grad_norm": 0.6146058220275632,
"learning_rate": 3.533936248430887e-05,
"loss": 0.5278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2327723503112793,
"step": 1375,
"valid_targets_mean": 3400.5,
"valid_targets_min": 1404
},
{
"epoch": 2.106951871657754,
"grad_norm": 0.6323389179006582,
"learning_rate": 3.52903926538578e-05,
"loss": 0.4977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18094557523727417,
"step": 1380,
"valid_targets_mean": 3219.0,
"valid_targets_min": 1275
},
{
"epoch": 2.1145912910618794,
"grad_norm": 0.6714237005424043,
"learning_rate": 3.524120120826991e-05,
"loss": 0.5114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.261186420917511,
"step": 1385,
"valid_targets_mean": 2986.6,
"valid_targets_min": 644
},
{
"epoch": 2.1222307104660048,
"grad_norm": 0.7168232477241365,
"learning_rate": 3.519178886051374e-05,
"loss": 0.4868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24357938766479492,
"step": 1390,
"valid_targets_mean": 3561.8,
"valid_targets_min": 1220
},
{
"epoch": 2.1298701298701297,
"grad_norm": 0.7179444771168448,
"learning_rate": 3.514215632675953e-05,
"loss": 0.4773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2347637414932251,
"step": 1395,
"valid_targets_mean": 3083.2,
"valid_targets_min": 760
},
{
"epoch": 2.137509549274255,
"grad_norm": 0.8502474110018483,
"learning_rate": 3.509230432636884e-05,
"loss": 0.5114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30212515592575073,
"step": 1400,
"valid_targets_mean": 2405.1,
"valid_targets_min": 835
},
{
"epoch": 2.1451489686783805,
"grad_norm": 0.619094616956861,
"learning_rate": 3.504223358188414e-05,
"loss": 0.4978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3284362554550171,
"step": 1405,
"valid_targets_mean": 4827.5,
"valid_targets_min": 1327
},
{
"epoch": 2.152788388082506,
"grad_norm": 0.7128343442681825,
"learning_rate": 3.4991944819018295e-05,
"loss": 0.4943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23888735473155975,
"step": 1410,
"valid_targets_mean": 3042.6,
"valid_targets_min": 1196
},
{
"epoch": 2.160427807486631,
"grad_norm": 0.5834794683505667,
"learning_rate": 3.4941438766644094e-05,
"loss": 0.4697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22566252946853638,
"step": 1415,
"valid_targets_mean": 4167.9,
"valid_targets_min": 600
},
{
"epoch": 2.168067226890756,
"grad_norm": 0.5505262571807923,
"learning_rate": 3.489071615678366e-05,
"loss": 0.4957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29685625433921814,
"step": 1420,
"valid_targets_mean": 5135.1,
"valid_targets_min": 1375
},
{
"epoch": 2.1757066462948815,
"grad_norm": 0.6704037109861748,
"learning_rate": 3.483977772459786e-05,
"loss": 0.4863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3806396424770355,
"step": 1425,
"valid_targets_mean": 4908.2,
"valid_targets_min": 699
},
{
"epoch": 2.183346065699007,
"grad_norm": 0.6015955329730339,
"learning_rate": 3.478862420837561e-05,
"loss": 0.4905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22024193406105042,
"step": 1430,
"valid_targets_mean": 3537.0,
"valid_targets_min": 1174
},
{
"epoch": 2.1909854851031323,
"grad_norm": 0.8149409610415594,
"learning_rate": 3.473725634952321e-05,
"loss": 0.5062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24890246987342834,
"step": 1435,
"valid_targets_mean": 2094.8,
"valid_targets_min": 679
},
{
"epoch": 2.1986249045072572,
"grad_norm": 0.729224011887746,
"learning_rate": 3.4685674892553604e-05,
"loss": 0.4551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2595076262950897,
"step": 1440,
"valid_targets_mean": 3288.8,
"valid_targets_min": 625
},
{
"epoch": 2.2062643239113826,
"grad_norm": 0.6441248015278864,
"learning_rate": 3.463388058507556e-05,
"loss": 0.4455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1921394020318985,
"step": 1445,
"valid_targets_mean": 2419.9,
"valid_targets_min": 949
},
{
"epoch": 2.213903743315508,
"grad_norm": 0.6762838196132268,
"learning_rate": 3.458187417778284e-05,
"loss": 0.4922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27211958169937134,
"step": 1450,
"valid_targets_mean": 3996.0,
"valid_targets_min": 1182
},
{
"epoch": 2.2215431627196334,
"grad_norm": 0.6261428817660788,
"learning_rate": 3.452965642444334e-05,
"loss": 0.4853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1550438106060028,
"step": 1455,
"valid_targets_mean": 2566.4,
"valid_targets_min": 884
},
{
"epoch": 2.2291825821237587,
"grad_norm": 0.7408606958154191,
"learning_rate": 3.447722808188816e-05,
"loss": 0.4831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18380820751190186,
"step": 1460,
"valid_targets_mean": 2003.5,
"valid_targets_min": 698
},
{
"epoch": 2.2368220015278837,
"grad_norm": 0.7861802803128333,
"learning_rate": 3.442458991000062e-05,
"loss": 0.5236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2023487538099289,
"step": 1465,
"valid_targets_mean": 1830.8,
"valid_targets_min": 737
},
{
"epoch": 2.244461420932009,
"grad_norm": 0.7124589412998297,
"learning_rate": 3.437174267170524e-05,
"loss": 0.5182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2585378885269165,
"step": 1470,
"valid_targets_mean": 2549.2,
"valid_targets_min": 438
},
{
"epoch": 2.2521008403361344,
"grad_norm": 0.6812098409271231,
"learning_rate": 3.4318687132956714e-05,
"loss": 0.4896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2898828387260437,
"step": 1475,
"valid_targets_mean": 4216.2,
"valid_targets_min": 1290
},
{
"epoch": 2.25974025974026,
"grad_norm": 0.7132327272659739,
"learning_rate": 3.426542406272879e-05,
"loss": 0.4805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22709037363529205,
"step": 1480,
"valid_targets_mean": 2697.4,
"valid_targets_min": 796
},
{
"epoch": 2.267379679144385,
"grad_norm": 0.7185720305215236,
"learning_rate": 3.4211954233003115e-05,
"loss": 0.5131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2051008939743042,
"step": 1485,
"valid_targets_mean": 2768.2,
"valid_targets_min": 750
},
{
"epoch": 2.27501909854851,
"grad_norm": 0.7435166801422771,
"learning_rate": 3.415827841875807e-05,
"loss": 0.4764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28377318382263184,
"step": 1490,
"valid_targets_mean": 3350.2,
"valid_targets_min": 1131
},
{
"epoch": 2.2826585179526355,
"grad_norm": 0.6818694893959436,
"learning_rate": 3.4104397397957495e-05,
"loss": 0.5384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2481977641582489,
"step": 1495,
"valid_targets_mean": 3382.8,
"valid_targets_min": 1961
},
{
"epoch": 2.290297937356761,
"grad_norm": 0.6664430457664224,
"learning_rate": 3.405031195153949e-05,
"loss": 0.4798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2219395637512207,
"step": 1500,
"valid_targets_mean": 2843.5,
"valid_targets_min": 650
},
{
"epoch": 2.2979373567608863,
"grad_norm": 0.52820138423304,
"learning_rate": 3.399602286340503e-05,
"loss": 0.4687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22768482565879822,
"step": 1505,
"valid_targets_mean": 5526.1,
"valid_targets_min": 1584
},
{
"epoch": 2.3055767761650117,
"grad_norm": 0.7120542733941014,
"learning_rate": 3.394153092040658e-05,
"loss": 0.5092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29083842039108276,
"step": 1510,
"valid_targets_mean": 3225.1,
"valid_targets_min": 901
},
{
"epoch": 2.3132161955691366,
"grad_norm": 0.6870040097106018,
"learning_rate": 3.3886836912336796e-05,
"loss": 0.5131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23260729014873505,
"step": 1515,
"valid_targets_mean": 2770.1,
"valid_targets_min": 859
},
{
"epoch": 2.320855614973262,
"grad_norm": 0.7055648665859806,
"learning_rate": 3.383194163191698e-05,
"loss": 0.475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26753556728363037,
"step": 1520,
"valid_targets_mean": 3388.2,
"valid_targets_min": 885
},
{
"epoch": 2.3284950343773874,
"grad_norm": 0.7916496584586002,
"learning_rate": 3.3776845874785624e-05,
"loss": 0.5013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2454243004322052,
"step": 1525,
"valid_targets_mean": 2547.4,
"valid_targets_min": 1427
},
{
"epoch": 2.3361344537815127,
"grad_norm": 0.7908259705075075,
"learning_rate": 3.37215504394869e-05,
"loss": 0.4798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2940301299095154,
"step": 1530,
"valid_targets_mean": 3533.6,
"valid_targets_min": 703
},
{
"epoch": 2.343773873185638,
"grad_norm": 0.6546979140910963,
"learning_rate": 3.366605612745906e-05,
"loss": 0.4925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26727956533432007,
"step": 1535,
"valid_targets_mean": 3162.8,
"valid_targets_min": 919
},
{
"epoch": 2.351413292589763,
"grad_norm": 0.6783177043359304,
"learning_rate": 3.3610363743022795e-05,
"loss": 0.4864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21130970120429993,
"step": 1540,
"valid_targets_mean": 3205.9,
"valid_targets_min": 1889
},
{
"epoch": 2.3590527119938884,
"grad_norm": 0.6555047268489784,
"learning_rate": 3.3554474093369656e-05,
"loss": 0.5,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31021979451179504,
"step": 1545,
"valid_targets_mean": 3555.1,
"valid_targets_min": 719
},
{
"epoch": 2.366692131398014,
"grad_norm": 0.7305711433653311,
"learning_rate": 3.349838798855027e-05,
"loss": 0.5091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.331775963306427,
"step": 1550,
"valid_targets_mean": 3734.6,
"valid_targets_min": 411
},
{
"epoch": 2.374331550802139,
"grad_norm": 0.559575508819546,
"learning_rate": 3.3442106241462645e-05,
"loss": 0.4559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19253335893154144,
"step": 1555,
"valid_targets_mean": 2387.5,
"valid_targets_min": 688
},
{
"epoch": 2.381970970206264,
"grad_norm": 0.7849640314141061,
"learning_rate": 3.338562966784038e-05,
"loss": 0.5004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22845134139060974,
"step": 1560,
"valid_targets_mean": 2045.8,
"valid_targets_min": 721
},
{
"epoch": 2.3896103896103895,
"grad_norm": 0.8097550048727009,
"learning_rate": 3.3328959086240876e-05,
"loss": 0.494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21622112393379211,
"step": 1565,
"valid_targets_mean": 2250.2,
"valid_targets_min": 658
},
{
"epoch": 2.397249809014515,
"grad_norm": 0.6803709574881871,
"learning_rate": 3.3272095318033376e-05,
"loss": 0.519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2511165738105774,
"step": 1570,
"valid_targets_mean": 2622.2,
"valid_targets_min": 869
},
{
"epoch": 2.4048892284186403,
"grad_norm": 0.6712742285853818,
"learning_rate": 3.321503918738716e-05,
"loss": 0.4903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16048851609230042,
"step": 1575,
"valid_targets_mean": 2250.4,
"valid_targets_min": 1503
},
{
"epoch": 2.4125286478227657,
"grad_norm": 0.677457396605636,
"learning_rate": 3.315779152125955e-05,
"loss": 0.4936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17943637073040009,
"step": 1580,
"valid_targets_mean": 1933.6,
"valid_targets_min": 918
},
{
"epoch": 2.4201680672268906,
"grad_norm": 0.5901481064339373,
"learning_rate": 3.310035314938394e-05,
"loss": 0.4993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22970394790172577,
"step": 1585,
"valid_targets_mean": 3705.9,
"valid_targets_min": 1259
},
{
"epoch": 2.427807486631016,
"grad_norm": 0.5963861967566215,
"learning_rate": 3.304272490425777e-05,
"loss": 0.4882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2982090711593628,
"step": 1590,
"valid_targets_mean": 5054.9,
"valid_targets_min": 1108
},
{
"epoch": 2.4354469060351414,
"grad_norm": 0.7130398946256007,
"learning_rate": 3.2984907621130435e-05,
"loss": 0.5389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35128599405288696,
"step": 1595,
"valid_targets_mean": 3656.8,
"valid_targets_min": 1166
},
{
"epoch": 2.4430863254392667,
"grad_norm": 0.6176299158495442,
"learning_rate": 3.292690213799122e-05,
"loss": 0.5318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24622666835784912,
"step": 1600,
"valid_targets_mean": 3358.4,
"valid_targets_min": 888
},
{
"epoch": 2.4507257448433917,
"grad_norm": 0.5981587869828613,
"learning_rate": 3.286870929555713e-05,
"loss": 0.5288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2027554214000702,
"step": 1605,
"valid_targets_mean": 3590.0,
"valid_targets_min": 1349
},
{
"epoch": 2.458365164247517,
"grad_norm": 0.5744990440096281,
"learning_rate": 3.281032993726071e-05,
"loss": 0.4947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1916375458240509,
"step": 1610,
"valid_targets_mean": 3543.8,
"valid_targets_min": 1484
},
{
"epoch": 2.4660045836516424,
"grad_norm": 0.7430996004414889,
"learning_rate": 3.275176490923781e-05,
"loss": 0.4733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26889270544052124,
"step": 1615,
"valid_targets_mean": 3089.4,
"valid_targets_min": 701
},
{
"epoch": 2.473644003055768,
"grad_norm": 0.7037506079471908,
"learning_rate": 3.269301506031534e-05,
"loss": 0.4731,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25602343678474426,
"step": 1620,
"valid_targets_mean": 2495.0,
"valid_targets_min": 778
},
{
"epoch": 2.481283422459893,
"grad_norm": 0.5842797711033675,
"learning_rate": 3.2634081241998954e-05,
"loss": 0.5177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2861538231372833,
"step": 1625,
"valid_targets_mean": 5589.2,
"valid_targets_min": 2931
},
{
"epoch": 2.488922841864018,
"grad_norm": 0.7575350211022752,
"learning_rate": 3.257496430846071e-05,
"loss": 0.525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2269067019224167,
"step": 1630,
"valid_targets_mean": 2871.0,
"valid_targets_min": 735
},
{
"epoch": 2.4965622612681435,
"grad_norm": 0.6181133672275352,
"learning_rate": 3.251566511652669e-05,
"loss": 0.4685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24582752585411072,
"step": 1635,
"valid_targets_mean": 3053.4,
"valid_targets_min": 878
},
{
"epoch": 2.504201680672269,
"grad_norm": 0.64742145917169,
"learning_rate": 3.245618452566461e-05,
"loss": 0.4816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3426717519760132,
"step": 1640,
"valid_targets_mean": 4025.6,
"valid_targets_min": 1175
},
{
"epoch": 2.5118411000763943,
"grad_norm": 0.6635442839695538,
"learning_rate": 3.23965233979713e-05,
"loss": 0.5,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17027682065963745,
"step": 1645,
"valid_targets_mean": 2165.4,
"valid_targets_min": 1113
},
{
"epoch": 2.5194805194805197,
"grad_norm": 0.5660316698532355,
"learning_rate": 3.233668259816026e-05,
"loss": 0.5077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22779259085655212,
"step": 1650,
"valid_targets_mean": 4539.5,
"valid_targets_min": 930
},
{
"epoch": 2.5271199388846446,
"grad_norm": 0.6224770591422036,
"learning_rate": 3.227666299354912e-05,
"loss": 0.5,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22263994812965393,
"step": 1655,
"valid_targets_mean": 3727.9,
"valid_targets_min": 1163
},
{
"epoch": 2.53475935828877,
"grad_norm": 0.6907752213015932,
"learning_rate": 3.221646545404706e-05,
"loss": 0.506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3159465193748474,
"step": 1660,
"valid_targets_mean": 4150.0,
"valid_targets_min": 1808
},
{
"epoch": 2.5423987776928954,
"grad_norm": 0.7191273755219711,
"learning_rate": 3.21560908521422e-05,
"loss": 0.4704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25996077060699463,
"step": 1665,
"valid_targets_mean": 2863.5,
"valid_targets_min": 885
},
{
"epoch": 2.5500381970970207,
"grad_norm": 0.680261011638979,
"learning_rate": 3.209554006288895e-05,
"loss": 0.4741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3104439377784729,
"step": 1670,
"valid_targets_mean": 4482.5,
"valid_targets_min": 1247
},
{
"epoch": 2.557677616501146,
"grad_norm": 0.6432998240930168,
"learning_rate": 3.203481396389535e-05,
"loss": 0.5118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2836974263191223,
"step": 1675,
"valid_targets_mean": 3161.0,
"valid_targets_min": 893
},
{
"epoch": 2.565317035905271,
"grad_norm": 0.6448940137147883,
"learning_rate": 3.1973913435310335e-05,
"loss": 0.4825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20341014862060547,
"step": 1680,
"valid_targets_mean": 2595.0,
"valid_targets_min": 1027
},
{
"epoch": 2.5729564553093964,
"grad_norm": 0.6826751568198045,
"learning_rate": 3.1912839359810974e-05,
"loss": 0.5003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23161211609840393,
"step": 1685,
"valid_targets_mean": 2430.1,
"valid_targets_min": 1225
},
{
"epoch": 2.580595874713522,
"grad_norm": 0.704783143383557,
"learning_rate": 3.185159262258967e-05,
"loss": 0.4805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29678064584732056,
"step": 1690,
"valid_targets_mean": 3600.0,
"valid_targets_min": 1446
},
{
"epoch": 2.588235294117647,
"grad_norm": 0.5753956792109161,
"learning_rate": 3.179017411134137e-05,
"loss": 0.4918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.268524706363678,
"step": 1695,
"valid_targets_mean": 4652.6,
"valid_targets_min": 1717
},
{
"epoch": 2.5958747135217726,
"grad_norm": 0.7042435298107268,
"learning_rate": 3.172858471625065e-05,
"loss": 0.4995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21800410747528076,
"step": 1700,
"valid_targets_mean": 2551.8,
"valid_targets_min": 695
},
{
"epoch": 2.6035141329258975,
"grad_norm": 0.6748037272112359,
"learning_rate": 3.166682532997883e-05,
"loss": 0.4978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30926668643951416,
"step": 1705,
"valid_targets_mean": 4062.9,
"valid_targets_min": 1157
},
{
"epoch": 2.611153552330023,
"grad_norm": 0.6581058243085496,
"learning_rate": 3.160489684765105e-05,
"loss": 0.4732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15238752961158752,
"step": 1710,
"valid_targets_mean": 2951.8,
"valid_targets_min": 997
},
{
"epoch": 2.6187929717341483,
"grad_norm": 0.5961485901668413,
"learning_rate": 3.154280016684329e-05,
"loss": 0.4727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28147566318511963,
"step": 1715,
"valid_targets_mean": 4090.0,
"valid_targets_min": 1696
},
{
"epoch": 2.6264323911382736,
"grad_norm": 0.6635627417191078,
"learning_rate": 3.148053618756936e-05,
"loss": 0.4939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27265307307243347,
"step": 1720,
"valid_targets_mean": 3721.9,
"valid_targets_min": 1634
},
{
"epoch": 2.634071810542399,
"grad_norm": 0.7282926360608749,
"learning_rate": 3.141810581226782e-05,
"loss": 0.4862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.312755286693573,
"step": 1725,
"valid_targets_mean": 3535.2,
"valid_targets_min": 796
},
{
"epoch": 2.641711229946524,
"grad_norm": 0.6956213326065784,
"learning_rate": 3.135550994578897e-05,
"loss": 0.4809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2344173789024353,
"step": 1730,
"valid_targets_mean": 3056.6,
"valid_targets_min": 1378
},
{
"epoch": 2.6493506493506493,
"grad_norm": 0.6031654478325641,
"learning_rate": 3.129274949538169e-05,
"loss": 0.5099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2556261122226715,
"step": 1735,
"valid_targets_mean": 3144.1,
"valid_targets_min": 1791
},
{
"epoch": 2.6569900687547747,
"grad_norm": 0.6706862876679621,
"learning_rate": 3.122982537068028e-05,
"loss": 0.4703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28426307439804077,
"step": 1740,
"valid_targets_mean": 4114.6,
"valid_targets_min": 1840
},
{
"epoch": 2.6646294881588997,
"grad_norm": 0.6346741898139652,
"learning_rate": 3.1166738483691305e-05,
"loss": 0.4571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2778932452201843,
"step": 1745,
"valid_targets_mean": 4111.8,
"valid_targets_min": 1251
},
{
"epoch": 2.6722689075630255,
"grad_norm": 0.8266245480740433,
"learning_rate": 3.110348974878038e-05,
"loss": 0.4965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2906370162963867,
"step": 1750,
"valid_targets_mean": 2386.2,
"valid_targets_min": 1074
},
{
"epoch": 2.6799083269671504,
"grad_norm": 0.6638752682144674,
"learning_rate": 3.104008008265888e-05,
"loss": 0.4863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27586424350738525,
"step": 1755,
"valid_targets_mean": 3002.8,
"valid_targets_min": 849
},
{
"epoch": 2.687547746371276,
"grad_norm": 0.5942821754327564,
"learning_rate": 3.09765104043707e-05,
"loss": 0.4809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20257282257080078,
"step": 1760,
"valid_targets_mean": 3590.9,
"valid_targets_min": 1851
},
{
"epoch": 2.695187165775401,
"grad_norm": 0.5927687488678979,
"learning_rate": 3.0912781635278886e-05,
"loss": 0.4641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1888626366853714,
"step": 1765,
"valid_targets_mean": 3535.0,
"valid_targets_min": 812
},
{
"epoch": 2.702826585179526,
"grad_norm": 0.7947503911879893,
"learning_rate": 3.0848894699052326e-05,
"loss": 0.507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21330304443836212,
"step": 1770,
"valid_targets_mean": 3395.4,
"valid_targets_min": 1866
},
{
"epoch": 2.7104660045836515,
"grad_norm": 0.5926029230343366,
"learning_rate": 3.0784850521652336e-05,
"loss": 0.4636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1835680454969406,
"step": 1775,
"valid_targets_mean": 3637.9,
"valid_targets_min": 833
},
{
"epoch": 2.718105423987777,
"grad_norm": 0.6649422002748281,
"learning_rate": 3.072065003131925e-05,
"loss": 0.4696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3594931364059448,
"step": 1780,
"valid_targets_mean": 3790.4,
"valid_targets_min": 2012
},
{
"epoch": 2.7257448433919023,
"grad_norm": 0.9506459102901791,
"learning_rate": 3.0656294158558954e-05,
"loss": 0.5542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2790099084377289,
"step": 1785,
"valid_targets_mean": 3921.5,
"valid_targets_min": 2246
},
{
"epoch": 2.7333842627960276,
"grad_norm": 0.7082670183686091,
"learning_rate": 3.059178383612941e-05,
"loss": 0.4799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25146788358688354,
"step": 1790,
"valid_targets_mean": 2553.1,
"valid_targets_min": 1141
},
{
"epoch": 2.7410236822001526,
"grad_norm": 0.706151992610167,
"learning_rate": 3.052711999902715e-05,
"loss": 0.477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32185858488082886,
"step": 1795,
"valid_targets_mean": 3541.9,
"valid_targets_min": 795
},
{
"epoch": 2.748663101604278,
"grad_norm": 0.6419423098815215,
"learning_rate": 3.0462303584473692e-05,
"loss": 0.5119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.327781081199646,
"step": 1800,
"valid_targets_mean": 4346.9,
"valid_targets_min": 2177
},
{
"epoch": 2.7563025210084033,
"grad_norm": 0.8570229225472685,
"learning_rate": 3.039733553190198e-05,
"loss": 0.4682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14253611862659454,
"step": 1805,
"valid_targets_mean": 1997.4,
"valid_targets_min": 641
},
{
"epoch": 2.7639419404125287,
"grad_norm": 0.7558810429065274,
"learning_rate": 3.0332216782942763e-05,
"loss": 0.4915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2567565441131592,
"step": 1810,
"valid_targets_mean": 2702.4,
"valid_targets_min": 1348
},
{
"epoch": 2.771581359816654,
"grad_norm": 0.5963411952289389,
"learning_rate": 3.0266948281410943e-05,
"loss": 0.4823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1956261396408081,
"step": 1815,
"valid_targets_mean": 3508.9,
"valid_targets_min": 865
},
{
"epoch": 2.779220779220779,
"grad_norm": 0.6388646518127971,
"learning_rate": 3.020153097329189e-05,
"loss": 0.4715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21967804431915283,
"step": 1820,
"valid_targets_mean": 3618.1,
"valid_targets_min": 965
},
{
"epoch": 2.7868601986249044,
"grad_norm": 0.6146109467059201,
"learning_rate": 3.013596580672777e-05,
"loss": 0.4841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20610034465789795,
"step": 1825,
"valid_targets_mean": 3072.5,
"valid_targets_min": 1280
},
{
"epoch": 2.79449961802903,
"grad_norm": 0.8220069533572829,
"learning_rate": 3.0070253732003736e-05,
"loss": 0.5067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.287387490272522,
"step": 1830,
"valid_targets_mean": 2372.0,
"valid_targets_min": 719
},
{
"epoch": 2.802139037433155,
"grad_norm": 0.6060216832677047,
"learning_rate": 3.0004395701534208e-05,
"loss": 0.5046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1976098269224167,
"step": 1835,
"valid_targets_mean": 3524.0,
"valid_targets_min": 1211
},
{
"epoch": 2.8097784568372806,
"grad_norm": 0.6533429306985723,
"learning_rate": 2.9938392669849053e-05,
"loss": 0.4447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26395583152770996,
"step": 1840,
"valid_targets_mean": 3673.1,
"valid_targets_min": 994
},
{
"epoch": 2.8174178762414055,
"grad_norm": 0.7125496744028057,
"learning_rate": 2.9872245593579752e-05,
"loss": 0.494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25991716980934143,
"step": 1845,
"valid_targets_mean": 2532.6,
"valid_targets_min": 1158
},
{
"epoch": 2.825057295645531,
"grad_norm": 0.6313460986453029,
"learning_rate": 2.9805955431445514e-05,
"loss": 0.4549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2249601185321808,
"step": 1850,
"valid_targets_mean": 4385.2,
"valid_targets_min": 1337
},
{
"epoch": 2.8326967150496563,
"grad_norm": 0.6358505528090321,
"learning_rate": 2.973952314423943e-05,
"loss": 0.4566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28464820981025696,
"step": 1855,
"valid_targets_mean": 4168.4,
"valid_targets_min": 1499
},
{
"epoch": 2.8403361344537816,
"grad_norm": 0.7230163206181031,
"learning_rate": 2.9672949694814485e-05,
"loss": 0.4829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24439480900764465,
"step": 1860,
"valid_targets_mean": 2667.0,
"valid_targets_min": 755
},
{
"epoch": 2.847975553857907,
"grad_norm": 0.6704723628046145,
"learning_rate": 2.9606236048069655e-05,
"loss": 0.5093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18326005339622498,
"step": 1865,
"valid_targets_mean": 2370.1,
"valid_targets_min": 907
},
{
"epoch": 2.855614973262032,
"grad_norm": 0.6270630791742493,
"learning_rate": 2.9539383170935888e-05,
"loss": 0.5206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20464631915092468,
"step": 1870,
"valid_targets_mean": 2579.9,
"valid_targets_min": 551
},
{
"epoch": 2.8632543926661573,
"grad_norm": 0.6911077958995703,
"learning_rate": 2.9472392032362118e-05,
"loss": 0.5005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27718856930732727,
"step": 1875,
"valid_targets_mean": 3162.6,
"valid_targets_min": 1687
},
{
"epoch": 2.8708938120702827,
"grad_norm": 0.6414965035160827,
"learning_rate": 2.9405263603301185e-05,
"loss": 0.5001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2760189473628998,
"step": 1880,
"valid_targets_mean": 4009.4,
"valid_targets_min": 935
},
{
"epoch": 2.878533231474408,
"grad_norm": 0.6551981321713435,
"learning_rate": 2.93379988566958e-05,
"loss": 0.4851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3242207169532776,
"step": 1885,
"valid_targets_mean": 4115.9,
"valid_targets_min": 1409
},
{
"epoch": 2.8861726508785335,
"grad_norm": 0.679402550463882,
"learning_rate": 2.9270598767464422e-05,
"loss": 0.4948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25107401609420776,
"step": 1890,
"valid_targets_mean": 3046.4,
"valid_targets_min": 1207
},
{
"epoch": 2.8938120702826584,
"grad_norm": 0.6390110048027222,
"learning_rate": 2.920306431248712e-05,
"loss": 0.5069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22953186929225922,
"step": 1895,
"valid_targets_mean": 3236.5,
"valid_targets_min": 977
},
{
"epoch": 2.901451489686784,
"grad_norm": 0.6664644335329467,
"learning_rate": 2.9135396470591456e-05,
"loss": 0.4846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2379942238330841,
"step": 1900,
"valid_targets_mean": 2498.2,
"valid_targets_min": 1587
},
{
"epoch": 2.909090909090909,
"grad_norm": 0.7196033199681839,
"learning_rate": 2.9067596222538234e-05,
"loss": 0.5126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28052574396133423,
"step": 1905,
"valid_targets_mean": 3221.8,
"valid_targets_min": 1281
},
{
"epoch": 2.916730328495034,
"grad_norm": 0.7282565137655552,
"learning_rate": 2.8999664551007344e-05,
"loss": 0.5072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.298537015914917,
"step": 1910,
"valid_targets_mean": 2929.0,
"valid_targets_min": 1486
},
{
"epoch": 2.92436974789916,
"grad_norm": 0.6119949515081662,
"learning_rate": 2.8931602440583488e-05,
"loss": 0.505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22523435950279236,
"step": 1915,
"valid_targets_mean": 3136.1,
"valid_targets_min": 791
},
{
"epoch": 2.932009167303285,
"grad_norm": 0.5399954941991891,
"learning_rate": 2.8863410877741906e-05,
"loss": 0.5075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24924825131893158,
"step": 1920,
"valid_targets_mean": 4078.1,
"valid_targets_min": 1382
},
{
"epoch": 2.9396485867074102,
"grad_norm": 0.6177014347831229,
"learning_rate": 2.8795090850834113e-05,
"loss": 0.5141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30639275908470154,
"step": 1925,
"valid_targets_mean": 4244.5,
"valid_targets_min": 1024
},
{
"epoch": 2.9472880061115356,
"grad_norm": 0.6346987774339923,
"learning_rate": 2.8726643350073528e-05,
"loss": 0.4939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30813929438591003,
"step": 1930,
"valid_targets_mean": 4161.6,
"valid_targets_min": 1781
},
{
"epoch": 2.9549274255156606,
"grad_norm": 0.5630616587425123,
"learning_rate": 2.865806936752115e-05,
"loss": 0.4925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20618033409118652,
"step": 1935,
"valid_targets_mean": 3727.6,
"valid_targets_min": 1029
},
{
"epoch": 2.962566844919786,
"grad_norm": 0.6042368887587112,
"learning_rate": 2.8589369897071174e-05,
"loss": 0.4893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3170982003211975,
"step": 1940,
"valid_targets_mean": 4726.5,
"valid_targets_min": 1030
},
{
"epoch": 2.9702062643239113,
"grad_norm": 0.7568286827833816,
"learning_rate": 2.8520545934436602e-05,
"loss": 0.5234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21794971823692322,
"step": 1945,
"valid_targets_mean": 2020.6,
"valid_targets_min": 721
},
{
"epoch": 2.9778456837280367,
"grad_norm": 0.6106059417680693,
"learning_rate": 2.845159847713477e-05,
"loss": 0.4762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24992212653160095,
"step": 1950,
"valid_targets_mean": 3954.1,
"valid_targets_min": 1360
},
{
"epoch": 2.985485103132162,
"grad_norm": 0.5435572161508933,
"learning_rate": 2.8382528524472916e-05,
"loss": 0.479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23369833827018738,
"step": 1955,
"valid_targets_mean": 4845.0,
"valid_targets_min": 976
},
{
"epoch": 2.993124522536287,
"grad_norm": 0.6506312663229364,
"learning_rate": 2.831333707753372e-05,
"loss": 0.5213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3393819332122803,
"step": 1960,
"valid_targets_mean": 4771.0,
"valid_targets_min": 2823
},
{
"epoch": 3.0,
"grad_norm": 0.7542635576732258,
"learning_rate": 2.8244025139160745e-05,
"loss": 0.4668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.45052003860473633,
"step": 1965,
"valid_targets_mean": 4757.8,
"valid_targets_min": 1701
},
{
"epoch": 3.0076394194041254,
"grad_norm": 0.8520083341535113,
"learning_rate": 2.8174593713943933e-05,
"loss": 0.4627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.256170392036438,
"step": 1970,
"valid_targets_mean": 3575.5,
"valid_targets_min": 1617
},
{
"epoch": 3.0152788388082508,
"grad_norm": 0.6927471642692427,
"learning_rate": 2.8105043808205042e-05,
"loss": 0.4775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13694897294044495,
"step": 1975,
"valid_targets_mean": 2587.1,
"valid_targets_min": 1278
},
{
"epoch": 3.0229182582123757,
"grad_norm": 0.6552096347277138,
"learning_rate": 2.803537642998307e-05,
"loss": 0.4444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18564541637897491,
"step": 1980,
"valid_targets_mean": 2760.9,
"valid_targets_min": 1688
},
{
"epoch": 3.030557677616501,
"grad_norm": 0.7055118318105523,
"learning_rate": 2.79655925890196e-05,
"loss": 0.462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26022660732269287,
"step": 1985,
"valid_targets_mean": 3840.8,
"valid_targets_min": 1374
},
{
"epoch": 3.0381970970206265,
"grad_norm": 0.6819692775207933,
"learning_rate": 2.789569329674422e-05,
"loss": 0.4743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2793933153152466,
"step": 1990,
"valid_targets_mean": 3820.4,
"valid_targets_min": 2194
},
{
"epoch": 3.045836516424752,
"grad_norm": 0.6759014212454788,
"learning_rate": 2.7825679566259834e-05,
"loss": 0.4322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31307685375213623,
"step": 1995,
"valid_targets_mean": 4136.8,
"valid_targets_min": 1345
},
{
"epoch": 3.053475935828877,
"grad_norm": 0.7186371415409949,
"learning_rate": 2.7755552412327996e-05,
"loss": 0.5,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2766656279563904,
"step": 2000,
"valid_targets_mean": 3391.2,
"valid_targets_min": 976
},
{
"epoch": 3.061115355233002,
"grad_norm": 0.8200488852788307,
"learning_rate": 2.768531285135417e-05,
"loss": 0.433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21261753141880035,
"step": 2005,
"valid_targets_mean": 3123.6,
"valid_targets_min": 1113
},
{
"epoch": 3.0687547746371275,
"grad_norm": 0.7072416391028573,
"learning_rate": 2.7614961901373027e-05,
"loss": 0.446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2160511314868927,
"step": 2010,
"valid_targets_mean": 2450.9,
"valid_targets_min": 989
},
{
"epoch": 3.076394194041253,
"grad_norm": 0.650830887467269,
"learning_rate": 2.7544500582033706e-05,
"loss": 0.4686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36730068922042847,
"step": 2015,
"valid_targets_mean": 4055.4,
"valid_targets_min": 1037
},
{
"epoch": 3.0840336134453783,
"grad_norm": 0.690349423058777,
"learning_rate": 2.7473929914584977e-05,
"loss": 0.4463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23585245013237,
"step": 2020,
"valid_targets_mean": 3368.2,
"valid_targets_min": 1710
},
{
"epoch": 3.0916730328495032,
"grad_norm": 0.650718819701116,
"learning_rate": 2.7403250921860497e-05,
"loss": 0.453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25358718633651733,
"step": 2025,
"valid_targets_mean": 4090.8,
"valid_targets_min": 778
},
{
"epoch": 3.0993124522536286,
"grad_norm": 0.5963126945918865,
"learning_rate": 2.7332464628263945e-05,
"loss": 0.4718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22683659195899963,
"step": 2030,
"valid_targets_mean": 4324.2,
"valid_targets_min": 1248
},
{
"epoch": 3.106951871657754,
"grad_norm": 0.7170890890169099,
"learning_rate": 2.7261572059754217e-05,
"loss": 0.4698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21194159984588623,
"step": 2035,
"valid_targets_mean": 2557.9,
"valid_targets_min": 651
},
{
"epoch": 3.1145912910618794,
"grad_norm": 0.6270816527342218,
"learning_rate": 2.7190574243830505e-05,
"loss": 0.4708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25633394718170166,
"step": 2040,
"valid_targets_mean": 4321.0,
"valid_targets_min": 1909
},
{
"epoch": 3.1222307104660048,
"grad_norm": 0.6768057541438881,
"learning_rate": 2.7119472209517442e-05,
"loss": 0.4434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14575080573558807,
"step": 2045,
"valid_targets_mean": 2207.1,
"valid_targets_min": 698
},
{
"epoch": 3.1298701298701297,
"grad_norm": 0.6233377285938715,
"learning_rate": 2.7048266987350183e-05,
"loss": 0.4766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24185675382614136,
"step": 2050,
"valid_targets_mean": 3896.8,
"valid_targets_min": 1606
},
{
"epoch": 3.137509549274255,
"grad_norm": 0.8300155530398309,
"learning_rate": 2.6976959609359447e-05,
"loss": 0.4393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20969784259796143,
"step": 2055,
"valid_targets_mean": 2864.4,
"valid_targets_min": 855
},
{
"epoch": 3.1451489686783805,
"grad_norm": 0.7022719532986335,
"learning_rate": 2.6905551109056598e-05,
"loss": 0.4505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17745709419250488,
"step": 2060,
"valid_targets_mean": 2705.0,
"valid_targets_min": 1099
},
{
"epoch": 3.152788388082506,
"grad_norm": 0.7176816603828999,
"learning_rate": 2.6834042521418604e-05,
"loss": 0.4618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27983376383781433,
"step": 2065,
"valid_targets_mean": 3271.4,
"valid_targets_min": 1878
},
{
"epoch": 3.160427807486631,
"grad_norm": 0.5748440814115998,
"learning_rate": 2.6762434882873116e-05,
"loss": 0.4114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23593346774578094,
"step": 2070,
"valid_targets_mean": 4988.9,
"valid_targets_min": 2159
},
{
"epoch": 3.168067226890756,
"grad_norm": 0.6550371187304824,
"learning_rate": 2.6690729231283374e-05,
"loss": 0.4752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21643373370170593,
"step": 2075,
"valid_targets_mean": 3548.8,
"valid_targets_min": 914
},
{
"epoch": 3.1757066462948815,
"grad_norm": 0.7666764522952328,
"learning_rate": 2.66189266059332e-05,
"loss": 0.4793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32998839020729065,
"step": 2080,
"valid_targets_mean": 3029.2,
"valid_targets_min": 1459
},
{
"epoch": 3.183346065699007,
"grad_norm": 0.7500681322915863,
"learning_rate": 2.6547028047511943e-05,
"loss": 0.4558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17174682021141052,
"step": 2085,
"valid_targets_mean": 2901.1,
"valid_targets_min": 1174
},
{
"epoch": 3.1909854851031323,
"grad_norm": 0.7097897437767872,
"learning_rate": 2.6475034598099372e-05,
"loss": 0.4833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2244066298007965,
"step": 2090,
"valid_targets_mean": 3690.8,
"valid_targets_min": 1187
},
{
"epoch": 3.1986249045072572,
"grad_norm": 0.6152739239508643,
"learning_rate": 2.6402947301150583e-05,
"loss": 0.4655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2872171998023987,
"step": 2095,
"valid_targets_mean": 3874.6,
"valid_targets_min": 818
},
{
"epoch": 3.2062643239113826,
"grad_norm": 0.6686147346154969,
"learning_rate": 2.6330767201480873e-05,
"loss": 0.4547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22372795641422272,
"step": 2100,
"valid_targets_mean": 3518.4,
"valid_targets_min": 859
},
{
"epoch": 3.213903743315508,
"grad_norm": 0.6456365193151155,
"learning_rate": 2.62584953452506e-05,
"loss": 0.4367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21859055757522583,
"step": 2105,
"valid_targets_mean": 3339.4,
"valid_targets_min": 1347
},
{
"epoch": 3.2215431627196334,
"grad_norm": 0.7593984041165075,
"learning_rate": 2.6186132779950022e-05,
"loss": 0.4772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26761341094970703,
"step": 2110,
"valid_targets_mean": 2970.4,
"valid_targets_min": 1902
},
{
"epoch": 3.2291825821237587,
"grad_norm": 0.6501007799307098,
"learning_rate": 2.6113680554384107e-05,
"loss": 0.4602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2438923865556717,
"step": 2115,
"valid_targets_mean": 4634.4,
"valid_targets_min": 1688
},
{
"epoch": 3.2368220015278837,
"grad_norm": 0.5797241376930075,
"learning_rate": 2.604113971865734e-05,
"loss": 0.4383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31843867897987366,
"step": 2120,
"valid_targets_mean": 6170.1,
"valid_targets_min": 2066
},
{
"epoch": 3.244461420932009,
"grad_norm": 0.6842024873599893,
"learning_rate": 2.59685113241585e-05,
"loss": 0.463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35103440284729004,
"step": 2125,
"valid_targets_mean": 4209.1,
"valid_targets_min": 1380
},
{
"epoch": 3.2521008403361344,
"grad_norm": 0.752689560807153,
"learning_rate": 2.5895796423545418e-05,
"loss": 0.461,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20140741765499115,
"step": 2130,
"valid_targets_mean": 2656.8,
"valid_targets_min": 1519
},
{
"epoch": 3.25974025974026,
"grad_norm": 0.6413068877083942,
"learning_rate": 2.5822996070729723e-05,
"loss": 0.4546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21095341444015503,
"step": 2135,
"valid_targets_mean": 3406.9,
"valid_targets_min": 1623
},
{
"epoch": 3.267379679144385,
"grad_norm": 0.6451875065112788,
"learning_rate": 2.575011132086157e-05,
"loss": 0.4528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25910890102386475,
"step": 2140,
"valid_targets_mean": 4925.0,
"valid_targets_min": 1077
},
{
"epoch": 3.27501909854851,
"grad_norm": 0.9084443226542351,
"learning_rate": 2.567714323031434e-05,
"loss": 0.4391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22554218769073486,
"step": 2145,
"valid_targets_mean": 1927.1,
"valid_targets_min": 1180
},
{
"epoch": 3.2826585179526355,
"grad_norm": 0.7610395813343054,
"learning_rate": 2.560409285666933e-05,
"loss": 0.4654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23040610551834106,
"step": 2150,
"valid_targets_mean": 3317.0,
"valid_targets_min": 1487
},
{
"epoch": 3.290297937356761,
"grad_norm": 0.6121775750148253,
"learning_rate": 2.5530961258700444e-05,
"loss": 0.4053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1965913474559784,
"step": 2155,
"valid_targets_mean": 3397.2,
"valid_targets_min": 722
},
{
"epoch": 3.2979373567608863,
"grad_norm": 0.5434110974544242,
"learning_rate": 2.545774949635881e-05,
"loss": 0.4473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12601837515830994,
"step": 2160,
"valid_targets_mean": 3408.4,
"valid_targets_min": 979
},
{
"epoch": 3.3055767761650117,
"grad_norm": 0.6224547099221401,
"learning_rate": 2.5384458630757456e-05,
"loss": 0.459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25731584429740906,
"step": 2165,
"valid_targets_mean": 4671.9,
"valid_targets_min": 1430
},
{
"epoch": 3.3132161955691366,
"grad_norm": 0.6957316558389659,
"learning_rate": 2.5311089724155896e-05,
"loss": 0.4592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15687590837478638,
"step": 2170,
"valid_targets_mean": 2381.5,
"valid_targets_min": 939
},
{
"epoch": 3.320855614973262,
"grad_norm": 0.6437378155332701,
"learning_rate": 2.5237643839944774e-05,
"loss": 0.4614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18906278908252716,
"step": 2175,
"valid_targets_mean": 3104.6,
"valid_targets_min": 1500
},
{
"epoch": 3.3284950343773874,
"grad_norm": 0.7374192641903924,
"learning_rate": 2.5164122042630405e-05,
"loss": 0.4579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20864637196063995,
"step": 2180,
"valid_targets_mean": 2575.0,
"valid_targets_min": 839
},
{
"epoch": 3.3361344537815127,
"grad_norm": 0.6409476943750227,
"learning_rate": 2.509052539781937e-05,
"loss": 0.4325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2770101726055145,
"step": 2185,
"valid_targets_mean": 4118.1,
"valid_targets_min": 797
},
{
"epoch": 3.343773873185638,
"grad_norm": 1.0079250001951137,
"learning_rate": 2.5016854972203094e-05,
"loss": 0.4945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20084837079048157,
"step": 2190,
"valid_targets_mean": 1417.4,
"valid_targets_min": 813
},
{
"epoch": 3.351413292589763,
"grad_norm": 0.8895234998263297,
"learning_rate": 2.4943111833542333e-05,
"loss": 0.4724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28576815128326416,
"step": 2195,
"valid_targets_mean": 2029.2,
"valid_targets_min": 634
},
{
"epoch": 3.3590527119938884,
"grad_norm": 0.681661277197927,
"learning_rate": 2.4869297050651765e-05,
"loss": 0.4782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21255749464035034,
"step": 2200,
"valid_targets_mean": 3347.1,
"valid_targets_min": 925
},
{
"epoch": 3.366692131398014,
"grad_norm": 0.6721290525161261,
"learning_rate": 2.479541169338442e-05,
"loss": 0.474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2670324742794037,
"step": 2205,
"valid_targets_mean": 3668.6,
"valid_targets_min": 1138
},
{
"epoch": 3.374331550802139,
"grad_norm": 0.7347531309138814,
"learning_rate": 2.4721456832616247e-05,
"loss": 0.5287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2706944942474365,
"step": 2210,
"valid_targets_mean": 2375.9,
"valid_targets_min": 911
},
{
"epoch": 3.381970970206264,
"grad_norm": 0.6102358699138265,
"learning_rate": 2.4647433540230547e-05,
"loss": 0.4516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22291956841945648,
"step": 2215,
"valid_targets_mean": 4539.0,
"valid_targets_min": 1127
},
{
"epoch": 3.3896103896103895,
"grad_norm": 0.6827759823432588,
"learning_rate": 2.4573342889102443e-05,
"loss": 0.4694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1694415807723999,
"step": 2220,
"valid_targets_mean": 2403.1,
"valid_targets_min": 690
},
{
"epoch": 3.397249809014515,
"grad_norm": 0.6951348124592946,
"learning_rate": 2.4499185953083363e-05,
"loss": 0.4493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18465524911880493,
"step": 2225,
"valid_targets_mean": 2890.0,
"valid_targets_min": 1722
},
{
"epoch": 3.4048892284186403,
"grad_norm": 0.5973099924759062,
"learning_rate": 2.4424963806985432e-05,
"loss": 0.4948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22179313004016876,
"step": 2230,
"valid_targets_mean": 3594.6,
"valid_targets_min": 1134
},
{
"epoch": 3.4125286478227657,
"grad_norm": 0.750343525606607,
"learning_rate": 2.4350677526565934e-05,
"loss": 0.4442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3058930039405823,
"step": 2235,
"valid_targets_mean": 3820.2,
"valid_targets_min": 1639
},
{
"epoch": 3.4201680672268906,
"grad_norm": 0.8202808105318293,
"learning_rate": 2.427632818851166e-05,
"loss": 0.4853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28285735845565796,
"step": 2240,
"valid_targets_mean": 3445.6,
"valid_targets_min": 1053
},
{
"epoch": 3.427807486631016,
"grad_norm": 0.7045598247602469,
"learning_rate": 2.4201916870423393e-05,
"loss": 0.4965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17256322503089905,
"step": 2245,
"valid_targets_mean": 2347.6,
"valid_targets_min": 610
},
{
"epoch": 3.4354469060351414,
"grad_norm": 0.7389047344210837,
"learning_rate": 2.4127444650800203e-05,
"loss": 0.4842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2350621223449707,
"step": 2250,
"valid_targets_mean": 2283.5,
"valid_targets_min": 760
},
{
"epoch": 3.4430863254392667,
"grad_norm": 0.5995621961731215,
"learning_rate": 2.405291260902387e-05,
"loss": 0.4814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18150877952575684,
"step": 2255,
"valid_targets_mean": 3665.9,
"valid_targets_min": 1568
},
{
"epoch": 3.4507257448433917,
"grad_norm": 0.6681977273319017,
"learning_rate": 2.3978321825343206e-05,
"loss": 0.4655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22443902492523193,
"step": 2260,
"valid_targets_mean": 3334.6,
"valid_targets_min": 1305
},
{
"epoch": 3.458365164247517,
"grad_norm": 0.7011279817974063,
"learning_rate": 2.390367338085843e-05,
"loss": 0.4542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15961575508117676,
"step": 2265,
"valid_targets_mean": 1922.6,
"valid_targets_min": 832
},
{
"epoch": 3.4660045836516424,
"grad_norm": 0.6225101653595909,
"learning_rate": 2.382896835750547e-05,
"loss": 0.4334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17323069274425507,
"step": 2270,
"valid_targets_mean": 3204.8,
"valid_targets_min": 1141
},
{
"epoch": 3.473644003055768,
"grad_norm": 0.7095294516028836,
"learning_rate": 2.3754207838040296e-05,
"loss": 0.4482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1739782691001892,
"step": 2275,
"valid_targets_mean": 2280.6,
"valid_targets_min": 1130
},
{
"epoch": 3.481283422459893,
"grad_norm": 0.6968490266068142,
"learning_rate": 2.367939290602324e-05,
"loss": 0.4817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17820501327514648,
"step": 2280,
"valid_targets_mean": 2033.0,
"valid_targets_min": 917
},
{
"epoch": 3.488922841864018,
"grad_norm": 0.6648554409574585,
"learning_rate": 2.360452464580326e-05,
"loss": 0.4778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2294338345527649,
"step": 2285,
"valid_targets_mean": 3581.5,
"valid_targets_min": 935
},
{
"epoch": 3.4965622612681435,
"grad_norm": 0.7430674337203963,
"learning_rate": 2.352960414250223e-05,
"loss": 0.4631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24158762395381927,
"step": 2290,
"valid_targets_mean": 2921.4,
"valid_targets_min": 852
},
{
"epoch": 3.504201680672269,
"grad_norm": 0.7298796222195553,
"learning_rate": 2.345463248199925e-05,
"loss": 0.4822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23775427043437958,
"step": 2295,
"valid_targets_mean": 2701.9,
"valid_targets_min": 560
},
{
"epoch": 3.5118411000763943,
"grad_norm": 0.5806557240484798,
"learning_rate": 2.337961075091486e-05,
"loss": 0.4335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.221890389919281,
"step": 2300,
"valid_targets_mean": 4218.2,
"valid_targets_min": 1092
},
{
"epoch": 3.5194805194805197,
"grad_norm": 0.7571866275166863,
"learning_rate": 2.3304540036595313e-05,
"loss": 0.4776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2549300789833069,
"step": 2305,
"valid_targets_mean": 2839.0,
"valid_targets_min": 1288
},
{
"epoch": 3.5271199388846446,
"grad_norm": 0.5758410523457546,
"learning_rate": 2.322942142709682e-05,
"loss": 0.4637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26692140102386475,
"step": 2310,
"valid_targets_mean": 4998.4,
"valid_targets_min": 1708
},
{
"epoch": 3.53475935828877,
"grad_norm": 0.6878409192331846,
"learning_rate": 2.3154256011169758e-05,
"loss": 0.4551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17327441275119781,
"step": 2315,
"valid_targets_mean": 2440.4,
"valid_targets_min": 841
},
{
"epoch": 3.5423987776928954,
"grad_norm": 0.6394586452229399,
"learning_rate": 2.3079044878242934e-05,
"loss": 0.4654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19388046860694885,
"step": 2320,
"valid_targets_mean": 3832.6,
"valid_targets_min": 605
},
{
"epoch": 3.5500381970970207,
"grad_norm": 0.6385412390527023,
"learning_rate": 2.300378911840773e-05,
"loss": 0.439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21402673423290253,
"step": 2325,
"valid_targets_mean": 3548.6,
"valid_targets_min": 2209
},
{
"epoch": 3.557677616501146,
"grad_norm": 0.7468771536187816,
"learning_rate": 2.2928489822402363e-05,
"loss": 0.4712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27554431557655334,
"step": 2330,
"valid_targets_mean": 3242.6,
"valid_targets_min": 778
},
{
"epoch": 3.565317035905271,
"grad_norm": 0.8019666864327368,
"learning_rate": 2.285314808159604e-05,
"loss": 0.4488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22434744238853455,
"step": 2335,
"valid_targets_mean": 2466.4,
"valid_targets_min": 1480
},
{
"epoch": 3.5729564553093964,
"grad_norm": 0.6877910040053126,
"learning_rate": 2.2777764987973167e-05,
"loss": 0.4621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2005833387374878,
"step": 2340,
"valid_targets_mean": 2540.5,
"valid_targets_min": 1062
},
{
"epoch": 3.580595874713522,
"grad_norm": 0.6611814458537609,
"learning_rate": 2.2702341634117487e-05,
"loss": 0.4665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27685844898223877,
"step": 2345,
"valid_targets_mean": 3624.1,
"valid_targets_min": 1303
},
{
"epoch": 3.588235294117647,
"grad_norm": 0.7269943364354757,
"learning_rate": 2.262687911319628e-05,
"loss": 0.4541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2215583324432373,
"step": 2350,
"valid_targets_mean": 3072.8,
"valid_targets_min": 1418
},
{
"epoch": 3.5958747135217726,
"grad_norm": 0.7803987380189772,
"learning_rate": 2.2551378518944505e-05,
"loss": 0.4519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18608278036117554,
"step": 2355,
"valid_targets_mean": 2090.5,
"valid_targets_min": 931
},
{
"epoch": 3.6035141329258975,
"grad_norm": 0.7800039264188372,
"learning_rate": 2.247584094564894e-05,
"loss": 0.4157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2047506868839264,
"step": 2360,
"valid_targets_mean": 2571.6,
"valid_targets_min": 1560
},
{
"epoch": 3.611153552330023,
"grad_norm": 0.7134902841112694,
"learning_rate": 2.240026748813232e-05,
"loss": 0.4754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2151254266500473,
"step": 2365,
"valid_targets_mean": 2401.8,
"valid_targets_min": 1298
},
{
"epoch": 3.6187929717341483,
"grad_norm": 0.7075951063514955,
"learning_rate": 2.2324659241737495e-05,
"loss": 0.4702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21446746587753296,
"step": 2370,
"valid_targets_mean": 2707.9,
"valid_targets_min": 1052
},
{
"epoch": 3.6264323911382736,
"grad_norm": 0.6949316016720868,
"learning_rate": 2.2249017302311527e-05,
"loss": 0.4511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18831145763397217,
"step": 2375,
"valid_targets_mean": 1897.2,
"valid_targets_min": 435
},
{
"epoch": 3.634071810542399,
"grad_norm": 0.629633789269152,
"learning_rate": 2.2173342766189803e-05,
"loss": 0.4597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25491413474082947,
"step": 2380,
"valid_targets_mean": 4428.2,
"valid_targets_min": 1121
},
{
"epoch": 3.641711229946524,
"grad_norm": 0.5838022402143164,
"learning_rate": 2.209763673018019e-05,
"loss": 0.4803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20996476709842682,
"step": 2385,
"valid_targets_mean": 3756.1,
"valid_targets_min": 1593
},
{
"epoch": 3.6493506493506493,
"grad_norm": 0.7815834244454084,
"learning_rate": 2.202190029154708e-05,
"loss": 0.4427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23983490467071533,
"step": 2390,
"valid_targets_mean": 2568.0,
"valid_targets_min": 1599
},
{
"epoch": 3.6569900687547747,
"grad_norm": 0.7150259118212184,
"learning_rate": 2.1946134547995524e-05,
"loss": 0.4577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22549794614315033,
"step": 2395,
"valid_targets_mean": 2506.2,
"valid_targets_min": 1096
},
{
"epoch": 3.6646294881588997,
"grad_norm": 0.6335828466810162,
"learning_rate": 2.1870340597655303e-05,
"loss": 0.4405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22980603575706482,
"step": 2400,
"valid_targets_mean": 3558.9,
"valid_targets_min": 835
},
{
"epoch": 3.6722689075630255,
"grad_norm": 0.5764257422938297,
"learning_rate": 2.1794519539065037e-05,
"loss": 0.449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25543129444122314,
"step": 2405,
"valid_targets_mean": 4303.6,
"valid_targets_min": 1453
},
{
"epoch": 3.6799083269671504,
"grad_norm": 0.6545961859716691,
"learning_rate": 2.171867247115622e-05,
"loss": 0.4624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21702466905117035,
"step": 2410,
"valid_targets_mean": 3388.0,
"valid_targets_min": 1089
},
{
"epoch": 3.687547746371276,
"grad_norm": 0.644534217804787,
"learning_rate": 2.1642800493237343e-05,
"loss": 0.4353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2263290137052536,
"step": 2415,
"valid_targets_mean": 3678.1,
"valid_targets_min": 1118
},
{
"epoch": 3.695187165775401,
"grad_norm": 0.6221388982483342,
"learning_rate": 2.1566904704977925e-05,
"loss": 0.4741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2882634401321411,
"step": 2420,
"valid_targets_mean": 4166.2,
"valid_targets_min": 1327
},
{
"epoch": 3.702826585179526,
"grad_norm": 0.6658830128145721,
"learning_rate": 2.1490986206392598e-05,
"loss": 0.4841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18079718947410583,
"step": 2425,
"valid_targets_mean": 2733.5,
"valid_targets_min": 1694
},
{
"epoch": 3.7104660045836515,
"grad_norm": 0.7140090226865587,
"learning_rate": 2.1415046097825126e-05,
"loss": 0.4792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1596052497625351,
"step": 2430,
"valid_targets_mean": 2203.0,
"valid_targets_min": 1246
},
{
"epoch": 3.718105423987777,
"grad_norm": 0.6683971640083712,
"learning_rate": 2.1339085479932503e-05,
"loss": 0.5025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2300308346748352,
"step": 2435,
"valid_targets_mean": 3503.5,
"valid_targets_min": 573
},
{
"epoch": 3.7257448433919023,
"grad_norm": 0.7666648806984934,
"learning_rate": 2.1263105453668987e-05,
"loss": 0.4922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20825770497322083,
"step": 2440,
"valid_targets_mean": 2057.6,
"valid_targets_min": 795
},
{
"epoch": 3.7333842627960276,
"grad_norm": 0.7095697789754806,
"learning_rate": 2.1187107120270115e-05,
"loss": 0.4759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2333410680294037,
"step": 2445,
"valid_targets_mean": 2544.0,
"valid_targets_min": 817
},
{
"epoch": 3.7410236822001526,
"grad_norm": 0.7848497019198811,
"learning_rate": 2.1111091581236764e-05,
"loss": 0.453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23937958478927612,
"step": 2450,
"valid_targets_mean": 2462.8,
"valid_targets_min": 750
},
{
"epoch": 3.748663101604278,
"grad_norm": 0.7309498905361822,
"learning_rate": 2.1035059938319212e-05,
"loss": 0.4407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18757390975952148,
"step": 2455,
"valid_targets_mean": 2259.8,
"valid_targets_min": 994
},
{
"epoch": 3.7563025210084033,
"grad_norm": 0.6296154351875214,
"learning_rate": 2.0959013293501117e-05,
"loss": 0.4533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1372356116771698,
"step": 2460,
"valid_targets_mean": 2102.8,
"valid_targets_min": 877
},
{
"epoch": 3.7639419404125287,
"grad_norm": 0.6363160856990357,
"learning_rate": 2.0882952748983586e-05,
"loss": 0.4877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2305780053138733,
"step": 2465,
"valid_targets_mean": 3732.1,
"valid_targets_min": 1882
},
{
"epoch": 3.771581359816654,
"grad_norm": 0.7045522442945755,
"learning_rate": 2.080687940716916e-05,
"loss": 0.445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1693146526813507,
"step": 2470,
"valid_targets_mean": 2391.8,
"valid_targets_min": 864
},
{
"epoch": 3.779220779220779,
"grad_norm": 0.8102188625701466,
"learning_rate": 2.0730794370645895e-05,
"loss": 0.4462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3031376004219055,
"step": 2475,
"valid_targets_mean": 4573.8,
"valid_targets_min": 1604
},
{
"epoch": 3.7868601986249044,
"grad_norm": 0.5563888204797931,
"learning_rate": 2.0654698742171324e-05,
"loss": 0.4215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1911643147468567,
"step": 2480,
"valid_targets_mean": 3630.9,
"valid_targets_min": 851
},
{
"epoch": 3.79449961802903,
"grad_norm": 0.5959316920949063,
"learning_rate": 2.05785936246565e-05,
"loss": 0.4614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.191148579120636,
"step": 2485,
"valid_targets_mean": 3104.6,
"valid_targets_min": 581
},
{
"epoch": 3.802139037433155,
"grad_norm": 0.553521615537144,
"learning_rate": 2.050248012115001e-05,
"loss": 0.4291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17974773049354553,
"step": 2490,
"valid_targets_mean": 3192.0,
"valid_targets_min": 864
},
{
"epoch": 3.8097784568372806,
"grad_norm": 0.6997963953790906,
"learning_rate": 2.0426359334822e-05,
"loss": 0.453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2714889943599701,
"step": 2495,
"valid_targets_mean": 3805.4,
"valid_targets_min": 1498
},
{
"epoch": 3.8174178762414055,
"grad_norm": 0.6771839343218619,
"learning_rate": 2.035023236894815e-05,
"loss": 0.4673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20033538341522217,
"step": 2500,
"valid_targets_mean": 3261.2,
"valid_targets_min": 843
},
{
"epoch": 3.825057295645531,
"grad_norm": 0.6777326221424306,
"learning_rate": 2.0274100326893707e-05,
"loss": 0.4696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24825991690158844,
"step": 2505,
"valid_targets_mean": 3330.6,
"valid_targets_min": 684
},
{
"epoch": 3.8326967150496563,
"grad_norm": 0.7787026130733954,
"learning_rate": 2.0197964312097506e-05,
"loss": 0.4553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1855577826499939,
"step": 2510,
"valid_targets_mean": 2357.2,
"valid_targets_min": 812
},
{
"epoch": 3.8403361344537816,
"grad_norm": 0.6224254712363454,
"learning_rate": 2.012182542805595e-05,
"loss": 0.4693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21993130445480347,
"step": 2515,
"valid_targets_mean": 4545.5,
"valid_targets_min": 1754
},
{
"epoch": 3.847975553857907,
"grad_norm": 0.867489528747725,
"learning_rate": 2.004568477830703e-05,
"loss": 0.4698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23368635773658752,
"step": 2520,
"valid_targets_mean": 2934.0,
"valid_targets_min": 1020
},
{
"epoch": 3.855614973262032,
"grad_norm": 0.6239465544977696,
"learning_rate": 1.9969543466414322e-05,
"loss": 0.4457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2778353691101074,
"step": 2525,
"valid_targets_mean": 4597.9,
"valid_targets_min": 1207
},
{
"epoch": 3.8632543926661573,
"grad_norm": 0.8117178518330349,
"learning_rate": 1.989340259595102e-05,
"loss": 0.4726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33868181705474854,
"step": 2530,
"valid_targets_mean": 2752.0,
"valid_targets_min": 410
},
{
"epoch": 3.8708938120702827,
"grad_norm": 0.6934224395837933,
"learning_rate": 1.9817263270483905e-05,
"loss": 0.4556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20168477296829224,
"step": 2535,
"valid_targets_mean": 3182.5,
"valid_targets_min": 826
},
{
"epoch": 3.878533231474408,
"grad_norm": 0.8264078961610266,
"learning_rate": 1.9741126593557353e-05,
"loss": 0.4348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26114290952682495,
"step": 2540,
"valid_targets_mean": 3085.1,
"valid_targets_min": 1204
},
{
"epoch": 3.8861726508785335,
"grad_norm": 0.5747399845624196,
"learning_rate": 1.9664993668677387e-05,
"loss": 0.4539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21519362926483154,
"step": 2545,
"valid_targets_mean": 4435.5,
"valid_targets_min": 876
},
{
"epoch": 3.8938120702826584,
"grad_norm": 0.6078829505251382,
"learning_rate": 1.958886559929561e-05,
"loss": 0.4467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22459211945533752,
"step": 2550,
"valid_targets_mean": 3909.1,
"valid_targets_min": 979
},
{
"epoch": 3.901451489686784,
"grad_norm": 0.6421094318252095,
"learning_rate": 1.9512743488793272e-05,
"loss": 0.4512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23274767398834229,
"step": 2555,
"valid_targets_mean": 3336.9,
"valid_targets_min": 1185
},
{
"epoch": 3.909090909090909,
"grad_norm": 0.6246019102739618,
"learning_rate": 1.9436628440465267e-05,
"loss": 0.4673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21863816678524017,
"step": 2560,
"valid_targets_mean": 2936.9,
"valid_targets_min": 968
},
{
"epoch": 3.916730328495034,
"grad_norm": 0.6435846868106468,
"learning_rate": 1.9360521557504102e-05,
"loss": 0.435,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21502043306827545,
"step": 2565,
"valid_targets_mean": 3620.2,
"valid_targets_min": 1533
},
{
"epoch": 3.92436974789916,
"grad_norm": 0.7828764498827379,
"learning_rate": 1.928442394298397e-05,
"loss": 0.4702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1875026375055313,
"step": 2570,
"valid_targets_mean": 1726.6,
"valid_targets_min": 1143
},
{
"epoch": 3.932009167303285,
"grad_norm": 0.5941210989208424,
"learning_rate": 1.9208336699844695e-05,
"loss": 0.4621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1600552201271057,
"step": 2575,
"valid_targets_mean": 3049.6,
"valid_targets_min": 1331
},
{
"epoch": 3.9396485867074102,
"grad_norm": 0.6554685877224805,
"learning_rate": 1.913226093087581e-05,
"loss": 0.5097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22393539547920227,
"step": 2580,
"valid_targets_mean": 3305.1,
"valid_targets_min": 852
},
{
"epoch": 3.9472880061115356,
"grad_norm": 0.7422842219293272,
"learning_rate": 1.905619773870052e-05,
"loss": 0.4846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29345467686653137,
"step": 2585,
"valid_targets_mean": 3128.4,
"valid_targets_min": 1269
},
{
"epoch": 3.9549274255156606,
"grad_norm": 0.6220768386463338,
"learning_rate": 1.898014822575977e-05,
"loss": 0.4482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17033663392066956,
"step": 2590,
"valid_targets_mean": 2552.4,
"valid_targets_min": 1205
},
{
"epoch": 3.962566844919786,
"grad_norm": 0.6903241768662477,
"learning_rate": 1.890411349429623e-05,
"loss": 0.4633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20769096910953522,
"step": 2595,
"valid_targets_mean": 2664.8,
"valid_targets_min": 820
},
{
"epoch": 3.9702062643239113,
"grad_norm": 0.6154692002970737,
"learning_rate": 1.8828094646338323e-05,
"loss": 0.4755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22253820300102234,
"step": 2600,
"valid_targets_mean": 3467.6,
"valid_targets_min": 619
},
{
"epoch": 3.9778456837280367,
"grad_norm": 0.5858709827232779,
"learning_rate": 1.875209278368428e-05,
"loss": 0.4247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25010430812835693,
"step": 2605,
"valid_targets_mean": 4649.6,
"valid_targets_min": 2062
},
{
"epoch": 3.985485103132162,
"grad_norm": 0.7705722890771514,
"learning_rate": 1.867610900788612e-05,
"loss": 0.4601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24480944871902466,
"step": 2610,
"valid_targets_mean": 2811.4,
"valid_targets_min": 1077
},
{
"epoch": 3.993124522536287,
"grad_norm": 0.7432406655539916,
"learning_rate": 1.8600144420233752e-05,
"loss": 0.4532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3015478551387787,
"step": 2615,
"valid_targets_mean": 3291.5,
"valid_targets_min": 1244
},
{
"epoch": 4.0,
"grad_norm": 1.118384436602522,
"learning_rate": 1.8524200121738948e-05,
"loss": 0.492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5947331190109253,
"step": 2620,
"valid_targets_mean": 2656.5,
"valid_targets_min": 455
},
{
"epoch": 4.007639419404125,
"grad_norm": 0.7690026283732248,
"learning_rate": 1.844827721311943e-05,
"loss": 0.4482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21468114852905273,
"step": 2625,
"valid_targets_mean": 3231.8,
"valid_targets_min": 1540
},
{
"epoch": 4.015278838808251,
"grad_norm": 0.681129686061914,
"learning_rate": 1.83723767947829e-05,
"loss": 0.4226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1789844036102295,
"step": 2630,
"valid_targets_mean": 2767.0,
"valid_targets_min": 1733
},
{
"epoch": 4.022918258212376,
"grad_norm": 0.710910135229329,
"learning_rate": 1.829649996681108e-05,
"loss": 0.4452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22730287909507751,
"step": 2635,
"valid_targets_mean": 3989.2,
"valid_targets_min": 1211
},
{
"epoch": 4.0305576776165015,
"grad_norm": 0.7390014967088522,
"learning_rate": 1.8220647828943798e-05,
"loss": 0.419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1696176379919052,
"step": 2640,
"valid_targets_mean": 2481.0,
"valid_targets_min": 822
},
{
"epoch": 4.0381970970206265,
"grad_norm": 0.7079151818997759,
"learning_rate": 1.8144821480563004e-05,
"loss": 0.4246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18761557340621948,
"step": 2645,
"valid_targets_mean": 2711.4,
"valid_targets_min": 949
},
{
"epoch": 4.045836516424751,
"grad_norm": 0.7977337206226138,
"learning_rate": 1.8069022020676883e-05,
"loss": 0.4329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2581322193145752,
"step": 2650,
"valid_targets_mean": 2545.1,
"valid_targets_min": 530
},
{
"epoch": 4.053475935828877,
"grad_norm": 0.706216871603318,
"learning_rate": 1.7993250547903898e-05,
"loss": 0.4365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16597332060337067,
"step": 2655,
"valid_targets_mean": 2274.2,
"valid_targets_min": 828
},
{
"epoch": 4.061115355233002,
"grad_norm": 0.6452920539721788,
"learning_rate": 1.791750816045687e-05,
"loss": 0.4409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20056098699569702,
"step": 2660,
"valid_targets_mean": 4523.8,
"valid_targets_min": 464
},
{
"epoch": 4.068754774637128,
"grad_norm": 0.7588857980340116,
"learning_rate": 1.7841795956127076e-05,
"loss": 0.4164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2161455899477005,
"step": 2665,
"valid_targets_mean": 2293.6,
"valid_targets_min": 703
},
{
"epoch": 4.076394194041253,
"grad_norm": 0.6876134340921465,
"learning_rate": 1.7766115032268313e-05,
"loss": 0.4106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.299022912979126,
"step": 2670,
"valid_targets_mean": 4430.9,
"valid_targets_min": 1197
},
{
"epoch": 4.084033613445378,
"grad_norm": 0.6926601809186282,
"learning_rate": 1.769046648578102e-05,
"loss": 0.4538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2319658249616623,
"step": 2675,
"valid_targets_mean": 3480.9,
"valid_targets_min": 1354
},
{
"epoch": 4.091673032849504,
"grad_norm": 0.6594589767473226,
"learning_rate": 1.7614851413096338e-05,
"loss": 0.4423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19595220685005188,
"step": 2680,
"valid_targets_mean": 3187.6,
"valid_targets_min": 671
},
{
"epoch": 4.099312452253629,
"grad_norm": 0.790419683409844,
"learning_rate": 1.753927091016029e-05,
"loss": 0.423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20953130722045898,
"step": 2685,
"valid_targets_mean": 3638.5,
"valid_targets_min": 870
},
{
"epoch": 4.106951871657754,
"grad_norm": 0.7733355338048273,
"learning_rate": 1.746372607241782e-05,
"loss": 0.4761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20323872566223145,
"step": 2690,
"valid_targets_mean": 2683.2,
"valid_targets_min": 1323
},
{
"epoch": 4.114591291061879,
"grad_norm": 0.6552366064915041,
"learning_rate": 1.738821799479696e-05,
"loss": 0.4312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24009570479393005,
"step": 2695,
"valid_targets_mean": 3705.1,
"valid_targets_min": 1134
},
{
"epoch": 4.122230710466004,
"grad_norm": 0.7529808173350705,
"learning_rate": 1.731274777169296e-05,
"loss": 0.4277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14969006180763245,
"step": 2700,
"valid_targets_mean": 2055.2,
"valid_targets_min": 1427
},
{
"epoch": 4.12987012987013,
"grad_norm": 0.6936218633949953,
"learning_rate": 1.72373164969524e-05,
"loss": 0.4449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20020580291748047,
"step": 2705,
"valid_targets_mean": 2911.5,
"valid_targets_min": 826
},
{
"epoch": 4.137509549274255,
"grad_norm": 0.6778934162946096,
"learning_rate": 1.7161925263857367e-05,
"loss": 0.4402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17394796013832092,
"step": 2710,
"valid_targets_mean": 2909.0,
"valid_targets_min": 1183
},
{
"epoch": 4.145148968678381,
"grad_norm": 0.7116686368909119,
"learning_rate": 1.7086575165109576e-05,
"loss": 0.4603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23824220895767212,
"step": 2715,
"valid_targets_mean": 3688.0,
"valid_targets_min": 836
},
{
"epoch": 4.152788388082506,
"grad_norm": 0.7389107606127957,
"learning_rate": 1.7011267292814567e-05,
"loss": 0.416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2256026566028595,
"step": 2720,
"valid_targets_mean": 3048.5,
"valid_targets_min": 914
},
{
"epoch": 4.160427807486631,
"grad_norm": 0.6209290096899042,
"learning_rate": 1.6936002738465852e-05,
"loss": 0.4299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2748083174228668,
"step": 2725,
"valid_targets_mean": 5696.2,
"valid_targets_min": 1923
},
{
"epoch": 4.168067226890757,
"grad_norm": 0.7609911879557028,
"learning_rate": 1.686078259292911e-05,
"loss": 0.4333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22729676961898804,
"step": 2730,
"valid_targets_mean": 3419.4,
"valid_targets_min": 2046
},
{
"epoch": 4.1757066462948815,
"grad_norm": 0.7136364581542297,
"learning_rate": 1.6785607946426365e-05,
"loss": 0.431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2431565523147583,
"step": 2735,
"valid_targets_mean": 4014.6,
"valid_targets_min": 740
},
{
"epoch": 4.1833460656990065,
"grad_norm": 0.653814674078787,
"learning_rate": 1.671047988852019e-05,
"loss": 0.4323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26763594150543213,
"step": 2740,
"valid_targets_mean": 4340.1,
"valid_targets_min": 735
},
{
"epoch": 4.190985485103132,
"grad_norm": 0.6477365295148055,
"learning_rate": 1.663539950809792e-05,
"loss": 0.4154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20111311972141266,
"step": 2745,
"valid_targets_mean": 3306.9,
"valid_targets_min": 921
},
{
"epoch": 4.198624904507257,
"grad_norm": 0.6923380432257537,
"learning_rate": 1.6560367893355852e-05,
"loss": 0.4078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15234971046447754,
"step": 2750,
"valid_targets_mean": 2417.6,
"valid_targets_min": 921
},
{
"epoch": 4.206264323911383,
"grad_norm": 0.7693482875043431,
"learning_rate": 1.6485386131783495e-05,
"loss": 0.4319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2205432653427124,
"step": 2755,
"valid_targets_mean": 2677.0,
"valid_targets_min": 997
},
{
"epoch": 4.213903743315508,
"grad_norm": 0.615414794511978,
"learning_rate": 1.6410455310147797e-05,
"loss": 0.4536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2940524220466614,
"step": 2760,
"valid_targets_mean": 3730.5,
"valid_targets_min": 1592
},
{
"epoch": 4.221543162719633,
"grad_norm": 0.7076306553236521,
"learning_rate": 1.63355765144774e-05,
"loss": 0.4086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16093017160892487,
"step": 2765,
"valid_targets_mean": 3209.5,
"valid_targets_min": 1221
},
{
"epoch": 4.229182582123759,
"grad_norm": 0.8056253074864008,
"learning_rate": 1.6260750830046876e-05,
"loss": 0.4166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.245550736784935,
"step": 2770,
"valid_targets_mean": 3017.1,
"valid_targets_min": 1784
},
{
"epoch": 4.236822001527884,
"grad_norm": 0.748600942244156,
"learning_rate": 1.6185979341361037e-05,
"loss": 0.4275,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19234326481819153,
"step": 2775,
"valid_targets_mean": 2891.6,
"valid_targets_min": 1149
},
{
"epoch": 4.2444614209320095,
"grad_norm": 0.5918768300976833,
"learning_rate": 1.6111263132139198e-05,
"loss": 0.4173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2575937509536743,
"step": 2780,
"valid_targets_mean": 5343.8,
"valid_targets_min": 2623
},
{
"epoch": 4.2521008403361344,
"grad_norm": 0.7756708955173703,
"learning_rate": 1.6036603285299443e-05,
"loss": 0.4585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19431465864181519,
"step": 2785,
"valid_targets_mean": 2496.0,
"valid_targets_min": 785
},
{
"epoch": 4.259740259740259,
"grad_norm": 0.7551317271285645,
"learning_rate": 1.596200088294297e-05,
"loss": 0.4041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2065984159708023,
"step": 2790,
"valid_targets_mean": 2938.9,
"valid_targets_min": 1360
},
{
"epoch": 4.267379679144385,
"grad_norm": 0.7576742731600777,
"learning_rate": 1.588745700633839e-05,
"loss": 0.4341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2416866570711136,
"step": 2795,
"valid_targets_mean": 2821.4,
"valid_targets_min": 1032
},
{
"epoch": 4.27501909854851,
"grad_norm": 0.7111031081474437,
"learning_rate": 1.5812972735906066e-05,
"loss": 0.4069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13971193134784698,
"step": 2800,
"valid_targets_mean": 2554.2,
"valid_targets_min": 820
},
{
"epoch": 4.282658517952636,
"grad_norm": 0.6615809212808664,
"learning_rate": 1.5738549151202407e-05,
"loss": 0.4319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20371738076210022,
"step": 2805,
"valid_targets_mean": 3638.4,
"valid_targets_min": 1205
},
{
"epoch": 4.290297937356761,
"grad_norm": 0.8364032589879101,
"learning_rate": 1.5664187330904306e-05,
"loss": 0.4446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19082514941692352,
"step": 2810,
"valid_targets_mean": 2542.2,
"valid_targets_min": 907
},
{
"epoch": 4.297937356760886,
"grad_norm": 0.7049427991206001,
"learning_rate": 1.5589888352793436e-05,
"loss": 0.4502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22058123350143433,
"step": 2815,
"valid_targets_mean": 4915.6,
"valid_targets_min": 1269
},
{
"epoch": 4.305576776165012,
"grad_norm": 0.7212184176724953,
"learning_rate": 1.5515653293740637e-05,
"loss": 0.4387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25808072090148926,
"step": 2820,
"valid_targets_mean": 3785.6,
"valid_targets_min": 1016
},
{
"epoch": 4.313216195569137,
"grad_norm": 0.6826238022765982,
"learning_rate": 1.544148322969035e-05,
"loss": 0.4278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22490471601486206,
"step": 2825,
"valid_targets_mean": 3405.4,
"valid_targets_min": 545
},
{
"epoch": 4.320855614973262,
"grad_norm": 0.8261773124931177,
"learning_rate": 1.5367379235644973e-05,
"loss": 0.4179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19495196640491486,
"step": 2830,
"valid_targets_mean": 2450.9,
"valid_targets_min": 1140
},
{
"epoch": 4.328495034377387,
"grad_norm": 0.6390880153692574,
"learning_rate": 1.529334238564932e-05,
"loss": 0.4201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17437967658042908,
"step": 2835,
"valid_targets_mean": 4055.9,
"valid_targets_min": 889
},
{
"epoch": 4.336134453781512,
"grad_norm": 0.7703651186273575,
"learning_rate": 1.521937375277501e-05,
"loss": 0.4335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18413357436656952,
"step": 2840,
"valid_targets_mean": 2652.8,
"valid_targets_min": 814
},
{
"epoch": 4.343773873185638,
"grad_norm": 0.6368753230093523,
"learning_rate": 1.5145474409104962e-05,
"loss": 0.4265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2968963384628296,
"step": 2845,
"valid_targets_mean": 4633.8,
"valid_targets_min": 797
},
{
"epoch": 4.351413292589763,
"grad_norm": 0.5903985232599476,
"learning_rate": 1.507164542571784e-05,
"loss": 0.4196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18544989824295044,
"step": 2850,
"valid_targets_mean": 3483.8,
"valid_targets_min": 407
},
{
"epoch": 4.359052711993888,
"grad_norm": 0.662217973508679,
"learning_rate": 1.49978878726725e-05,
"loss": 0.4607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17374002933502197,
"step": 2855,
"valid_targets_mean": 2742.6,
"valid_targets_min": 797
},
{
"epoch": 4.366692131398014,
"grad_norm": 0.6636333553320053,
"learning_rate": 1.4924202818992517e-05,
"loss": 0.4384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3518938720226288,
"step": 2860,
"valid_targets_mean": 4384.1,
"valid_targets_min": 1059
},
{
"epoch": 4.374331550802139,
"grad_norm": 0.8000423908088488,
"learning_rate": 1.4850591332650679e-05,
"loss": 0.4178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17594996094703674,
"step": 2865,
"valid_targets_mean": 2390.4,
"valid_targets_min": 1549
},
{
"epoch": 4.381970970206265,
"grad_norm": 0.6055308221886132,
"learning_rate": 1.4777054480553514e-05,
"loss": 0.4552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24170832335948944,
"step": 2870,
"valid_targets_mean": 4342.2,
"valid_targets_min": 975
},
{
"epoch": 4.3896103896103895,
"grad_norm": 0.6903510024741975,
"learning_rate": 1.47035933285258e-05,
"loss": 0.4326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21987634897232056,
"step": 2875,
"valid_targets_mean": 3401.8,
"valid_targets_min": 991
},
{
"epoch": 4.3972498090145145,
"grad_norm": 0.6979371022754717,
"learning_rate": 1.4630208941295156e-05,
"loss": 0.399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1578153818845749,
"step": 2880,
"valid_targets_mean": 2634.9,
"valid_targets_min": 841
},
{
"epoch": 4.40488922841864,
"grad_norm": 0.7514413276024192,
"learning_rate": 1.4556902382476579e-05,
"loss": 0.4158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23249536752700806,
"step": 2885,
"valid_targets_mean": 3987.5,
"valid_targets_min": 682
},
{
"epoch": 4.412528647822765,
"grad_norm": 0.7198762011769154,
"learning_rate": 1.448367471455705e-05,
"loss": 0.4487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.207943394780159,
"step": 2890,
"valid_targets_mean": 2996.8,
"valid_targets_min": 1069
},
{
"epoch": 4.420168067226891,
"grad_norm": 0.6599812130280833,
"learning_rate": 1.4410526998880122e-05,
"loss": 0.4602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23088182508945465,
"step": 2895,
"valid_targets_mean": 4051.1,
"valid_targets_min": 1394
},
{
"epoch": 4.427807486631016,
"grad_norm": 0.9040364751596435,
"learning_rate": 1.4337460295630531e-05,
"loss": 0.4528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2535208463668823,
"step": 2900,
"valid_targets_mean": 4407.2,
"valid_targets_min": 1606
},
{
"epoch": 4.435446906035141,
"grad_norm": 0.6946233200223303,
"learning_rate": 1.4264475663818864e-05,
"loss": 0.4225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20772013068199158,
"step": 2905,
"valid_targets_mean": 3627.0,
"valid_targets_min": 1727
},
{
"epoch": 4.443086325439267,
"grad_norm": 0.6996399854509193,
"learning_rate": 1.419157416126615e-05,
"loss": 0.4594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23996701836585999,
"step": 2910,
"valid_targets_mean": 3127.0,
"valid_targets_min": 751
},
{
"epoch": 4.450725744843392,
"grad_norm": 0.6603193020020982,
"learning_rate": 1.4118756844588585e-05,
"loss": 0.4441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22003193199634552,
"step": 2915,
"valid_targets_mean": 4034.8,
"valid_targets_min": 989
},
{
"epoch": 4.4583651642475175,
"grad_norm": 0.667399183048132,
"learning_rate": 1.4046024769182194e-05,
"loss": 0.4148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23613163828849792,
"step": 2920,
"valid_targets_mean": 4173.1,
"valid_targets_min": 1640
},
{
"epoch": 4.466004583651642,
"grad_norm": 0.8259826448808988,
"learning_rate": 1.3973378989207535e-05,
"loss": 0.4363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2937498092651367,
"step": 2925,
"valid_targets_mean": 3235.8,
"valid_targets_min": 702
},
{
"epoch": 4.473644003055767,
"grad_norm": 0.7033941655509587,
"learning_rate": 1.3900820557574425e-05,
"loss": 0.4472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23923955857753754,
"step": 2930,
"valid_targets_mean": 4048.2,
"valid_targets_min": 1459
},
{
"epoch": 4.481283422459893,
"grad_norm": 0.7454285606687833,
"learning_rate": 1.3828350525926663e-05,
"loss": 0.4237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21835088729858398,
"step": 2935,
"valid_targets_mean": 2663.1,
"valid_targets_min": 1070
},
{
"epoch": 4.488922841864018,
"grad_norm": 0.7110475251004348,
"learning_rate": 1.3755969944626823e-05,
"loss": 0.4194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2952437996864319,
"step": 2940,
"valid_targets_mean": 4387.2,
"valid_targets_min": 867
},
{
"epoch": 4.496562261268144,
"grad_norm": 0.8828237294270216,
"learning_rate": 1.368367986274098e-05,
"loss": 0.4394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2030916064977646,
"step": 2945,
"valid_targets_mean": 1706.4,
"valid_targets_min": 813
},
{
"epoch": 4.504201680672269,
"grad_norm": 0.6954473223855169,
"learning_rate": 1.3611481328023554e-05,
"loss": 0.4564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25050777196884155,
"step": 2950,
"valid_targets_mean": 3577.8,
"valid_targets_min": 911
},
{
"epoch": 4.511841100076394,
"grad_norm": 0.6422040953597707,
"learning_rate": 1.3539375386902092e-05,
"loss": 0.4139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19034726917743683,
"step": 2955,
"valid_targets_mean": 3637.6,
"valid_targets_min": 784
},
{
"epoch": 4.51948051948052,
"grad_norm": 0.813407071704735,
"learning_rate": 1.3467363084462122e-05,
"loss": 0.4588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22248804569244385,
"step": 2960,
"valid_targets_mean": 2901.4,
"valid_targets_min": 802
},
{
"epoch": 4.527119938884645,
"grad_norm": 0.598255408018068,
"learning_rate": 1.3395445464431997e-05,
"loss": 0.4403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2788901925086975,
"step": 2965,
"valid_targets_mean": 5120.8,
"valid_targets_min": 1669
},
{
"epoch": 4.53475935828877,
"grad_norm": 0.7320702572816888,
"learning_rate": 1.3323623569167748e-05,
"loss": 0.4426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2455928921699524,
"step": 2970,
"valid_targets_mean": 3704.1,
"valid_targets_min": 885
},
{
"epoch": 4.542398777692895,
"grad_norm": 0.8656712332196725,
"learning_rate": 1.3251898439638025e-05,
"loss": 0.4323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28234678506851196,
"step": 2975,
"valid_targets_mean": 2744.9,
"valid_targets_min": 619
},
{
"epoch": 4.55003819709702,
"grad_norm": 0.6145036757635849,
"learning_rate": 1.3180271115408944e-05,
"loss": 0.4606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20645278692245483,
"step": 2980,
"valid_targets_mean": 4847.0,
"valid_targets_min": 1823
},
{
"epoch": 4.557677616501146,
"grad_norm": 0.7084910960235971,
"learning_rate": 1.310874263462909e-05,
"loss": 0.409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17451977729797363,
"step": 2985,
"valid_targets_mean": 2182.5,
"valid_targets_min": 831
},
{
"epoch": 4.565317035905271,
"grad_norm": 0.6562259432752094,
"learning_rate": 1.303731403401441e-05,
"loss": 0.4415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2443830817937851,
"step": 2990,
"valid_targets_mean": 4561.2,
"valid_targets_min": 2325
},
{
"epoch": 4.572956455309397,
"grad_norm": 0.696214858440501,
"learning_rate": 1.2965986348833229e-05,
"loss": 0.4487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27823278307914734,
"step": 2995,
"valid_targets_mean": 4183.0,
"valid_targets_min": 1061
},
{
"epoch": 4.580595874713522,
"grad_norm": 0.7307211959598596,
"learning_rate": 1.2894760612891219e-05,
"loss": 0.4133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17543989419937134,
"step": 3000,
"valid_targets_mean": 3196.6,
"valid_targets_min": 915
},
{
"epoch": 4.588235294117647,
"grad_norm": 0.7005195593755522,
"learning_rate": 1.2823637858516432e-05,
"loss": 0.4569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24170951545238495,
"step": 3005,
"valid_targets_mean": 3459.9,
"valid_targets_min": 636
},
{
"epoch": 4.595874713521773,
"grad_norm": 0.7209567127788638,
"learning_rate": 1.2752619116544333e-05,
"loss": 0.4303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22956225275993347,
"step": 3010,
"valid_targets_mean": 3502.8,
"valid_targets_min": 916
},
{
"epoch": 4.6035141329258975,
"grad_norm": 0.6653489435920646,
"learning_rate": 1.2681705416302839e-05,
"loss": 0.4554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18298763036727905,
"step": 3015,
"valid_targets_mean": 3679.9,
"valid_targets_min": 1256
},
{
"epoch": 4.611153552330023,
"grad_norm": 0.7852042606455901,
"learning_rate": 1.2610897785597441e-05,
"loss": 0.458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2998313307762146,
"step": 3020,
"valid_targets_mean": 3142.8,
"valid_targets_min": 748
},
{
"epoch": 4.618792971734148,
"grad_norm": 0.7486001259075058,
"learning_rate": 1.2540197250696266e-05,
"loss": 0.4231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27724653482437134,
"step": 3025,
"valid_targets_mean": 3724.6,
"valid_targets_min": 1254
},
{
"epoch": 4.626432391138273,
"grad_norm": 0.6340367863972102,
"learning_rate": 1.2469604836315237e-05,
"loss": 0.4362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3218015730381012,
"step": 3030,
"valid_targets_mean": 5287.8,
"valid_targets_min": 1415
},
{
"epoch": 4.634071810542399,
"grad_norm": 0.8297601491978646,
"learning_rate": 1.2399121565603203e-05,
"loss": 0.4173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27993282675743103,
"step": 3035,
"valid_targets_mean": 3140.9,
"valid_targets_min": 766
},
{
"epoch": 4.641711229946524,
"grad_norm": 0.8392576086594048,
"learning_rate": 1.2328748460127095e-05,
"loss": 0.4372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24703417718410492,
"step": 3040,
"valid_targets_mean": 2254.0,
"valid_targets_min": 811
},
{
"epoch": 4.64935064935065,
"grad_norm": 0.76403301632943,
"learning_rate": 1.2258486539857163e-05,
"loss": 0.4339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.214448019862175,
"step": 3045,
"valid_targets_mean": 2798.6,
"valid_targets_min": 1137
},
{
"epoch": 4.656990068754775,
"grad_norm": 0.7607712205600897,
"learning_rate": 1.2188336823152137e-05,
"loss": 0.456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2419661283493042,
"step": 3050,
"valid_targets_mean": 3125.0,
"valid_targets_min": 1810
},
{
"epoch": 4.6646294881589,
"grad_norm": 0.6780774718582251,
"learning_rate": 1.2118300326744525e-05,
"loss": 0.4407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2228745073080063,
"step": 3055,
"valid_targets_mean": 3821.5,
"valid_targets_min": 943
},
{
"epoch": 4.6722689075630255,
"grad_norm": 0.7415756571172493,
"learning_rate": 1.2048378065725821e-05,
"loss": 0.4282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21102388203144073,
"step": 3060,
"valid_targets_mean": 2965.5,
"valid_targets_min": 823
},
{
"epoch": 4.67990832696715,
"grad_norm": 0.826558813326542,
"learning_rate": 1.1978571053531848e-05,
"loss": 0.4675,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27071088552474976,
"step": 3065,
"valid_targets_mean": 3043.9,
"valid_targets_min": 780
},
{
"epoch": 4.687547746371276,
"grad_norm": 0.8463261732397126,
"learning_rate": 1.1908880301928012e-05,
"loss": 0.4489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25644421577453613,
"step": 3070,
"valid_targets_mean": 2437.5,
"valid_targets_min": 1480
},
{
"epoch": 4.695187165775401,
"grad_norm": 0.7807727309561482,
"learning_rate": 1.1839306820994692e-05,
"loss": 0.4537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23279087245464325,
"step": 3075,
"valid_targets_mean": 3059.1,
"valid_targets_min": 1494
},
{
"epoch": 4.702826585179526,
"grad_norm": 0.664795453987691,
"learning_rate": 1.1769851619112571e-05,
"loss": 0.4268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1653788685798645,
"step": 3080,
"valid_targets_mean": 2827.6,
"valid_targets_min": 952
},
{
"epoch": 4.710466004583652,
"grad_norm": 0.7404044663755746,
"learning_rate": 1.1700515702948003e-05,
"loss": 0.4363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18012934923171997,
"step": 3085,
"valid_targets_mean": 2408.6,
"valid_targets_min": 689
},
{
"epoch": 4.718105423987777,
"grad_norm": 0.6959670506262801,
"learning_rate": 1.1631300077438474e-05,
"loss": 0.4032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1842706799507141,
"step": 3090,
"valid_targets_mean": 2286.6,
"valid_targets_min": 1089
},
{
"epoch": 4.725744843391903,
"grad_norm": 0.6789388370499856,
"learning_rate": 1.1562205745777976e-05,
"loss": 0.4147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16564428806304932,
"step": 3095,
"valid_targets_mean": 3138.4,
"valid_targets_min": 1894
},
{
"epoch": 4.733384262796028,
"grad_norm": 0.6829775331974125,
"learning_rate": 1.149323370940254e-05,
"loss": 0.4374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20033124089241028,
"step": 3100,
"valid_targets_mean": 2759.4,
"valid_targets_min": 910
},
{
"epoch": 4.741023682200153,
"grad_norm": 0.6955835942094102,
"learning_rate": 1.1424384967975638e-05,
"loss": 0.4386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19949236512184143,
"step": 3105,
"valid_targets_mean": 2783.8,
"valid_targets_min": 1222
},
{
"epoch": 4.748663101604278,
"grad_norm": 0.8058435461758185,
"learning_rate": 1.1355660519373757e-05,
"loss": 0.4324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2256844937801361,
"step": 3110,
"valid_targets_mean": 3453.5,
"valid_targets_min": 1166
},
{
"epoch": 4.756302521008403,
"grad_norm": 0.543464576904595,
"learning_rate": 1.1287061359671918e-05,
"loss": 0.4511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1765793263912201,
"step": 3115,
"valid_targets_mean": 4341.4,
"valid_targets_min": 1047
},
{
"epoch": 4.763941940412528,
"grad_norm": 0.6367461792370757,
"learning_rate": 1.1218588483129226e-05,
"loss": 0.4428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.232584148645401,
"step": 3120,
"valid_targets_mean": 3673.0,
"valid_targets_min": 721
},
{
"epoch": 4.771581359816654,
"grad_norm": 0.635073599945755,
"learning_rate": 1.115024288217447e-05,
"loss": 0.4254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18331608176231384,
"step": 3125,
"valid_targets_mean": 3576.4,
"valid_targets_min": 487
},
{
"epoch": 4.779220779220779,
"grad_norm": 0.7428588724353016,
"learning_rate": 1.1082025547391742e-05,
"loss": 0.4409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22744230926036835,
"step": 3130,
"valid_targets_mean": 2550.1,
"valid_targets_min": 951
},
{
"epoch": 4.786860198624905,
"grad_norm": 0.831972596497422,
"learning_rate": 1.1013937467506075e-05,
"loss": 0.4348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24062250554561615,
"step": 3135,
"valid_targets_mean": 2996.0,
"valid_targets_min": 888
},
{
"epoch": 4.79449961802903,
"grad_norm": 0.7072316785824789,
"learning_rate": 1.0945979629369103e-05,
"loss": 0.4284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20350953936576843,
"step": 3140,
"valid_targets_mean": 3159.4,
"valid_targets_min": 1559
},
{
"epoch": 4.802139037433155,
"grad_norm": 0.7422268731369834,
"learning_rate": 1.0878153017944801e-05,
"loss": 0.4664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37612760066986084,
"step": 3145,
"valid_targets_mean": 4292.4,
"valid_targets_min": 922
},
{
"epoch": 4.809778456837281,
"grad_norm": 0.7624693176548212,
"learning_rate": 1.0810458616295146e-05,
"loss": 0.4421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21782265603542328,
"step": 3150,
"valid_targets_mean": 2382.0,
"valid_targets_min": 1072
},
{
"epoch": 4.8174178762414055,
"grad_norm": 0.7281106937968902,
"learning_rate": 1.0742897405565892e-05,
"loss": 0.4394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2107025533914566,
"step": 3155,
"valid_targets_mean": 3610.5,
"valid_targets_min": 1363
},
{
"epoch": 4.825057295645531,
"grad_norm": 0.6543758653177835,
"learning_rate": 1.0675470364972412e-05,
"loss": 0.4434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2604054808616638,
"step": 3160,
"valid_targets_mean": 4376.6,
"valid_targets_min": 1138
},
{
"epoch": 4.832696715049656,
"grad_norm": 0.7376066895580519,
"learning_rate": 1.0608178471785369e-05,
"loss": 0.4605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2066906839609146,
"step": 3165,
"valid_targets_mean": 2716.8,
"valid_targets_min": 868
},
{
"epoch": 4.840336134453781,
"grad_norm": 0.867558948336844,
"learning_rate": 1.0541022701316704e-05,
"loss": 0.415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22561189532279968,
"step": 3170,
"valid_targets_mean": 2282.2,
"valid_targets_min": 937
},
{
"epoch": 4.847975553857907,
"grad_norm": 0.753345607833048,
"learning_rate": 1.0474004026905393e-05,
"loss": 0.4214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17792923748493195,
"step": 3175,
"valid_targets_mean": 2575.5,
"valid_targets_min": 822
},
{
"epoch": 4.855614973262032,
"grad_norm": 0.6965195935418431,
"learning_rate": 1.040712341990338e-05,
"loss": 0.4427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21977144479751587,
"step": 3180,
"valid_targets_mean": 3192.2,
"valid_targets_min": 1430
},
{
"epoch": 4.863254392666157,
"grad_norm": 0.7244562227938083,
"learning_rate": 1.0340381849661512e-05,
"loss": 0.4209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20825041830539703,
"step": 3185,
"valid_targets_mean": 2705.8,
"valid_targets_min": 1218
},
{
"epoch": 4.870893812070283,
"grad_norm": 1.1658836220367665,
"learning_rate": 1.027378028351545e-05,
"loss": 0.4843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23123201727867126,
"step": 3190,
"valid_targets_mean": 2676.0,
"valid_targets_min": 1005
},
{
"epoch": 4.878533231474408,
"grad_norm": 0.6428607046807531,
"learning_rate": 1.020731968677168e-05,
"loss": 0.4559,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2840641140937805,
"step": 3195,
"valid_targets_mean": 4760.5,
"valid_targets_min": 1489
},
{
"epoch": 4.8861726508785335,
"grad_norm": 0.6424493789075727,
"learning_rate": 1.0141001022693513e-05,
"loss": 0.4392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19804728031158447,
"step": 3200,
"valid_targets_mean": 4134.6,
"valid_targets_min": 1719
},
{
"epoch": 4.893812070282658,
"grad_norm": 0.6689835440970003,
"learning_rate": 1.0074825252487124e-05,
"loss": 0.4411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25073152780532837,
"step": 3205,
"valid_targets_mean": 4041.5,
"valid_targets_min": 714
},
{
"epoch": 4.901451489686783,
"grad_norm": 0.6395385434248182,
"learning_rate": 1.0008793335287605e-05,
"loss": 0.4115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18766605854034424,
"step": 3210,
"valid_targets_mean": 3877.2,
"valid_targets_min": 799
},
{
"epoch": 4.909090909090909,
"grad_norm": 0.5500861300454841,
"learning_rate": 9.942906228145123e-06,
"loss": 0.4486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19914793968200684,
"step": 3215,
"valid_targets_mean": 5092.1,
"valid_targets_min": 823
},
{
"epoch": 4.916730328495034,
"grad_norm": 0.7386027211516123,
"learning_rate": 9.877164886010938e-06,
"loss": 0.4429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2817431688308716,
"step": 3220,
"valid_targets_mean": 4743.6,
"valid_targets_min": 1186
},
{
"epoch": 4.92436974789916,
"grad_norm": 0.7019719562878625,
"learning_rate": 9.811570261723676e-06,
"loss": 0.4377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19408079981803894,
"step": 3225,
"valid_targets_mean": 3703.9,
"valid_targets_min": 2009
},
{
"epoch": 4.932009167303285,
"grad_norm": 0.5384230165710143,
"learning_rate": 9.746123305995476e-06,
"loss": 0.4166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2503221035003662,
"step": 3230,
"valid_targets_mean": 5923.2,
"valid_targets_min": 712
},
{
"epoch": 4.93964858670741,
"grad_norm": 0.5960933611824211,
"learning_rate": 9.68082496739816e-06,
"loss": 0.4418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16890287399291992,
"step": 3235,
"valid_targets_mean": 3072.4,
"valid_targets_min": 760
},
{
"epoch": 4.947288006111536,
"grad_norm": 0.6770220213062155,
"learning_rate": 9.615676192349577e-06,
"loss": 0.4071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2525444030761719,
"step": 3240,
"valid_targets_mean": 4509.0,
"valid_targets_min": 1865
},
{
"epoch": 4.954927425515661,
"grad_norm": 0.6485055817592701,
"learning_rate": 9.550677925099815e-06,
"loss": 0.4239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1657400280237198,
"step": 3245,
"valid_targets_mean": 3076.2,
"valid_targets_min": 681
},
{
"epoch": 4.962566844919786,
"grad_norm": 0.6337463064952114,
"learning_rate": 9.485831107717547e-06,
"loss": 0.4375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18350504338741302,
"step": 3250,
"valid_targets_mean": 3156.8,
"valid_targets_min": 938
},
{
"epoch": 4.970206264323911,
"grad_norm": 0.7324159499991673,
"learning_rate": 9.421136680076365e-06,
"loss": 0.4194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22422681748867035,
"step": 3255,
"valid_targets_mean": 3919.8,
"valid_targets_min": 899
},
{
"epoch": 4.977845683728036,
"grad_norm": 0.7105972910190749,
"learning_rate": 9.356595579841158e-06,
"loss": 0.4544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23887526988983154,
"step": 3260,
"valid_targets_mean": 3753.4,
"valid_targets_min": 540
},
{
"epoch": 4.985485103132162,
"grad_norm": 0.7336493987221758,
"learning_rate": 9.292208742454549e-06,
"loss": 0.4498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2927570641040802,
"step": 3265,
"valid_targets_mean": 4896.9,
"valid_targets_min": 783
},
{
"epoch": 4.993124522536287,
"grad_norm": 0.6727667356515784,
"learning_rate": 9.227977101123287e-06,
"loss": 0.4317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1748276650905609,
"step": 3270,
"valid_targets_mean": 2757.0,
"valid_targets_min": 974
},
{
"epoch": 5.0,
"grad_norm": 0.9434978159648666,
"learning_rate": 9.16390158680476e-06,
"loss": 0.4491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4982553720474243,
"step": 3275,
"valid_targets_mean": 3907.4,
"valid_targets_min": 2144
},
{
"epoch": 5.007639419404125,
"grad_norm": 0.6507985228704842,
"learning_rate": 9.099983128193481e-06,
"loss": 0.411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18580271303653717,
"step": 3280,
"valid_targets_mean": 2795.2,
"valid_targets_min": 1168
},
{
"epoch": 5.015278838808251,
"grad_norm": 0.7057074937993735,
"learning_rate": 9.036222651707666e-06,
"loss": 0.4068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2280879020690918,
"step": 3285,
"valid_targets_mean": 4809.2,
"valid_targets_min": 1883
},
{
"epoch": 5.022918258212376,
"grad_norm": 0.5656641524682343,
"learning_rate": 8.972621081475727e-06,
"loss": 0.4542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10994422435760498,
"step": 3290,
"valid_targets_mean": 2460.4,
"valid_targets_min": 872
},
{
"epoch": 5.0305576776165015,
"grad_norm": 0.8761421207054235,
"learning_rate": 8.909179339322971e-06,
"loss": 0.4142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22071196138858795,
"step": 3295,
"valid_targets_mean": 2460.5,
"valid_targets_min": 780
},
{
"epoch": 5.0381970970206265,
"grad_norm": 0.7295305809963956,
"learning_rate": 8.845898344758199e-06,
"loss": 0.4163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19741207361221313,
"step": 3300,
"valid_targets_mean": 2860.1,
"valid_targets_min": 1663
},
{
"epoch": 5.045836516424751,
"grad_norm": 0.7112452731180018,
"learning_rate": 8.782779014960327e-06,
"loss": 0.4009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17603464424610138,
"step": 3305,
"valid_targets_mean": 2539.2,
"valid_targets_min": 1289
},
{
"epoch": 5.053475935828877,
"grad_norm": 0.7839524218700084,
"learning_rate": 8.719822264765204e-06,
"loss": 0.418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24770452082157135,
"step": 3310,
"valid_targets_mean": 3061.1,
"valid_targets_min": 641
},
{
"epoch": 5.061115355233002,
"grad_norm": 0.6200210304675198,
"learning_rate": 8.657029006652247e-06,
"loss": 0.3937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1898297518491745,
"step": 3315,
"valid_targets_mean": 4409.4,
"valid_targets_min": 1434
},
{
"epoch": 5.068754774637128,
"grad_norm": 0.7448282508495098,
"learning_rate": 8.594400150731278e-06,
"loss": 0.4165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20044977962970734,
"step": 3320,
"valid_targets_mean": 3152.1,
"valid_targets_min": 1468
},
{
"epoch": 5.076394194041253,
"grad_norm": 0.7330563381797555,
"learning_rate": 8.531936604729315e-06,
"loss": 0.4048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2015673816204071,
"step": 3325,
"valid_targets_mean": 3392.9,
"valid_targets_min": 1959
},
{
"epoch": 5.084033613445378,
"grad_norm": 0.6574570667834281,
"learning_rate": 8.469639273977404e-06,
"loss": 0.4092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2060699760913849,
"step": 3330,
"valid_targets_mean": 3534.9,
"valid_targets_min": 772
},
{
"epoch": 5.091673032849504,
"grad_norm": 0.7192898176205931,
"learning_rate": 8.407509061397525e-06,
"loss": 0.4242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19831335544586182,
"step": 3335,
"valid_targets_mean": 3844.0,
"valid_targets_min": 1320
},
{
"epoch": 5.099312452253629,
"grad_norm": 0.6989885300271562,
"learning_rate": 8.345546867489478e-06,
"loss": 0.431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22625543177127838,
"step": 3340,
"valid_targets_mean": 3683.0,
"valid_targets_min": 1248
},
{
"epoch": 5.106951871657754,
"grad_norm": 0.6891661447879618,
"learning_rate": 8.283753590317844e-06,
"loss": 0.4167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1683456003665924,
"step": 3345,
"valid_targets_mean": 2819.9,
"valid_targets_min": 879
},
{
"epoch": 5.114591291061879,
"grad_norm": 0.6744309100184774,
"learning_rate": 8.222130125498959e-06,
"loss": 0.4175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2619309425354004,
"step": 3350,
"valid_targets_mean": 4709.9,
"valid_targets_min": 1766
},
{
"epoch": 5.122230710466004,
"grad_norm": 0.7643882359784762,
"learning_rate": 8.160677366187973e-06,
"loss": 0.4037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24490387737751007,
"step": 3355,
"valid_targets_mean": 4076.8,
"valid_targets_min": 641
},
{
"epoch": 5.12987012987013,
"grad_norm": 0.765032206390207,
"learning_rate": 8.099396203065818e-06,
"loss": 0.4049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15527962148189545,
"step": 3360,
"valid_targets_mean": 2164.2,
"valid_targets_min": 1001
},
{
"epoch": 5.137509549274255,
"grad_norm": 0.672539908906615,
"learning_rate": 8.038287524326412e-06,
"loss": 0.4215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17782077193260193,
"step": 3365,
"valid_targets_mean": 3591.0,
"valid_targets_min": 1006
},
{
"epoch": 5.145148968678381,
"grad_norm": 0.7211933101160407,
"learning_rate": 7.977352215663687e-06,
"loss": 0.4217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15421822667121887,
"step": 3370,
"valid_targets_mean": 2195.5,
"valid_targets_min": 868
},
{
"epoch": 5.152788388082506,
"grad_norm": 0.8298079760424127,
"learning_rate": 7.916591160258801e-06,
"loss": 0.4492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18245047330856323,
"step": 3375,
"valid_targets_mean": 2769.5,
"valid_targets_min": 1123
},
{
"epoch": 5.160427807486631,
"grad_norm": 0.7848489488943335,
"learning_rate": 7.856005238767352e-06,
"loss": 0.4031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1802041083574295,
"step": 3380,
"valid_targets_mean": 2449.5,
"valid_targets_min": 739
},
{
"epoch": 5.168067226890757,
"grad_norm": 0.828689552301754,
"learning_rate": 7.79559532930656e-06,
"loss": 0.4003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17640046775341034,
"step": 3385,
"valid_targets_mean": 2253.6,
"valid_targets_min": 605
},
{
"epoch": 5.1757066462948815,
"grad_norm": 0.8939948317428271,
"learning_rate": 7.735362307442587e-06,
"loss": 0.4254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20057544112205505,
"step": 3390,
"valid_targets_mean": 2309.8,
"valid_targets_min": 711
},
{
"epoch": 5.1833460656990065,
"grad_norm": 0.7064878087869875,
"learning_rate": 7.675307046177824e-06,
"loss": 0.444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1704927682876587,
"step": 3395,
"valid_targets_mean": 3034.6,
"valid_targets_min": 668
},
{
"epoch": 5.190985485103132,
"grad_norm": 0.8392581300544377,
"learning_rate": 7.615430415938247e-06,
"loss": 0.4146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26886194944381714,
"step": 3400,
"valid_targets_mean": 3126.4,
"valid_targets_min": 868
},
{
"epoch": 5.198624904507257,
"grad_norm": 0.5899801518379102,
"learning_rate": 7.555733284560791e-06,
"loss": 0.4166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19343039393424988,
"step": 3405,
"valid_targets_mean": 4824.8,
"valid_targets_min": 1434
},
{
"epoch": 5.206264323911383,
"grad_norm": 0.6828929324395993,
"learning_rate": 7.496216517280801e-06,
"loss": 0.4104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21579919755458832,
"step": 3410,
"valid_targets_mean": 3761.9,
"valid_targets_min": 2207
},
{
"epoch": 5.213903743315508,
"grad_norm": 0.7563428889342848,
"learning_rate": 7.436880976719447e-06,
"loss": 0.4272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22617709636688232,
"step": 3415,
"valid_targets_mean": 3657.2,
"valid_targets_min": 802
},
{
"epoch": 5.221543162719633,
"grad_norm": 0.9220246281743919,
"learning_rate": 7.377727522871246e-06,
"loss": 0.4128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20721417665481567,
"step": 3420,
"valid_targets_mean": 2134.1,
"valid_targets_min": 800
},
{
"epoch": 5.229182582123759,
"grad_norm": 0.7834904193038889,
"learning_rate": 7.318757013091622e-06,
"loss": 0.3837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1851697862148285,
"step": 3425,
"valid_targets_mean": 2451.8,
"valid_targets_min": 951
},
{
"epoch": 5.236822001527884,
"grad_norm": 0.648240952651534,
"learning_rate": 7.259970302084405e-06,
"loss": 0.3728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18699084222316742,
"step": 3430,
"valid_targets_mean": 3529.8,
"valid_targets_min": 939
},
{
"epoch": 5.2444614209320095,
"grad_norm": 0.8208594769460752,
"learning_rate": 7.2013682418895435e-06,
"loss": 0.4363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20773524045944214,
"step": 3435,
"valid_targets_mean": 2560.2,
"valid_targets_min": 826
},
{
"epoch": 5.2521008403361344,
"grad_norm": 0.8545535257360884,
"learning_rate": 7.142951681870669e-06,
"loss": 0.4256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21555760502815247,
"step": 3440,
"valid_targets_mean": 2220.1,
"valid_targets_min": 685
},
{
"epoch": 5.259740259740259,
"grad_norm": 0.7813176036108497,
"learning_rate": 7.084721468702822e-06,
"loss": 0.3894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22744975984096527,
"step": 3445,
"valid_targets_mean": 2960.5,
"valid_targets_min": 1632
},
{
"epoch": 5.267379679144385,
"grad_norm": 0.7830401754519163,
"learning_rate": 7.026678446360204e-06,
"loss": 0.3987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18200945854187012,
"step": 3450,
"valid_targets_mean": 2975.2,
"valid_targets_min": 1274
},
{
"epoch": 5.27501909854851,
"grad_norm": 0.7338311439811203,
"learning_rate": 6.9688234561038925e-06,
"loss": 0.4252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16019290685653687,
"step": 3455,
"valid_targets_mean": 2500.2,
"valid_targets_min": 1106
},
{
"epoch": 5.282658517952636,
"grad_norm": 0.7882790373444832,
"learning_rate": 6.911157336469685e-06,
"loss": 0.4159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18955618143081665,
"step": 3460,
"valid_targets_mean": 3472.8,
"valid_targets_min": 787
},
{
"epoch": 5.290297937356761,
"grad_norm": 0.8243210594375885,
"learning_rate": 6.853680923255932e-06,
"loss": 0.4084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24365636706352234,
"step": 3465,
"valid_targets_mean": 3001.8,
"valid_targets_min": 750
},
{
"epoch": 5.297937356760886,
"grad_norm": 0.7590409540259425,
"learning_rate": 6.796395049511431e-06,
"loss": 0.4149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21231132745742798,
"step": 3470,
"valid_targets_mean": 3273.2,
"valid_targets_min": 931
},
{
"epoch": 5.305576776165012,
"grad_norm": 1.0632303615019383,
"learning_rate": 6.739300545523335e-06,
"loss": 0.4052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2338356226682663,
"step": 3475,
"valid_targets_mean": 3178.6,
"valid_targets_min": 947
},
{
"epoch": 5.313216195569137,
"grad_norm": 0.756230519495017,
"learning_rate": 6.682398238805161e-06,
"loss": 0.4145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24491998553276062,
"step": 3480,
"valid_targets_mean": 2977.2,
"valid_targets_min": 998
},
{
"epoch": 5.320855614973262,
"grad_norm": 0.845343670274438,
"learning_rate": 6.625688954084739e-06,
"loss": 0.3901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1987672746181488,
"step": 3485,
"valid_targets_mean": 2708.9,
"valid_targets_min": 871
},
{
"epoch": 5.328495034377387,
"grad_norm": 0.7592874195569738,
"learning_rate": 6.569173513292289e-06,
"loss": 0.4121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2058597207069397,
"step": 3490,
"valid_targets_mean": 2993.6,
"valid_targets_min": 1043
},
{
"epoch": 5.336134453781512,
"grad_norm": 0.7987958580833625,
"learning_rate": 6.512852735548529e-06,
"loss": 0.4422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18779411911964417,
"step": 3495,
"valid_targets_mean": 2571.9,
"valid_targets_min": 808
},
{
"epoch": 5.343773873185638,
"grad_norm": 0.6740552418391473,
"learning_rate": 6.456727437152737e-06,
"loss": 0.4181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21062324941158295,
"step": 3500,
"valid_targets_mean": 3471.2,
"valid_targets_min": 893
},
{
"epoch": 5.351413292589763,
"grad_norm": 0.7949901183059733,
"learning_rate": 6.400798431571009e-06,
"loss": 0.4309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19252058863639832,
"step": 3505,
"valid_targets_mean": 2609.5,
"valid_targets_min": 1768
},
{
"epoch": 5.359052711993888,
"grad_norm": 0.9011653868394018,
"learning_rate": 6.345066529424391e-06,
"loss": 0.4146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19950778782367706,
"step": 3510,
"valid_targets_mean": 2509.4,
"valid_targets_min": 863
},
{
"epoch": 5.366692131398014,
"grad_norm": 0.8226863591976814,
"learning_rate": 6.289532538477163e-06,
"loss": 0.4199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16507697105407715,
"step": 3515,
"valid_targets_mean": 2465.1,
"valid_targets_min": 1014
},
{
"epoch": 5.374331550802139,
"grad_norm": 0.7702667277518003,
"learning_rate": 6.234197263625157e-06,
"loss": 0.4154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18763992190361023,
"step": 3520,
"valid_targets_mean": 2658.5,
"valid_targets_min": 1043
},
{
"epoch": 5.381970970206265,
"grad_norm": 0.7546441510309715,
"learning_rate": 6.179061506884018e-06,
"loss": 0.4036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20631533861160278,
"step": 3525,
"valid_targets_mean": 3253.8,
"valid_targets_min": 1863
},
{
"epoch": 5.3896103896103895,
"grad_norm": 1.0332493720632743,
"learning_rate": 6.124126067377669e-06,
"loss": 0.4486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18635576963424683,
"step": 3530,
"valid_targets_mean": 2523.4,
"valid_targets_min": 882
},
{
"epoch": 5.3972498090145145,
"grad_norm": 0.8600167635311569,
"learning_rate": 6.069391741326658e-06,
"loss": 0.4272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23452191054821014,
"step": 3535,
"valid_targets_mean": 3307.4,
"valid_targets_min": 1234
},
{
"epoch": 5.40488922841864,
"grad_norm": 0.7472968803751108,
"learning_rate": 6.014859322036655e-06,
"loss": 0.475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25068214535713196,
"step": 3540,
"valid_targets_mean": 3746.0,
"valid_targets_min": 1742
},
{
"epoch": 5.412528647822765,
"grad_norm": 0.7724354110335331,
"learning_rate": 5.960529599886933e-06,
"loss": 0.4249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2862878441810608,
"step": 3545,
"valid_targets_mean": 3475.9,
"valid_targets_min": 871
},
{
"epoch": 5.420168067226891,
"grad_norm": 0.5927597795747025,
"learning_rate": 5.906403362318953e-06,
"loss": 0.4233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13544148206710815,
"step": 3550,
"valid_targets_mean": 3212.5,
"valid_targets_min": 1620
},
{
"epoch": 5.427807486631016,
"grad_norm": 0.8215858475471198,
"learning_rate": 5.852481393824876e-06,
"loss": 0.4273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1856689155101776,
"step": 3555,
"valid_targets_mean": 2500.4,
"valid_targets_min": 436
},
{
"epoch": 5.435446906035141,
"grad_norm": 0.7534978382823645,
"learning_rate": 5.7987644759362715e-06,
"loss": 0.4056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2625764310359955,
"step": 3560,
"valid_targets_mean": 3408.6,
"valid_targets_min": 1712
},
{
"epoch": 5.443086325439267,
"grad_norm": 0.7365666325994856,
"learning_rate": 5.745253387212759e-06,
"loss": 0.4148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22502942383289337,
"step": 3565,
"valid_targets_mean": 3521.4,
"valid_targets_min": 841
},
{
"epoch": 5.450725744843392,
"grad_norm": 0.7997567097717743,
"learning_rate": 5.691948903230691e-06,
"loss": 0.3924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2259596586227417,
"step": 3570,
"valid_targets_mean": 3082.4,
"valid_targets_min": 694
},
{
"epoch": 5.4583651642475175,
"grad_norm": 0.8822731379082949,
"learning_rate": 5.638851796571974e-06,
"loss": 0.4349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22405478358268738,
"step": 3575,
"valid_targets_mean": 2302.9,
"valid_targets_min": 962
},
{
"epoch": 5.466004583651642,
"grad_norm": 0.7443175145614003,
"learning_rate": 5.585962836812822e-06,
"loss": 0.4053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3522719144821167,
"step": 3580,
"valid_targets_mean": 4707.1,
"valid_targets_min": 686
},
{
"epoch": 5.473644003055767,
"grad_norm": 0.7684422668048446,
"learning_rate": 5.533282790512624e-06,
"loss": 0.3872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18864914774894714,
"step": 3585,
"valid_targets_mean": 2916.6,
"valid_targets_min": 758
},
{
"epoch": 5.481283422459893,
"grad_norm": 0.6752647565568806,
"learning_rate": 5.480812421202828e-06,
"loss": 0.4047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17078009247779846,
"step": 3590,
"valid_targets_mean": 3693.9,
"valid_targets_min": 1209
},
{
"epoch": 5.488922841864018,
"grad_norm": 0.815831254632104,
"learning_rate": 5.428552489375876e-06,
"loss": 0.4002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18773040175437927,
"step": 3595,
"valid_targets_mean": 2936.0,
"valid_targets_min": 1065
},
{
"epoch": 5.496562261268144,
"grad_norm": 0.6615077791531486,
"learning_rate": 5.376503752474191e-06,
"loss": 0.3985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13504765927791595,
"step": 3600,
"valid_targets_mean": 3119.9,
"valid_targets_min": 606
},
{
"epoch": 5.504201680672269,
"grad_norm": 0.6605364243810754,
"learning_rate": 5.32466696487918e-06,
"loss": 0.417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17553292214870453,
"step": 3605,
"valid_targets_mean": 3754.2,
"valid_targets_min": 947
},
{
"epoch": 5.511841100076394,
"grad_norm": 0.6762092368293349,
"learning_rate": 5.273042877900308e-06,
"loss": 0.4103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14567619562149048,
"step": 3610,
"valid_targets_mean": 2932.9,
"valid_targets_min": 867
},
{
"epoch": 5.51948051948052,
"grad_norm": 0.6178381332291257,
"learning_rate": 5.221632239764207e-06,
"loss": 0.4082,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16620564460754395,
"step": 3615,
"valid_targets_mean": 4656.1,
"valid_targets_min": 2486
},
{
"epoch": 5.527119938884645,
"grad_norm": 0.7235563732760826,
"learning_rate": 5.170435795603863e-06,
"loss": 0.4218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1886502504348755,
"step": 3620,
"valid_targets_mean": 3256.5,
"valid_targets_min": 1766
},
{
"epoch": 5.53475935828877,
"grad_norm": 0.8302130888371341,
"learning_rate": 5.119454287447738e-06,
"loss": 0.4508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29996421933174133,
"step": 3625,
"valid_targets_mean": 3539.0,
"valid_targets_min": 1062
},
{
"epoch": 5.542398777692895,
"grad_norm": 0.6664804259859938,
"learning_rate": 5.068688454209114e-06,
"loss": 0.4187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20061370730400085,
"step": 3630,
"valid_targets_mean": 4539.8,
"valid_targets_min": 2136
},
{
"epoch": 5.55003819709702,
"grad_norm": 0.8158756541380983,
"learning_rate": 5.018139031675309e-06,
"loss": 0.3994,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.287477046251297,
"step": 3635,
"valid_targets_mean": 3718.4,
"valid_targets_min": 1199
},
{
"epoch": 5.557677616501146,
"grad_norm": 0.7383633611419538,
"learning_rate": 4.967806752497036e-06,
"loss": 0.4128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20177043974399567,
"step": 3640,
"valid_targets_mean": 3811.8,
"valid_targets_min": 643
},
{
"epoch": 5.565317035905271,
"grad_norm": 0.6984282055877477,
"learning_rate": 4.917692346177804e-06,
"loss": 0.4224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18860375881195068,
"step": 3645,
"valid_targets_mean": 2725.0,
"valid_targets_min": 790
},
{
"epoch": 5.572956455309397,
"grad_norm": 0.7157370657179769,
"learning_rate": 4.8677965390633145e-06,
"loss": 0.4094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1753612458705902,
"step": 3650,
"valid_targets_mean": 3218.1,
"valid_targets_min": 959
},
{
"epoch": 5.580595874713522,
"grad_norm": 0.8658457792874761,
"learning_rate": 4.818120054330946e-06,
"loss": 0.4224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23552726209163666,
"step": 3655,
"valid_targets_mean": 2594.4,
"valid_targets_min": 1090
},
{
"epoch": 5.588235294117647,
"grad_norm": 0.6971295570889691,
"learning_rate": 4.768663611979276e-06,
"loss": 0.4246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18920549750328064,
"step": 3660,
"valid_targets_mean": 2897.9,
"valid_targets_min": 1045
},
{
"epoch": 5.595874713521773,
"grad_norm": 0.7536367310381494,
"learning_rate": 4.719427928817637e-06,
"loss": 0.3903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23616181313991547,
"step": 3665,
"valid_targets_mean": 3631.9,
"valid_targets_min": 897
},
{
"epoch": 5.6035141329258975,
"grad_norm": 0.7259568515171714,
"learning_rate": 4.670413718455753e-06,
"loss": 0.4041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16838884353637695,
"step": 3670,
"valid_targets_mean": 3266.1,
"valid_targets_min": 1098
},
{
"epoch": 5.611153552330023,
"grad_norm": 0.6880333970118933,
"learning_rate": 4.6216216912933546e-06,
"loss": 0.4116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17340365052223206,
"step": 3675,
"valid_targets_mean": 4112.2,
"valid_targets_min": 983
},
{
"epoch": 5.618792971734148,
"grad_norm": 0.6469773412047066,
"learning_rate": 4.5730525545099095e-06,
"loss": 0.4107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17914192378520966,
"step": 3680,
"valid_targets_mean": 4227.9,
"valid_targets_min": 783
},
{
"epoch": 5.626432391138273,
"grad_norm": 0.7773716945089362,
"learning_rate": 4.524707012054368e-06,
"loss": 0.4294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15195128321647644,
"step": 3685,
"valid_targets_mean": 2487.1,
"valid_targets_min": 1543
},
{
"epoch": 5.634071810542399,
"grad_norm": 0.7776984018425589,
"learning_rate": 4.476585764634975e-06,
"loss": 0.4114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1720089614391327,
"step": 3690,
"valid_targets_mean": 2077.1,
"valid_targets_min": 885
},
{
"epoch": 5.641711229946524,
"grad_norm": 0.7688079872450757,
"learning_rate": 4.4286895097090695e-06,
"loss": 0.4307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16758956015110016,
"step": 3695,
"valid_targets_mean": 2742.0,
"valid_targets_min": 1281
},
{
"epoch": 5.64935064935065,
"grad_norm": 0.8486912659015311,
"learning_rate": 4.381018941473037e-06,
"loss": 0.4381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19494405388832092,
"step": 3700,
"valid_targets_mean": 2297.6,
"valid_targets_min": 1116
},
{
"epoch": 5.656990068754775,
"grad_norm": 0.6372751365054492,
"learning_rate": 4.333574750852194e-06,
"loss": 0.4181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16869252920150757,
"step": 3705,
"valid_targets_mean": 3551.4,
"valid_targets_min": 1137
},
{
"epoch": 5.6646294881589,
"grad_norm": 0.7390356711726472,
"learning_rate": 4.2863576254908e-06,
"loss": 0.4226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2157163769006729,
"step": 3710,
"valid_targets_mean": 3476.8,
"valid_targets_min": 1540
},
{
"epoch": 5.6722689075630255,
"grad_norm": 0.6872901624459158,
"learning_rate": 4.239368249742102e-06,
"loss": 0.4236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13273492455482483,
"step": 3715,
"valid_targets_mean": 3911.5,
"valid_targets_min": 671
},
{
"epoch": 5.67990832696715,
"grad_norm": 0.6586970729788763,
"learning_rate": 4.192607304658387e-06,
"loss": 0.4125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2191186547279358,
"step": 3720,
"valid_targets_mean": 4228.1,
"valid_targets_min": 2073
},
{
"epoch": 5.687547746371276,
"grad_norm": 0.749146299694098,
"learning_rate": 4.146075467981125e-06,
"loss": 0.4663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23675943911075592,
"step": 3725,
"valid_targets_mean": 3733.4,
"valid_targets_min": 562
},
{
"epoch": 5.695187165775401,
"grad_norm": 0.7237635954729931,
"learning_rate": 4.09977341413115e-06,
"loss": 0.4271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2258036732673645,
"step": 3730,
"valid_targets_mean": 3386.2,
"valid_targets_min": 1131
},
{
"epoch": 5.702826585179526,
"grad_norm": 0.8123035113980734,
"learning_rate": 4.053701814198882e-06,
"loss": 0.4025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21003013849258423,
"step": 3735,
"valid_targets_mean": 2482.4,
"valid_targets_min": 673
},
{
"epoch": 5.710466004583652,
"grad_norm": 0.8015439623306877,
"learning_rate": 4.0078613359345884e-06,
"loss": 0.4187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21075120568275452,
"step": 3740,
"valid_targets_mean": 2767.1,
"valid_targets_min": 1106
},
{
"epoch": 5.718105423987777,
"grad_norm": 1.0739970964489634,
"learning_rate": 3.962252643738742e-06,
"loss": 0.4154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23278754949569702,
"step": 3745,
"valid_targets_mean": 4178.6,
"valid_targets_min": 2456
},
{
"epoch": 5.725744843391903,
"grad_norm": 0.8237327127175776,
"learning_rate": 3.916876398652338e-06,
"loss": 0.4236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19142091274261475,
"step": 3750,
"valid_targets_mean": 2622.1,
"valid_targets_min": 642
},
{
"epoch": 5.733384262796028,
"grad_norm": 0.7601068750941172,
"learning_rate": 3.8717332583473545e-06,
"loss": 0.4194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21591442823410034,
"step": 3755,
"valid_targets_mean": 2982.9,
"valid_targets_min": 960
},
{
"epoch": 5.741023682200153,
"grad_norm": 0.6831402579456276,
"learning_rate": 3.826823877117218e-06,
"loss": 0.402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23567482829093933,
"step": 3760,
"valid_targets_mean": 4372.5,
"valid_targets_min": 921
},
{
"epoch": 5.748663101604278,
"grad_norm": 0.7518305106243018,
"learning_rate": 3.7821489058672754e-06,
"loss": 0.3925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19822347164154053,
"step": 3765,
"valid_targets_mean": 2959.9,
"valid_targets_min": 1891
},
{
"epoch": 5.756302521008403,
"grad_norm": 0.7856806336487985,
"learning_rate": 3.7377089921054355e-06,
"loss": 0.4083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1958726942539215,
"step": 3770,
"valid_targets_mean": 2575.6,
"valid_targets_min": 1215
},
{
"epoch": 5.763941940412528,
"grad_norm": 0.820934440949876,
"learning_rate": 3.6935047799327107e-06,
"loss": 0.4336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23241233825683594,
"step": 3775,
"valid_targets_mean": 2996.4,
"valid_targets_min": 1430
},
{
"epoch": 5.771581359816654,
"grad_norm": 0.7654930925671581,
"learning_rate": 3.649536910033926e-06,
"loss": 0.4282,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29833102226257324,
"step": 3780,
"valid_targets_mean": 3378.2,
"valid_targets_min": 850
},
{
"epoch": 5.779220779220779,
"grad_norm": 0.6768166172539385,
"learning_rate": 3.605806019668432e-06,
"loss": 0.4232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1405220776796341,
"step": 3785,
"valid_targets_mean": 2789.8,
"valid_targets_min": 1081
},
{
"epoch": 5.786860198624905,
"grad_norm": 0.772007067318885,
"learning_rate": 3.562312742660825e-06,
"loss": 0.4247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20937494933605194,
"step": 3790,
"valid_targets_mean": 3826.2,
"valid_targets_min": 1032
},
{
"epoch": 5.79449961802903,
"grad_norm": 0.9119664688683919,
"learning_rate": 3.5190577093918266e-06,
"loss": 0.4449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2521716356277466,
"step": 3795,
"valid_targets_mean": 2620.5,
"valid_targets_min": 700
},
{
"epoch": 5.802139037433155,
"grad_norm": 0.7883929824332396,
"learning_rate": 3.476041546789095e-06,
"loss": 0.4243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16708248853683472,
"step": 3800,
"valid_targets_mean": 2520.9,
"valid_targets_min": 926
},
{
"epoch": 5.809778456837281,
"grad_norm": 0.7676063261588877,
"learning_rate": 3.433264878318159e-06,
"loss": 0.4288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1724417507648468,
"step": 3805,
"valid_targets_mean": 2547.8,
"valid_targets_min": 855
},
{
"epoch": 5.8174178762414055,
"grad_norm": 0.6236657792139778,
"learning_rate": 3.390728323973376e-06,
"loss": 0.4071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21887004375457764,
"step": 3810,
"valid_targets_mean": 3950.0,
"valid_targets_min": 1549
},
{
"epoch": 5.825057295645531,
"grad_norm": 0.6774652652821819,
"learning_rate": 3.3484325002689653e-06,
"loss": 0.4448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1620153933763504,
"step": 3815,
"valid_targets_mean": 2540.0,
"valid_targets_min": 937
},
{
"epoch": 5.832696715049656,
"grad_norm": 0.7869552702440537,
"learning_rate": 3.3063780202300365e-06,
"loss": 0.4425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21578902006149292,
"step": 3820,
"valid_targets_mean": 3193.5,
"valid_targets_min": 1207
},
{
"epoch": 5.840336134453781,
"grad_norm": 0.7777560326400809,
"learning_rate": 3.264565493383729e-06,
"loss": 0.4271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19921430945396423,
"step": 3825,
"valid_targets_mean": 2760.4,
"valid_targets_min": 812
},
{
"epoch": 5.847975553857907,
"grad_norm": 0.7448361766226455,
"learning_rate": 3.222995525750392e-06,
"loss": 0.3845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18640117347240448,
"step": 3830,
"valid_targets_mean": 2556.9,
"valid_targets_min": 793
},
{
"epoch": 5.855614973262032,
"grad_norm": 0.7582221040698467,
"learning_rate": 3.181668719834745e-06,
"loss": 0.4,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2028721570968628,
"step": 3835,
"valid_targets_mean": 2988.4,
"valid_targets_min": 1683
},
{
"epoch": 5.863254392666157,
"grad_norm": 0.8320638276938915,
"learning_rate": 3.14058567461722e-06,
"loss": 0.415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22501055896282196,
"step": 3840,
"valid_targets_mean": 3268.4,
"valid_targets_min": 761
},
{
"epoch": 5.870893812070283,
"grad_norm": 0.8161565674228954,
"learning_rate": 3.0997469855452222e-06,
"loss": 0.4349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24944055080413818,
"step": 3845,
"valid_targets_mean": 2357.2,
"valid_targets_min": 769
},
{
"epoch": 5.878533231474408,
"grad_norm": 0.7146833623918105,
"learning_rate": 3.0591532445245155e-06,
"loss": 0.4424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2273748219013214,
"step": 3850,
"valid_targets_mean": 3512.4,
"valid_targets_min": 425
},
{
"epoch": 5.8861726508785335,
"grad_norm": 0.7530428991334562,
"learning_rate": 3.0188050399106726e-06,
"loss": 0.414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22839196026325226,
"step": 3855,
"valid_targets_mean": 3654.9,
"valid_targets_min": 1410
},
{
"epoch": 5.893812070282658,
"grad_norm": 0.7187394717038206,
"learning_rate": 2.9787029565004856e-06,
"loss": 0.4129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16635143756866455,
"step": 3860,
"valid_targets_mean": 2724.4,
"valid_targets_min": 852
},
{
"epoch": 5.901451489686783,
"grad_norm": 0.8174325937619282,
"learning_rate": 2.93884757552356e-06,
"loss": 0.3855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2066618800163269,
"step": 3865,
"valid_targets_mean": 2795.5,
"valid_targets_min": 848
},
{
"epoch": 5.909090909090909,
"grad_norm": 0.809517014176693,
"learning_rate": 2.8992394746338457e-06,
"loss": 0.4305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21883273124694824,
"step": 3870,
"valid_targets_mean": 3162.0,
"valid_targets_min": 1149
},
{
"epoch": 5.916730328495034,
"grad_norm": 0.7913869749669057,
"learning_rate": 2.8598792279012745e-06,
"loss": 0.4229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2036246955394745,
"step": 3875,
"valid_targets_mean": 3123.5,
"valid_targets_min": 1275
},
{
"epoch": 5.92436974789916,
"grad_norm": 0.7449934448241319,
"learning_rate": 2.8207674058034374e-06,
"loss": 0.4367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19343721866607666,
"step": 3880,
"valid_targets_mean": 3974.1,
"valid_targets_min": 1119
},
{
"epoch": 5.932009167303285,
"grad_norm": 0.702412074741444,
"learning_rate": 2.7819045752173425e-06,
"loss": 0.3896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15918338298797607,
"step": 3885,
"valid_targets_mean": 3438.9,
"valid_targets_min": 1062
},
{
"epoch": 5.93964858670741,
"grad_norm": 0.7471411887353139,
"learning_rate": 2.7432912994111417e-06,
"loss": 0.4329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.206735759973526,
"step": 3890,
"valid_targets_mean": 3419.1,
"valid_targets_min": 1536
},
{
"epoch": 5.947288006111536,
"grad_norm": 0.78771027659784,
"learning_rate": 2.7049281380360382e-06,
"loss": 0.443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3115561008453369,
"step": 3895,
"valid_targets_mean": 3303.0,
"valid_targets_min": 705
},
{
"epoch": 5.954927425515661,
"grad_norm": 0.7524415873142796,
"learning_rate": 2.666815647118117e-06,
"loss": 0.4348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23538583517074585,
"step": 3900,
"valid_targets_mean": 3236.2,
"valid_targets_min": 1325
},
{
"epoch": 5.962566844919786,
"grad_norm": 0.6883297919046488,
"learning_rate": 2.6289543790503103e-06,
"loss": 0.4034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2727777659893036,
"step": 3905,
"valid_targets_mean": 4847.6,
"valid_targets_min": 1004
},
{
"epoch": 5.970206264323911,
"grad_norm": 0.7745226944687247,
"learning_rate": 2.591344882584401e-06,
"loss": 0.4449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19000530242919922,
"step": 3910,
"valid_targets_mean": 2781.6,
"valid_targets_min": 693
},
{
"epoch": 5.977845683728036,
"grad_norm": 0.6578254545339572,
"learning_rate": 2.5539877028230442e-06,
"loss": 0.4289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13370674848556519,
"step": 3915,
"valid_targets_mean": 2355.8,
"valid_targets_min": 869
},
{
"epoch": 5.985485103132162,
"grad_norm": 0.8718248131787556,
"learning_rate": 2.5168833812118855e-06,
"loss": 0.4427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21779406070709229,
"step": 3920,
"valid_targets_mean": 2524.6,
"valid_targets_min": 359
},
{
"epoch": 5.993124522536287,
"grad_norm": 0.6650728699135563,
"learning_rate": 2.480032455531707e-06,
"loss": 0.4061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17643976211547852,
"step": 3925,
"valid_targets_mean": 2614.1,
"valid_targets_min": 832
},
{
"epoch": 6.0,
"grad_norm": 1.031459537664997,
"learning_rate": 2.443435459890626e-06,
"loss": 0.4544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44087493419647217,
"step": 3930,
"valid_targets_mean": 3814.1,
"valid_targets_min": 1027
},
{
"epoch": 6.007639419404125,
"grad_norm": 0.6863931120269993,
"learning_rate": 2.4070929247163764e-06,
"loss": 0.4425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.252174437046051,
"step": 3935,
"valid_targets_mean": 3363.9,
"valid_targets_min": 851
},
{
"epoch": 6.015278838808251,
"grad_norm": 0.8065060516729766,
"learning_rate": 2.371005376748596e-06,
"loss": 0.381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19682547450065613,
"step": 3940,
"valid_targets_mean": 2635.6,
"valid_targets_min": 992
},
{
"epoch": 6.022918258212376,
"grad_norm": 0.6875190773960217,
"learning_rate": 2.3351733390312005e-06,
"loss": 0.4147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1877930611371994,
"step": 3945,
"valid_targets_mean": 3125.6,
"valid_targets_min": 1002
},
{
"epoch": 6.0305576776165015,
"grad_norm": 0.7113750000743607,
"learning_rate": 2.2995973309048013e-06,
"loss": 0.3916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18945392966270447,
"step": 3950,
"valid_targets_mean": 3022.5,
"valid_targets_min": 787
},
{
"epoch": 6.0381970970206265,
"grad_norm": 0.7668863834844798,
"learning_rate": 2.2642778679992007e-06,
"loss": 0.441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18376567959785461,
"step": 3955,
"valid_targets_mean": 2929.2,
"valid_targets_min": 1078
},
{
"epoch": 6.045836516424751,
"grad_norm": 0.6400997176841478,
"learning_rate": 2.2292154622258623e-06,
"loss": 0.4039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10822135210037231,
"step": 3960,
"valid_targets_mean": 2783.8,
"valid_targets_min": 1233
},
{
"epoch": 6.053475935828877,
"grad_norm": 0.6827622640359982,
"learning_rate": 2.194410621770566e-06,
"loss": 0.395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2305392324924469,
"step": 3965,
"valid_targets_mean": 4637.6,
"valid_targets_min": 1234
},
{
"epoch": 6.061115355233002,
"grad_norm": 0.6742130374126593,
"learning_rate": 2.1598638510859795e-06,
"loss": 0.3969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17292946577072144,
"step": 3970,
"valid_targets_mean": 3895.4,
"valid_targets_min": 1183
},
{
"epoch": 6.068754774637128,
"grad_norm": 0.7224201918662315,
"learning_rate": 2.1255756508843774e-06,
"loss": 0.4092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2280636876821518,
"step": 3975,
"valid_targets_mean": 3655.5,
"valid_targets_min": 550
},
{
"epoch": 6.076394194041253,
"grad_norm": 0.696693155288902,
"learning_rate": 2.0915465181303874e-06,
"loss": 0.4309,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18954971432685852,
"step": 3980,
"valid_targets_mean": 3254.5,
"valid_targets_min": 1125
},
{
"epoch": 6.084033613445378,
"grad_norm": 0.7159544890081604,
"learning_rate": 2.057776946033765e-06,
"loss": 0.396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17513585090637207,
"step": 3985,
"valid_targets_mean": 3132.8,
"valid_targets_min": 764
},
{
"epoch": 6.091673032849504,
"grad_norm": 0.7488349752843247,
"learning_rate": 2.0242674240422655e-06,
"loss": 0.404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14049875736236572,
"step": 3990,
"valid_targets_mean": 2235.8,
"valid_targets_min": 1256
},
{
"epoch": 6.099312452253629,
"grad_norm": 0.7563615274137214,
"learning_rate": 1.991018437834542e-06,
"loss": 0.4378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19269230961799622,
"step": 3995,
"valid_targets_mean": 3002.5,
"valid_targets_min": 794
},
{
"epoch": 6.106951871657754,
"grad_norm": 0.7581872453513444,
"learning_rate": 1.9580304693131015e-06,
"loss": 0.4248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2181900590658188,
"step": 4000,
"valid_targets_mean": 3014.9,
"valid_targets_min": 1194
},
{
"epoch": 6.114591291061879,
"grad_norm": 0.7927614418513154,
"learning_rate": 1.925303996597341e-06,
"loss": 0.3909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17333531379699707,
"step": 4005,
"valid_targets_mean": 2303.4,
"valid_targets_min": 1163
},
{
"epoch": 6.122230710466004,
"grad_norm": 0.6627386326218554,
"learning_rate": 1.8928394940165828e-06,
"loss": 0.422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21585026383399963,
"step": 4010,
"valid_targets_mean": 4336.9,
"valid_targets_min": 962
},
{
"epoch": 6.12987012987013,
"grad_norm": 0.6910708074716676,
"learning_rate": 1.860637432103234e-06,
"loss": 0.4067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18705642223358154,
"step": 4015,
"valid_targets_mean": 3601.0,
"valid_targets_min": 1149
},
{
"epoch": 6.137509549274255,
"grad_norm": 0.654947784139743,
"learning_rate": 1.8286982775859407e-06,
"loss": 0.3906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21154358983039856,
"step": 4020,
"valid_targets_mean": 4067.4,
"valid_targets_min": 944
},
{
"epoch": 6.145148968678381,
"grad_norm": 0.786026884990914,
"learning_rate": 1.7970224933828539e-06,
"loss": 0.4181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17581038177013397,
"step": 4025,
"valid_targets_mean": 2357.8,
"valid_targets_min": 1129
},
{
"epoch": 6.152788388082506,
"grad_norm": 0.6201923882409753,
"learning_rate": 1.7656105385948708e-06,
"loss": 0.3878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32060492038726807,
"step": 4030,
"valid_targets_mean": 6241.4,
"valid_targets_min": 531
},
{
"epoch": 6.160427807486631,
"grad_norm": 0.821742202354764,
"learning_rate": 1.7344628684990405e-06,
"loss": 0.4066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22368258237838745,
"step": 4035,
"valid_targets_mean": 2545.4,
"valid_targets_min": 871
},
{
"epoch": 6.168067226890757,
"grad_norm": 0.787669642326113,
"learning_rate": 1.7035799345419212e-06,
"loss": 0.4129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22682487964630127,
"step": 4040,
"valid_targets_mean": 3353.8,
"valid_targets_min": 712
},
{
"epoch": 6.1757066462948815,
"grad_norm": 0.647719500085238,
"learning_rate": 1.672962184333049e-06,
"loss": 0.4063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25017115473747253,
"step": 4045,
"valid_targets_mean": 4126.0,
"valid_targets_min": 1178
},
{
"epoch": 6.1833460656990065,
"grad_norm": 0.7747670126199028,
"learning_rate": 1.6426100616384654e-06,
"loss": 0.4065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16823174059391022,
"step": 4050,
"valid_targets_mean": 2440.1,
"valid_targets_min": 1561
},
{
"epoch": 6.190985485103132,
"grad_norm": 0.7476785216452516,
"learning_rate": 1.6125240063742565e-06,
"loss": 0.3991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19015461206436157,
"step": 4055,
"valid_targets_mean": 3180.9,
"valid_targets_min": 903
},
{
"epoch": 6.198624904507257,
"grad_norm": 0.7815290028556419,
"learning_rate": 1.582704454600208e-06,
"loss": 0.3961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18614669144153595,
"step": 4060,
"valid_targets_mean": 2710.0,
"valid_targets_min": 683
},
{
"epoch": 6.206264323911383,
"grad_norm": 0.727274439614293,
"learning_rate": 1.5531518385134625e-06,
"loss": 0.3997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15869663655757904,
"step": 4065,
"valid_targets_mean": 2874.2,
"valid_targets_min": 740
},
{
"epoch": 6.213903743315508,
"grad_norm": 0.7405238943348815,
"learning_rate": 1.5238665864422665e-06,
"loss": 0.4392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18218465149402618,
"step": 4070,
"valid_targets_mean": 2788.8,
"valid_targets_min": 1449
},
{
"epoch": 6.221543162719633,
"grad_norm": 0.6971040390142008,
"learning_rate": 1.4948491228397544e-06,
"loss": 0.3981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15370672941207886,
"step": 4075,
"valid_targets_mean": 2588.0,
"valid_targets_min": 1384
},
{
"epoch": 6.229182582123759,
"grad_norm": 0.6481267442709662,
"learning_rate": 1.4660998682778105e-06,
"loss": 0.3941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17396646738052368,
"step": 4080,
"valid_targets_mean": 3749.6,
"valid_targets_min": 1736
},
{
"epoch": 6.236822001527884,
"grad_norm": 0.7595999593253812,
"learning_rate": 1.4376192394409571e-06,
"loss": 0.3894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15226925909519196,
"step": 4085,
"valid_targets_mean": 1917.9,
"valid_targets_min": 828
},
{
"epoch": 6.2444614209320095,
"grad_norm": 0.7375012589840757,
"learning_rate": 1.409407649120318e-06,
"loss": 0.4365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2002945989370346,
"step": 4090,
"valid_targets_mean": 3363.8,
"valid_targets_min": 1323
},
{
"epoch": 6.2521008403361344,
"grad_norm": 0.6737898597954428,
"learning_rate": 1.38146550620766e-06,
"loss": 0.4201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18218186497688293,
"step": 4095,
"valid_targets_mean": 3539.6,
"valid_targets_min": 1262
},
{
"epoch": 6.259740259740259,
"grad_norm": 0.7675540823076344,
"learning_rate": 1.353793215689414e-06,
"loss": 0.4405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2069307118654251,
"step": 4100,
"valid_targets_mean": 2938.4,
"valid_targets_min": 1579
},
{
"epoch": 6.267379679144385,
"grad_norm": 0.8436198032007797,
"learning_rate": 1.326391178640869e-06,
"loss": 0.4023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20973223447799683,
"step": 4105,
"valid_targets_mean": 2793.8,
"valid_targets_min": 1364
},
{
"epoch": 6.27501909854851,
"grad_norm": 0.8653534524601917,
"learning_rate": 1.2992597922203087e-06,
"loss": 0.4166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17687362432479858,
"step": 4110,
"valid_targets_mean": 2699.1,
"valid_targets_min": 605
},
{
"epoch": 6.282658517952636,
"grad_norm": 0.7695788197633405,
"learning_rate": 1.2723994496632775e-06,
"loss": 0.389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24052169919013977,
"step": 4115,
"valid_targets_mean": 3462.8,
"valid_targets_min": 695
},
{
"epoch": 6.290297937356761,
"grad_norm": 0.9251655508633336,
"learning_rate": 1.2458105402768905e-06,
"loss": 0.4135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18550032377243042,
"step": 4120,
"valid_targets_mean": 1907.9,
"valid_targets_min": 1138
},
{
"epoch": 6.297937356760886,
"grad_norm": 0.9075744467608439,
"learning_rate": 1.2194934494341548e-06,
"loss": 0.4354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1659584939479828,
"step": 4125,
"valid_targets_mean": 1987.1,
"valid_targets_min": 807
},
{
"epoch": 6.305576776165012,
"grad_norm": 0.8343949143994032,
"learning_rate": 1.1934485585684286e-06,
"loss": 0.4045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18994081020355225,
"step": 4130,
"valid_targets_mean": 2424.1,
"valid_targets_min": 716
},
{
"epoch": 6.313216195569137,
"grad_norm": 0.7719958475586056,
"learning_rate": 1.1676762451678592e-06,
"loss": 0.4074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15388676524162292,
"step": 4135,
"valid_targets_mean": 1865.9,
"valid_targets_min": 718
},
{
"epoch": 6.320855614973262,
"grad_norm": 0.6607601792071848,
"learning_rate": 1.1421768827699297e-06,
"loss": 0.3883,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21211379766464233,
"step": 4140,
"valid_targets_mean": 3929.9,
"valid_targets_min": 924
},
{
"epoch": 6.328495034377387,
"grad_norm": 0.6647948062348348,
"learning_rate": 1.1169508409560326e-06,
"loss": 0.3842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14956669509410858,
"step": 4145,
"valid_targets_mean": 3332.8,
"valid_targets_min": 1628
},
{
"epoch": 6.336134453781512,
"grad_norm": 0.8833312270676275,
"learning_rate": 1.091998485346133e-06,
"loss": 0.4035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2864078879356384,
"step": 4150,
"valid_targets_mean": 3066.8,
"valid_targets_min": 560
},
{
"epoch": 6.343773873185638,
"grad_norm": 0.5784561383842487,
"learning_rate": 1.067320177593445e-06,
"loss": 0.4323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2022693157196045,
"step": 4155,
"valid_targets_mean": 5883.6,
"valid_targets_min": 1397
},
{
"epoch": 6.351413292589763,
"grad_norm": 0.7000964975069451,
"learning_rate": 1.0429162753792044e-06,
"loss": 0.3926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17252172529697418,
"step": 4160,
"valid_targets_mean": 3317.1,
"valid_targets_min": 895
},
{
"epoch": 6.359052711993888,
"grad_norm": 0.8238761195026589,
"learning_rate": 1.0187871324074817e-06,
"loss": 0.3856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1751250922679901,
"step": 4165,
"valid_targets_mean": 2360.1,
"valid_targets_min": 867
},
{
"epoch": 6.366692131398014,
"grad_norm": 0.6494877601984028,
"learning_rate": 9.94933098400055e-07,
"loss": 0.4099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22490882873535156,
"step": 4170,
"valid_targets_mean": 4196.5,
"valid_targets_min": 1234
},
{
"epoch": 6.374331550802139,
"grad_norm": 0.8728852143884642,
"learning_rate": 9.713545190913476e-07,
"loss": 0.4277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.201102614402771,
"step": 4175,
"valid_targets_mean": 2424.6,
"valid_targets_min": 814
},
{
"epoch": 6.381970970206265,
"grad_norm": 0.749192164055093,
"learning_rate": 9.480517362234032e-07,
"loss": 0.3976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2019495815038681,
"step": 4180,
"valid_targets_mean": 3497.0,
"valid_targets_min": 1721
},
{
"epoch": 6.3896103896103895,
"grad_norm": 0.638180410821364,
"learning_rate": 9.250250875409383e-07,
"loss": 0.393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14714564383029938,
"step": 4185,
"valid_targets_mean": 3203.1,
"valid_targets_min": 1783
},
{
"epoch": 6.3972498090145145,
"grad_norm": 0.8607560920587862,
"learning_rate": 9.022749067864689e-07,
"loss": 0.3939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2053133249282837,
"step": 4190,
"valid_targets_mean": 2401.1,
"valid_targets_min": 320
},
{
"epoch": 6.40488922841864,
"grad_norm": 0.7670657586929429,
"learning_rate": 8.798015236954227e-07,
"loss": 0.3922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17581060528755188,
"step": 4195,
"valid_targets_mean": 2269.9,
"valid_targets_min": 359
},
{
"epoch": 6.412528647822765,
"grad_norm": 0.7059107747645008,
"learning_rate": 8.57605263991419e-07,
"loss": 0.3943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19902944564819336,
"step": 4200,
"valid_targets_mean": 3872.6,
"valid_targets_min": 1255
},
{
"epoch": 6.420168067226891,
"grad_norm": 0.7986131923796598,
"learning_rate": 8.356864493815075e-07,
"loss": 0.3897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16714152693748474,
"step": 4205,
"valid_targets_mean": 2283.8,
"valid_targets_min": 1434
},
{
"epoch": 6.427807486631016,
"grad_norm": 0.7984289049100618,
"learning_rate": 8.14045397551515e-07,
"loss": 0.4303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19162634015083313,
"step": 4210,
"valid_targets_mean": 2795.0,
"valid_targets_min": 1235
},
{
"epoch": 6.435446906035141,
"grad_norm": 1.951568058224522,
"learning_rate": 7.926824221614504e-07,
"loss": 0.394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23274573683738708,
"step": 4215,
"valid_targets_mean": 2335.2,
"valid_targets_min": 1209
},
{
"epoch": 6.443086325439267,
"grad_norm": 0.7101960443226988,
"learning_rate": 7.715978328409557e-07,
"loss": 0.438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1813594102859497,
"step": 4220,
"valid_targets_mean": 3580.1,
"valid_targets_min": 1070
},
{
"epoch": 6.450725744843392,
"grad_norm": 0.6571344450932545,
"learning_rate": 7.507919351847981e-07,
"loss": 0.4103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18891257047653198,
"step": 4225,
"valid_targets_mean": 4464.8,
"valid_targets_min": 2225
},
{
"epoch": 6.4583651642475175,
"grad_norm": 0.7851602265875163,
"learning_rate": 7.30265030748476e-07,
"loss": 0.423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21480068564414978,
"step": 4230,
"valid_targets_mean": 2892.2,
"valid_targets_min": 925
},
{
"epoch": 6.466004583651642,
"grad_norm": 0.8880996159628666,
"learning_rate": 7.100174170438201e-07,
"loss": 0.4379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25237733125686646,
"step": 4235,
"valid_targets_mean": 2963.4,
"valid_targets_min": 1664
},
{
"epoch": 6.473644003055767,
"grad_norm": 0.7559016985627138,
"learning_rate": 6.900493875346881e-07,
"loss": 0.4064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1809263825416565,
"step": 4240,
"valid_targets_mean": 2675.2,
"valid_targets_min": 707
},
{
"epoch": 6.481283422459893,
"grad_norm": 0.8329205888133813,
"learning_rate": 6.703612316327235e-07,
"loss": 0.3957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18009233474731445,
"step": 4245,
"valid_targets_mean": 2314.6,
"valid_targets_min": 336
},
{
"epoch": 6.488922841864018,
"grad_norm": 0.7520955113985317,
"learning_rate": 6.509532346931458e-07,
"loss": 0.427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29548799991607666,
"step": 4250,
"valid_targets_mean": 4104.2,
"valid_targets_min": 1550
},
{
"epoch": 6.496562261268144,
"grad_norm": 0.6690947855209332,
"learning_rate": 6.318256780106202e-07,
"loss": 0.3992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18764840066432953,
"step": 4255,
"valid_targets_mean": 3462.2,
"valid_targets_min": 1657
},
{
"epoch": 6.504201680672269,
"grad_norm": 0.7368821627461865,
"learning_rate": 6.129788388151837e-07,
"loss": 0.4374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1427152156829834,
"step": 4260,
"valid_targets_mean": 2727.9,
"valid_targets_min": 1300
},
{
"epoch": 6.511841100076394,
"grad_norm": 0.71263809616908,
"learning_rate": 5.94412990268216e-07,
"loss": 0.4113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2381899654865265,
"step": 4265,
"valid_targets_mean": 3497.4,
"valid_targets_min": 897
},
{
"epoch": 6.51948051948052,
"grad_norm": 0.6447965631661843,
"learning_rate": 5.761284014585044e-07,
"loss": 0.4191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14833205938339233,
"step": 4270,
"valid_targets_mean": 4181.8,
"valid_targets_min": 1642
},
{
"epoch": 6.527119938884645,
"grad_norm": 0.9278788809414662,
"learning_rate": 5.581253373983097e-07,
"loss": 0.4025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31120574474334717,
"step": 4275,
"valid_targets_mean": 2991.6,
"valid_targets_min": 1091
},
{
"epoch": 6.53475935828877,
"grad_norm": 0.8206199783968727,
"learning_rate": 5.404040590195548e-07,
"loss": 0.4055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21243171393871307,
"step": 4280,
"valid_targets_mean": 3095.6,
"valid_targets_min": 938
},
{
"epoch": 6.542398777692895,
"grad_norm": 0.7123021318130813,
"learning_rate": 5.229648231700246e-07,
"loss": 0.4031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1695111095905304,
"step": 4285,
"valid_targets_mean": 3057.0,
"valid_targets_min": 959
},
{
"epoch": 6.55003819709702,
"grad_norm": 0.7367430336219517,
"learning_rate": 5.058078826096613e-07,
"loss": 0.4204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15544866025447845,
"step": 4290,
"valid_targets_mean": 2747.5,
"valid_targets_min": 823
},
{
"epoch": 6.557677616501146,
"grad_norm": 0.8256976164624099,
"learning_rate": 4.889334860068706e-07,
"loss": 0.4115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25187405943870544,
"step": 4295,
"valid_targets_mean": 3789.0,
"valid_targets_min": 1256
},
{
"epoch": 6.565317035905271,
"grad_norm": 0.7000989539122991,
"learning_rate": 4.723418779349542e-07,
"loss": 0.3866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18330548703670502,
"step": 4300,
"valid_targets_mean": 3228.8,
"valid_targets_min": 875
},
{
"epoch": 6.572956455309397,
"grad_norm": 0.7769235104940684,
"learning_rate": 4.560332988685412e-07,
"loss": 0.426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16183039546012878,
"step": 4305,
"valid_targets_mean": 2477.9,
"valid_targets_min": 842
},
{
"epoch": 6.580595874713522,
"grad_norm": 0.8338757429293011,
"learning_rate": 4.40007985180102e-07,
"loss": 0.3835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1706201136112213,
"step": 4310,
"valid_targets_mean": 2273.8,
"valid_targets_min": 826
},
{
"epoch": 6.588235294117647,
"grad_norm": 0.9735838755677048,
"learning_rate": 4.242661691365446e-07,
"loss": 0.4255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2386619746685028,
"step": 4315,
"valid_targets_mean": 2037.2,
"valid_targets_min": 690
},
{
"epoch": 6.595874713521773,
"grad_norm": 0.8316266447924147,
"learning_rate": 4.088080788958171e-07,
"loss": 0.3911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20971032977104187,
"step": 4320,
"valid_targets_mean": 2690.0,
"valid_targets_min": 849
},
{
"epoch": 6.6035141329258975,
"grad_norm": 0.944056483188538,
"learning_rate": 3.936339385036236e-07,
"loss": 0.41,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18069300055503845,
"step": 4325,
"valid_targets_mean": 1738.2,
"valid_targets_min": 928
},
{
"epoch": 6.611153552330023,
"grad_norm": 0.7536331411489621,
"learning_rate": 3.787439678901739e-07,
"loss": 0.395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14931751787662506,
"step": 4330,
"valid_targets_mean": 2758.6,
"valid_targets_min": 735
},
{
"epoch": 6.618792971734148,
"grad_norm": 0.7552466450639199,
"learning_rate": 3.641383828669831e-07,
"loss": 0.4145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22667306661605835,
"step": 4335,
"valid_targets_mean": 4108.0,
"valid_targets_min": 998
},
{
"epoch": 6.626432391138273,
"grad_norm": 0.7452294813232219,
"learning_rate": 3.498173951237593e-07,
"loss": 0.4177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18081125617027283,
"step": 4340,
"valid_targets_mean": 2849.5,
"valid_targets_min": 568
},
{
"epoch": 6.634071810542399,
"grad_norm": 0.7645301896963309,
"learning_rate": 3.3578121222532565e-07,
"loss": 0.4204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17134138941764832,
"step": 4345,
"valid_targets_mean": 2639.2,
"valid_targets_min": 759
},
{
"epoch": 6.641711229946524,
"grad_norm": 0.6464171031333205,
"learning_rate": 3.2203003760861827e-07,
"loss": 0.4402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2736469507217407,
"step": 4350,
"valid_targets_mean": 4797.0,
"valid_targets_min": 1765
},
{
"epoch": 6.64935064935065,
"grad_norm": 0.9127196120836408,
"learning_rate": 3.085640705797266e-07,
"loss": 0.4008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24204598367214203,
"step": 4355,
"valid_targets_mean": 3617.4,
"valid_targets_min": 852
},
{
"epoch": 6.656990068754775,
"grad_norm": 0.685182853452726,
"learning_rate": 2.953835063110222e-07,
"loss": 0.3911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20241063833236694,
"step": 4360,
"valid_targets_mean": 3864.1,
"valid_targets_min": 1061
},
{
"epoch": 6.6646294881589,
"grad_norm": 0.6833217903769809,
"learning_rate": 2.824885358383123e-07,
"loss": 0.4095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13412925601005554,
"step": 4365,
"valid_targets_mean": 2417.9,
"valid_targets_min": 1237
},
{
"epoch": 6.6722689075630255,
"grad_norm": 0.785494709686734,
"learning_rate": 2.6987934605808617e-07,
"loss": 0.454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19218818843364716,
"step": 4370,
"valid_targets_mean": 2367.4,
"valid_targets_min": 1093
},
{
"epoch": 6.67990832696715,
"grad_norm": 0.7628862307702344,
"learning_rate": 2.575561197247911e-07,
"loss": 0.4354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21473418176174164,
"step": 4375,
"valid_targets_mean": 3552.5,
"valid_targets_min": 662
},
{
"epoch": 6.687547746371276,
"grad_norm": 0.7289251185774825,
"learning_rate": 2.4551903544819625e-07,
"loss": 0.3982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19578754901885986,
"step": 4380,
"valid_targets_mean": 4277.5,
"valid_targets_min": 882
},
{
"epoch": 6.695187165775401,
"grad_norm": 0.7546985683585661,
"learning_rate": 2.3376826769080153e-07,
"loss": 0.3993,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24338172376155853,
"step": 4385,
"valid_targets_mean": 3920.4,
"valid_targets_min": 425
},
{
"epoch": 6.702826585179526,
"grad_norm": 0.7218443448066771,
"learning_rate": 2.2230398676529763e-07,
"loss": 0.3856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2012680470943451,
"step": 4390,
"valid_targets_mean": 3084.5,
"valid_targets_min": 1056
},
{
"epoch": 6.710466004583652,
"grad_norm": 0.7629253125535567,
"learning_rate": 2.1112635883211663e-07,
"loss": 0.4006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18300996720790863,
"step": 4395,
"valid_targets_mean": 2941.1,
"valid_targets_min": 1379
},
{
"epoch": 6.718105423987777,
"grad_norm": 0.8426812792697609,
"learning_rate": 2.0023554589701177e-07,
"loss": 0.4371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2638070583343506,
"step": 4400,
"valid_targets_mean": 3378.0,
"valid_targets_min": 1189
},
{
"epoch": 6.725744843391903,
"grad_norm": 0.9125345695540272,
"learning_rate": 1.8963170580870384e-07,
"loss": 0.3804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2333306074142456,
"step": 4405,
"valid_targets_mean": 3033.8,
"valid_targets_min": 735
},
{
"epoch": 6.733384262796028,
"grad_norm": 0.7491072210513785,
"learning_rate": 1.793149922566051e-07,
"loss": 0.389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18493598699569702,
"step": 4410,
"valid_targets_mean": 2844.1,
"valid_targets_min": 1499
},
{
"epoch": 6.741023682200153,
"grad_norm": 0.7075668630390985,
"learning_rate": 1.6928555476859454e-07,
"loss": 0.3947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26151540875434875,
"step": 4415,
"valid_targets_mean": 3931.2,
"valid_targets_min": 1108
},
{
"epoch": 6.748663101604278,
"grad_norm": 0.6953662547298742,
"learning_rate": 1.5954353870883289e-07,
"loss": 0.3938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18146592378616333,
"step": 4420,
"valid_targets_mean": 3214.6,
"valid_targets_min": 1157
},
{
"epoch": 6.756302521008403,
"grad_norm": 0.8442580153908322,
"learning_rate": 1.500890852756709e-07,
"loss": 0.424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2436636984348297,
"step": 4425,
"valid_targets_mean": 3346.9,
"valid_targets_min": 945
},
{
"epoch": 6.763941940412528,
"grad_norm": 0.7756874677183939,
"learning_rate": 1.409223314996e-07,
"loss": 0.4071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21483536064624786,
"step": 4430,
"valid_targets_mean": 2961.0,
"valid_targets_min": 989
},
{
"epoch": 6.771581359816654,
"grad_norm": 0.7526769191170677,
"learning_rate": 1.3204341024125822e-07,
"loss": 0.4216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28000983595848083,
"step": 4435,
"valid_targets_mean": 3804.1,
"valid_targets_min": 799
},
{
"epoch": 6.779220779220779,
"grad_norm": 0.7084850932543485,
"learning_rate": 1.234524501895207e-07,
"loss": 0.4104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1803816705942154,
"step": 4440,
"valid_targets_mean": 3388.8,
"valid_targets_min": 717
},
{
"epoch": 6.786860198624905,
"grad_norm": 0.6995301576820601,
"learning_rate": 1.1514957585961884e-07,
"loss": 0.4265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2403801530599594,
"step": 4445,
"valid_targets_mean": 3688.4,
"valid_targets_min": 856
},
{
"epoch": 6.79449961802903,
"grad_norm": 0.7980224363102327,
"learning_rate": 1.0713490759133749e-07,
"loss": 0.4298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24173349142074585,
"step": 4450,
"valid_targets_mean": 3873.1,
"valid_targets_min": 778
},
{
"epoch": 6.802139037433155,
"grad_norm": 0.938657736390237,
"learning_rate": 9.940856154728285e-08,
"loss": 0.4038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2338993102312088,
"step": 4455,
"valid_targets_mean": 2365.4,
"valid_targets_min": 868
},
{
"epoch": 6.809778456837281,
"grad_norm": 0.7970620171037146,
"learning_rate": 9.197064971118608e-08,
"loss": 0.4128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1684938669204712,
"step": 4460,
"valid_targets_mean": 2387.1,
"valid_targets_min": 953
},
{
"epoch": 6.8174178762414055,
"grad_norm": 0.7990434021559547,
"learning_rate": 8.482127988628686e-08,
"loss": 0.3957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20925235748291016,
"step": 4465,
"valid_targets_mean": 3208.0,
"valid_targets_min": 722
},
{
"epoch": 6.825057295645531,
"grad_norm": 0.711948338122833,
"learning_rate": 7.79605556937657e-08,
"loss": 0.3905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22843460738658905,
"step": 4470,
"valid_targets_mean": 3919.1,
"valid_targets_min": 1615
},
{
"epoch": 6.832696715049656,
"grad_norm": 0.7448708465075117,
"learning_rate": 7.138857657125187e-08,
"loss": 0.3832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16185849905014038,
"step": 4475,
"valid_targets_mean": 2761.2,
"valid_targets_min": 1180
},
{
"epoch": 6.840336134453781,
"grad_norm": 0.7579937641972179,
"learning_rate": 6.510543777136446e-08,
"loss": 0.4065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20061391592025757,
"step": 4480,
"valid_targets_mean": 3314.9,
"valid_targets_min": 823
},
{
"epoch": 6.847975553857907,
"grad_norm": 0.7907444070235546,
"learning_rate": 5.9111230360358044e-08,
"loss": 0.4075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.186139315366745,
"step": 4485,
"valid_targets_mean": 2889.6,
"valid_targets_min": 1288
},
{
"epoch": 6.855614973262032,
"grad_norm": 0.6975648733688181,
"learning_rate": 5.340604121677251e-08,
"loss": 0.4429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2715853750705719,
"step": 4490,
"valid_targets_mean": 5079.4,
"valid_targets_min": 939
},
{
"epoch": 6.863254392666157,
"grad_norm": 0.7829068945896205,
"learning_rate": 4.798995303020082e-08,
"loss": 0.4006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18688000738620758,
"step": 4495,
"valid_targets_mean": 3115.0,
"valid_targets_min": 1063
},
{
"epoch": 6.870893812070283,
"grad_norm": 0.810646499172978,
"learning_rate": 4.286304430006993e-08,
"loss": 0.4184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2315147966146469,
"step": 4500,
"valid_targets_mean": 3839.6,
"valid_targets_min": 1121
},
{
"epoch": 6.878533231474408,
"grad_norm": 0.7619179750430908,
"learning_rate": 3.802538933451949e-08,
"loss": 0.3843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1792149543762207,
"step": 4505,
"valid_targets_mean": 3125.1,
"valid_targets_min": 503
},
{
"epoch": 6.8861726508785335,
"grad_norm": 0.7682971319843082,
"learning_rate": 3.34770582493138e-08,
"loss": 0.3997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17539235949516296,
"step": 4510,
"valid_targets_mean": 2813.1,
"valid_targets_min": 694
},
{
"epoch": 6.893812070282658,
"grad_norm": 0.845749955999027,
"learning_rate": 2.921811696682708e-08,
"loss": 0.4075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2827659845352173,
"step": 4515,
"valid_targets_mean": 3597.2,
"valid_targets_min": 517
},
{
"epoch": 6.901451489686783,
"grad_norm": 0.690837425334579,
"learning_rate": 2.5248627215093135e-08,
"loss": 0.415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1957932710647583,
"step": 4520,
"valid_targets_mean": 3684.2,
"valid_targets_min": 1370
},
{
"epoch": 6.909090909090909,
"grad_norm": 0.6881716196186753,
"learning_rate": 2.1568646526906045e-08,
"loss": 0.4057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14163070917129517,
"step": 4525,
"valid_targets_mean": 2711.8,
"valid_targets_min": 1141
},
{
"epoch": 6.916730328495034,
"grad_norm": 0.7723694993387338,
"learning_rate": 1.8178228238985296e-08,
"loss": 0.4415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16728349030017853,
"step": 4530,
"valid_targets_mean": 2791.1,
"valid_targets_min": 2107
},
{
"epoch": 6.92436974789916,
"grad_norm": 0.7098507533235618,
"learning_rate": 1.507742149121194e-08,
"loss": 0.438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1468479186296463,
"step": 4535,
"valid_targets_mean": 2866.5,
"valid_targets_min": 813
},
{
"epoch": 6.932009167303285,
"grad_norm": 0.7742964005350101,
"learning_rate": 1.2266271225902515e-08,
"loss": 0.406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18890097737312317,
"step": 4540,
"valid_targets_mean": 3014.0,
"valid_targets_min": 1478
},
{
"epoch": 6.93964858670741,
"grad_norm": 0.7371062150413249,
"learning_rate": 9.744818187169547e-09,
"loss": 0.4244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25650227069854736,
"step": 4545,
"valid_targets_mean": 4534.8,
"valid_targets_min": 1061
},
{
"epoch": 6.947288006111536,
"grad_norm": 0.7581755468751333,
"learning_rate": 7.513098920324257e-09,
"loss": 0.4061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18233633041381836,
"step": 4550,
"valid_targets_mean": 3266.2,
"valid_targets_min": 1629
},
{
"epoch": 6.954927425515661,
"grad_norm": 0.8049076099781532,
"learning_rate": 5.571145771345876e-09,
"loss": 0.4024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2446897178888321,
"step": 4555,
"valid_targets_mean": 3738.0,
"valid_targets_min": 1564
},
{
"epoch": 6.962566844919786,
"grad_norm": 0.8164662192077489,
"learning_rate": 3.918986886424225e-09,
"loss": 0.3819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18588244915008545,
"step": 4560,
"valid_targets_mean": 3562.0,
"valid_targets_min": 1451
},
{
"epoch": 6.970206264323911,
"grad_norm": 0.8168583040167611,
"learning_rate": 2.5566462115333978e-09,
"loss": 0.4236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27808865904808044,
"step": 4565,
"valid_targets_mean": 2969.0,
"valid_targets_min": 948
},
{
"epoch": 6.977845683728036,
"grad_norm": 0.7599055862581678,
"learning_rate": 1.484143492100909e-09,
"loss": 0.3961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16413216292858124,
"step": 4570,
"valid_targets_mean": 2781.8,
"valid_targets_min": 643
},
{
"epoch": 6.985485103132162,
"grad_norm": 0.855562431244123,
"learning_rate": 7.014942727145979e-10,
"loss": 0.4307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20022156834602356,
"step": 4575,
"valid_targets_mean": 2384.5,
"valid_targets_min": 438
},
{
"epoch": 6.993124522536287,
"grad_norm": 0.6722570494176869,
"learning_rate": 2.0870989689614208e-10,
"loss": 0.408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2858823537826538,
"step": 4580,
"valid_targets_mean": 4627.0,
"valid_targets_min": 859
},
{
"epoch": 7.0,
"grad_norm": 1.1970404627629374,
"learning_rate": 5.797506938964859e-12,
"loss": 0.3911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35643327236175537,
"step": 4585,
"valid_targets_mean": 2517.8,
"valid_targets_min": 562
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35643327236175537,
"step": 4585,
"total_flos": 1.0328415967578685e+18,
"train_loss": 0.4849937954541771,
"train_runtime": 33081.3008,
"train_samples_per_second": 2.216,
"train_steps_per_second": 0.139,
"valid_targets_mean": 2517.8,
"valid_targets_min": 562
}
],
"logging_steps": 5,
"max_steps": 4585,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1.0328415967578685e+18,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}