penfever's picture
End of training
d51befb verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4368,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.008012820512820512,
"grad_norm": 8.40942474050559,
"learning_rate": 3.661327231121282e-07,
"loss": 0.8612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4234336018562317,
"step": 5,
"valid_targets_mean": 2232.1,
"valid_targets_min": 951
},
{
"epoch": 0.016025641025641024,
"grad_norm": 8.48364139790815,
"learning_rate": 8.237986270022884e-07,
"loss": 0.8812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4549936056137085,
"step": 10,
"valid_targets_mean": 2954.6,
"valid_targets_min": 2024
},
{
"epoch": 0.02403846153846154,
"grad_norm": 8.720393584369761,
"learning_rate": 1.2814645308924487e-06,
"loss": 0.9171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4603043496608734,
"step": 15,
"valid_targets_mean": 2330.5,
"valid_targets_min": 1188
},
{
"epoch": 0.03205128205128205,
"grad_norm": 6.401065214818598,
"learning_rate": 1.7391304347826088e-06,
"loss": 0.8352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3336380124092102,
"step": 20,
"valid_targets_mean": 1985.0,
"valid_targets_min": 455
},
{
"epoch": 0.04006410256410257,
"grad_norm": 4.816552094508015,
"learning_rate": 2.196796338672769e-06,
"loss": 0.8584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40010353922843933,
"step": 25,
"valid_targets_mean": 2756.9,
"valid_targets_min": 929
},
{
"epoch": 0.04807692307692308,
"grad_norm": 4.335386813313282,
"learning_rate": 2.654462242562929e-06,
"loss": 0.7732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4342009425163269,
"step": 30,
"valid_targets_mean": 2161.2,
"valid_targets_min": 1193
},
{
"epoch": 0.05608974358974359,
"grad_norm": 3.177645784938531,
"learning_rate": 3.1121281464530894e-06,
"loss": 0.748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3209277391433716,
"step": 35,
"valid_targets_mean": 2150.0,
"valid_targets_min": 1202
},
{
"epoch": 0.0641025641025641,
"grad_norm": 2.628557761103501,
"learning_rate": 3.56979405034325e-06,
"loss": 0.7037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3309406638145447,
"step": 40,
"valid_targets_mean": 2116.4,
"valid_targets_min": 475
},
{
"epoch": 0.07211538461538461,
"grad_norm": 1.7033923530978847,
"learning_rate": 4.0274599542334094e-06,
"loss": 0.679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24123963713645935,
"step": 45,
"valid_targets_mean": 1675.2,
"valid_targets_min": 435
},
{
"epoch": 0.08012820512820513,
"grad_norm": 1.4563809782956156,
"learning_rate": 4.48512585812357e-06,
"loss": 0.6983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31092941761016846,
"step": 50,
"valid_targets_mean": 2253.2,
"valid_targets_min": 1095
},
{
"epoch": 0.08814102564102565,
"grad_norm": 1.205430924212798,
"learning_rate": 4.94279176201373e-06,
"loss": 0.6497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3203188180923462,
"step": 55,
"valid_targets_mean": 2870.5,
"valid_targets_min": 721
},
{
"epoch": 0.09615384615384616,
"grad_norm": 1.1392627369044308,
"learning_rate": 5.400457665903891e-06,
"loss": 0.6527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30013489723205566,
"step": 60,
"valid_targets_mean": 2388.1,
"valid_targets_min": 1013
},
{
"epoch": 0.10416666666666667,
"grad_norm": 1.1352639246979592,
"learning_rate": 5.858123569794051e-06,
"loss": 0.5812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.349726140499115,
"step": 65,
"valid_targets_mean": 2654.9,
"valid_targets_min": 1101
},
{
"epoch": 0.11217948717948718,
"grad_norm": 0.9808130025882383,
"learning_rate": 6.31578947368421e-06,
"loss": 0.5923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3157884478569031,
"step": 70,
"valid_targets_mean": 2987.8,
"valid_targets_min": 1489
},
{
"epoch": 0.1201923076923077,
"grad_norm": 0.9209470326055519,
"learning_rate": 6.773455377574372e-06,
"loss": 0.6071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3476266860961914,
"step": 75,
"valid_targets_mean": 2909.8,
"valid_targets_min": 1067
},
{
"epoch": 0.1282051282051282,
"grad_norm": 0.9674711198015653,
"learning_rate": 7.231121281464531e-06,
"loss": 0.5622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25228625535964966,
"step": 80,
"valid_targets_mean": 2015.8,
"valid_targets_min": 1036
},
{
"epoch": 0.1362179487179487,
"grad_norm": 0.9614682889742122,
"learning_rate": 7.688787185354691e-06,
"loss": 0.5662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23659241199493408,
"step": 85,
"valid_targets_mean": 1919.0,
"valid_targets_min": 876
},
{
"epoch": 0.14423076923076922,
"grad_norm": 0.9793609220779523,
"learning_rate": 8.146453089244852e-06,
"loss": 0.5578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2640606164932251,
"step": 90,
"valid_targets_mean": 1888.8,
"valid_targets_min": 1484
},
{
"epoch": 0.15224358974358973,
"grad_norm": 0.7747222745750588,
"learning_rate": 8.604118993135013e-06,
"loss": 0.5403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20079509913921356,
"step": 95,
"valid_targets_mean": 2408.2,
"valid_targets_min": 822
},
{
"epoch": 0.16025641025641027,
"grad_norm": 0.8968672399440782,
"learning_rate": 9.061784897025172e-06,
"loss": 0.5561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2350616157054901,
"step": 100,
"valid_targets_mean": 2021.5,
"valid_targets_min": 1011
},
{
"epoch": 0.16826923076923078,
"grad_norm": 0.8578003953330227,
"learning_rate": 9.519450800915333e-06,
"loss": 0.546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32088974118232727,
"step": 105,
"valid_targets_mean": 3198.9,
"valid_targets_min": 1398
},
{
"epoch": 0.1762820512820513,
"grad_norm": 0.9775604038641746,
"learning_rate": 9.977116704805492e-06,
"loss": 0.5408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2899416387081146,
"step": 110,
"valid_targets_mean": 1989.8,
"valid_targets_min": 1233
},
{
"epoch": 0.1842948717948718,
"grad_norm": 0.9484746064620678,
"learning_rate": 1.0434782608695653e-05,
"loss": 0.5271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30604788661003113,
"step": 115,
"valid_targets_mean": 2266.0,
"valid_targets_min": 1375
},
{
"epoch": 0.19230769230769232,
"grad_norm": 0.746255880008432,
"learning_rate": 1.0892448512585814e-05,
"loss": 0.4977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20729142427444458,
"step": 120,
"valid_targets_mean": 2384.1,
"valid_targets_min": 218
},
{
"epoch": 0.20032051282051283,
"grad_norm": 0.7438833264963527,
"learning_rate": 1.1350114416475973e-05,
"loss": 0.5253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22926843166351318,
"step": 125,
"valid_targets_mean": 2618.1,
"valid_targets_min": 1108
},
{
"epoch": 0.20833333333333334,
"grad_norm": 0.8570205673450283,
"learning_rate": 1.1807780320366134e-05,
"loss": 0.5036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24288621544837952,
"step": 130,
"valid_targets_mean": 1906.1,
"valid_targets_min": 944
},
{
"epoch": 0.21634615384615385,
"grad_norm": 0.9417163414734101,
"learning_rate": 1.2265446224256295e-05,
"loss": 0.5166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2769995927810669,
"step": 135,
"valid_targets_mean": 2436.2,
"valid_targets_min": 1533
},
{
"epoch": 0.22435897435897437,
"grad_norm": 0.9860064049785607,
"learning_rate": 1.2723112128146454e-05,
"loss": 0.5362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32120639085769653,
"step": 140,
"valid_targets_mean": 2255.4,
"valid_targets_min": 801
},
{
"epoch": 0.23237179487179488,
"grad_norm": 0.7640125489075233,
"learning_rate": 1.3180778032036615e-05,
"loss": 0.5095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2866376042366028,
"step": 145,
"valid_targets_mean": 3077.4,
"valid_targets_min": 1777
},
{
"epoch": 0.2403846153846154,
"grad_norm": 1.0242816861010413,
"learning_rate": 1.3638443935926776e-05,
"loss": 0.5142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3341456651687622,
"step": 150,
"valid_targets_mean": 2355.0,
"valid_targets_min": 1100
},
{
"epoch": 0.2483974358974359,
"grad_norm": 0.642501178965298,
"learning_rate": 1.4096109839816933e-05,
"loss": 0.4688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22167231142520905,
"step": 155,
"valid_targets_mean": 3613.2,
"valid_targets_min": 1137
},
{
"epoch": 0.2564102564102564,
"grad_norm": 0.9373104786339153,
"learning_rate": 1.4553775743707096e-05,
"loss": 0.5145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24051184952259064,
"step": 160,
"valid_targets_mean": 2034.8,
"valid_targets_min": 1050
},
{
"epoch": 0.2644230769230769,
"grad_norm": 0.9417451887793393,
"learning_rate": 1.5011441647597256e-05,
"loss": 0.5141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25027361512184143,
"step": 165,
"valid_targets_mean": 1953.4,
"valid_targets_min": 738
},
{
"epoch": 0.2724358974358974,
"grad_norm": 0.794295403588529,
"learning_rate": 1.5469107551487414e-05,
"loss": 0.4797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2761167287826538,
"step": 170,
"valid_targets_mean": 2741.1,
"valid_targets_min": 778
},
{
"epoch": 0.28044871794871795,
"grad_norm": 1.041873213895435,
"learning_rate": 1.5926773455377575e-05,
"loss": 0.5241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23646000027656555,
"step": 175,
"valid_targets_mean": 1639.4,
"valid_targets_min": 888
},
{
"epoch": 0.28846153846153844,
"grad_norm": 0.7688575732221453,
"learning_rate": 1.6384439359267736e-05,
"loss": 0.4861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2567122280597687,
"step": 180,
"valid_targets_mean": 2919.0,
"valid_targets_min": 1857
},
{
"epoch": 0.296474358974359,
"grad_norm": 0.7996959350311494,
"learning_rate": 1.6842105263157896e-05,
"loss": 0.5048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23176565766334534,
"step": 185,
"valid_targets_mean": 2770.1,
"valid_targets_min": 1156
},
{
"epoch": 0.30448717948717946,
"grad_norm": 0.9438242229304544,
"learning_rate": 1.7299771167048057e-05,
"loss": 0.4708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22697538137435913,
"step": 190,
"valid_targets_mean": 2171.6,
"valid_targets_min": 498
},
{
"epoch": 0.3125,
"grad_norm": 0.7852768168325834,
"learning_rate": 1.7757437070938218e-05,
"loss": 0.4839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16673338413238525,
"step": 195,
"valid_targets_mean": 2226.2,
"valid_targets_min": 615
},
{
"epoch": 0.32051282051282054,
"grad_norm": 0.8328845202469579,
"learning_rate": 1.8215102974828376e-05,
"loss": 0.4659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20564012229442596,
"step": 200,
"valid_targets_mean": 1902.9,
"valid_targets_min": 1076
},
{
"epoch": 0.328525641025641,
"grad_norm": 0.9107558293954876,
"learning_rate": 1.8672768878718537e-05,
"loss": 0.4652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26834234595298767,
"step": 205,
"valid_targets_mean": 2476.9,
"valid_targets_min": 1814
},
{
"epoch": 0.33653846153846156,
"grad_norm": 1.040043168249784,
"learning_rate": 1.9130434782608697e-05,
"loss": 0.4763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26306286454200745,
"step": 210,
"valid_targets_mean": 2041.9,
"valid_targets_min": 787
},
{
"epoch": 0.34455128205128205,
"grad_norm": 0.9252302157522805,
"learning_rate": 1.9588100686498858e-05,
"loss": 0.4575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2265125960111618,
"step": 215,
"valid_targets_mean": 2354.1,
"valid_targets_min": 1473
},
{
"epoch": 0.3525641025641026,
"grad_norm": 0.887453457764969,
"learning_rate": 2.004576659038902e-05,
"loss": 0.4856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22299125790596008,
"step": 220,
"valid_targets_mean": 2139.2,
"valid_targets_min": 1048
},
{
"epoch": 0.3605769230769231,
"grad_norm": 0.9059800139169017,
"learning_rate": 2.050343249427918e-05,
"loss": 0.4845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20266111195087433,
"step": 225,
"valid_targets_mean": 1946.6,
"valid_targets_min": 880
},
{
"epoch": 0.3685897435897436,
"grad_norm": 0.7607704862440865,
"learning_rate": 2.0961098398169337e-05,
"loss": 0.449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26493844389915466,
"step": 230,
"valid_targets_mean": 3166.2,
"valid_targets_min": 1272
},
{
"epoch": 0.3766025641025641,
"grad_norm": 0.6967071079872735,
"learning_rate": 2.14187643020595e-05,
"loss": 0.4398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15973234176635742,
"step": 235,
"valid_targets_mean": 2076.8,
"valid_targets_min": 1075
},
{
"epoch": 0.38461538461538464,
"grad_norm": 0.9150501001631774,
"learning_rate": 2.187643020594966e-05,
"loss": 0.4443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2183428257703781,
"step": 240,
"valid_targets_mean": 2056.5,
"valid_targets_min": 907
},
{
"epoch": 0.3926282051282051,
"grad_norm": 0.8206357901155347,
"learning_rate": 2.2334096109839817e-05,
"loss": 0.4821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24904729425907135,
"step": 245,
"valid_targets_mean": 2744.9,
"valid_targets_min": 1021
},
{
"epoch": 0.40064102564102566,
"grad_norm": 0.8526548730570999,
"learning_rate": 2.279176201372998e-05,
"loss": 0.4571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23037180304527283,
"step": 250,
"valid_targets_mean": 2357.2,
"valid_targets_min": 1310
},
{
"epoch": 0.40865384615384615,
"grad_norm": 0.7860731322180793,
"learning_rate": 2.3249427917620138e-05,
"loss": 0.462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2327589988708496,
"step": 255,
"valid_targets_mean": 2966.1,
"valid_targets_min": 1291
},
{
"epoch": 0.4166666666666667,
"grad_norm": 0.8509400671372361,
"learning_rate": 2.37070938215103e-05,
"loss": 0.4554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25431883335113525,
"step": 260,
"valid_targets_mean": 2701.1,
"valid_targets_min": 2043
},
{
"epoch": 0.42467948717948717,
"grad_norm": 0.8864607945642146,
"learning_rate": 2.4164759725400463e-05,
"loss": 0.4772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28384217619895935,
"step": 265,
"valid_targets_mean": 2266.1,
"valid_targets_min": 1127
},
{
"epoch": 0.4326923076923077,
"grad_norm": 0.9413869835853772,
"learning_rate": 2.462242562929062e-05,
"loss": 0.4575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19929912686347961,
"step": 270,
"valid_targets_mean": 1698.9,
"valid_targets_min": 428
},
{
"epoch": 0.4407051282051282,
"grad_norm": 0.744625538834592,
"learning_rate": 2.508009153318078e-05,
"loss": 0.4557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25119954347610474,
"step": 275,
"valid_targets_mean": 3835.0,
"valid_targets_min": 1842
},
{
"epoch": 0.44871794871794873,
"grad_norm": 0.7738314413345992,
"learning_rate": 2.5537757437070943e-05,
"loss": 0.4397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1962563693523407,
"step": 280,
"valid_targets_mean": 2279.1,
"valid_targets_min": 1198
},
{
"epoch": 0.4567307692307692,
"grad_norm": 2.4382247977127856,
"learning_rate": 2.59954233409611e-05,
"loss": 0.4564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21939444541931152,
"step": 285,
"valid_targets_mean": 2666.8,
"valid_targets_min": 743
},
{
"epoch": 0.46474358974358976,
"grad_norm": 0.8606788715900447,
"learning_rate": 2.645308924485126e-05,
"loss": 0.4799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41101521253585815,
"step": 290,
"valid_targets_mean": 3653.4,
"valid_targets_min": 733
},
{
"epoch": 0.47275641025641024,
"grad_norm": 0.838922125549497,
"learning_rate": 2.6910755148741422e-05,
"loss": 0.4761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2805629074573517,
"step": 295,
"valid_targets_mean": 2203.1,
"valid_targets_min": 1108
},
{
"epoch": 0.4807692307692308,
"grad_norm": 0.7860048976376676,
"learning_rate": 2.7368421052631583e-05,
"loss": 0.4227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1744893491268158,
"step": 300,
"valid_targets_mean": 2218.8,
"valid_targets_min": 1246
},
{
"epoch": 0.48878205128205127,
"grad_norm": 0.8718270447419633,
"learning_rate": 2.782608695652174e-05,
"loss": 0.4686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2293800711631775,
"step": 305,
"valid_targets_mean": 2349.2,
"valid_targets_min": 1010
},
{
"epoch": 0.4967948717948718,
"grad_norm": 0.809574476298245,
"learning_rate": 2.8283752860411904e-05,
"loss": 0.4505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.286695659160614,
"step": 310,
"valid_targets_mean": 2928.5,
"valid_targets_min": 1451
},
{
"epoch": 0.5048076923076923,
"grad_norm": 0.8560435039918013,
"learning_rate": 2.8741418764302062e-05,
"loss": 0.467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2741186320781708,
"step": 315,
"valid_targets_mean": 2153.1,
"valid_targets_min": 1418
},
{
"epoch": 0.5128205128205128,
"grad_norm": 0.8443849165623637,
"learning_rate": 2.9199084668192223e-05,
"loss": 0.513,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18281307816505432,
"step": 320,
"valid_targets_mean": 1734.6,
"valid_targets_min": 416
},
{
"epoch": 0.5208333333333334,
"grad_norm": 0.8696802631590136,
"learning_rate": 2.9656750572082384e-05,
"loss": 0.4516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18471366167068481,
"step": 325,
"valid_targets_mean": 1614.6,
"valid_targets_min": 990
},
{
"epoch": 0.5288461538461539,
"grad_norm": 0.8651062420057943,
"learning_rate": 3.0114416475972544e-05,
"loss": 0.468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2343977391719818,
"step": 330,
"valid_targets_mean": 2271.1,
"valid_targets_min": 1220
},
{
"epoch": 0.5368589743589743,
"grad_norm": 0.8409126784718626,
"learning_rate": 3.05720823798627e-05,
"loss": 0.4375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2919655740261078,
"step": 335,
"valid_targets_mean": 3131.4,
"valid_targets_min": 1089
},
{
"epoch": 0.5448717948717948,
"grad_norm": 0.8010512826037681,
"learning_rate": 3.102974828375286e-05,
"loss": 0.4293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23436668515205383,
"step": 340,
"valid_targets_mean": 2680.4,
"valid_targets_min": 1639
},
{
"epoch": 0.5528846153846154,
"grad_norm": 0.7821405770402137,
"learning_rate": 3.1487414187643024e-05,
"loss": 0.4769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20524126291275024,
"step": 345,
"valid_targets_mean": 2733.0,
"valid_targets_min": 1029
},
{
"epoch": 0.5608974358974359,
"grad_norm": 0.7147060886685118,
"learning_rate": 3.1945080091533184e-05,
"loss": 0.4614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2542196810245514,
"step": 350,
"valid_targets_mean": 3058.1,
"valid_targets_min": 1283
},
{
"epoch": 0.5689102564102564,
"grad_norm": 0.7484160202180531,
"learning_rate": 3.240274599542334e-05,
"loss": 0.4498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13721662759780884,
"step": 355,
"valid_targets_mean": 1732.4,
"valid_targets_min": 327
},
{
"epoch": 0.5769230769230769,
"grad_norm": 0.9659130418383086,
"learning_rate": 3.2860411899313506e-05,
"loss": 0.4619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26037678122520447,
"step": 360,
"valid_targets_mean": 1845.2,
"valid_targets_min": 1478
},
{
"epoch": 0.5849358974358975,
"grad_norm": 1.148809792440573,
"learning_rate": 3.331807780320366e-05,
"loss": 0.4811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24160519242286682,
"step": 365,
"valid_targets_mean": 2128.8,
"valid_targets_min": 1155
},
{
"epoch": 0.592948717948718,
"grad_norm": 0.7019051186772777,
"learning_rate": 3.377574370709382e-05,
"loss": 0.4261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25113967061042786,
"step": 370,
"valid_targets_mean": 3612.8,
"valid_targets_min": 1206
},
{
"epoch": 0.6009615384615384,
"grad_norm": 0.9679216066114925,
"learning_rate": 3.423340961098399e-05,
"loss": 0.4148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2699517607688904,
"step": 375,
"valid_targets_mean": 3150.4,
"valid_targets_min": 1058
},
{
"epoch": 0.6089743589743589,
"grad_norm": 0.7848117406315669,
"learning_rate": 3.469107551487414e-05,
"loss": 0.4402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20744790136814117,
"step": 380,
"valid_targets_mean": 2178.5,
"valid_targets_min": 909
},
{
"epoch": 0.6169871794871795,
"grad_norm": 0.7080944591453242,
"learning_rate": 3.5148741418764304e-05,
"loss": 0.417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22987905144691467,
"step": 385,
"valid_targets_mean": 3240.8,
"valid_targets_min": 966
},
{
"epoch": 0.625,
"grad_norm": 0.8894368633337273,
"learning_rate": 3.5606407322654464e-05,
"loss": 0.4532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20276543498039246,
"step": 390,
"valid_targets_mean": 1739.2,
"valid_targets_min": 656
},
{
"epoch": 0.6330128205128205,
"grad_norm": 0.8437346929099193,
"learning_rate": 3.6064073226544625e-05,
"loss": 0.4301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2156563401222229,
"step": 395,
"valid_targets_mean": 2161.9,
"valid_targets_min": 1131
},
{
"epoch": 0.6410256410256411,
"grad_norm": 0.845119808027601,
"learning_rate": 3.6521739130434786e-05,
"loss": 0.4362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23626503348350525,
"step": 400,
"valid_targets_mean": 2326.6,
"valid_targets_min": 1025
},
{
"epoch": 0.6490384615384616,
"grad_norm": 0.8230495030251933,
"learning_rate": 3.697940503432495e-05,
"loss": 0.4493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21271054446697235,
"step": 405,
"valid_targets_mean": 2119.8,
"valid_targets_min": 1356
},
{
"epoch": 0.657051282051282,
"grad_norm": 0.7566270241967507,
"learning_rate": 3.743707093821511e-05,
"loss": 0.4543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2143326699733734,
"step": 410,
"valid_targets_mean": 2758.8,
"valid_targets_min": 1504
},
{
"epoch": 0.6650641025641025,
"grad_norm": 0.8891093819684329,
"learning_rate": 3.789473684210526e-05,
"loss": 0.4541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21579736471176147,
"step": 415,
"valid_targets_mean": 2091.5,
"valid_targets_min": 1118
},
{
"epoch": 0.6730769230769231,
"grad_norm": 0.7308770194117645,
"learning_rate": 3.835240274599543e-05,
"loss": 0.422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18271571397781372,
"step": 420,
"valid_targets_mean": 2216.1,
"valid_targets_min": 1241
},
{
"epoch": 0.6810897435897436,
"grad_norm": 0.6733014520665108,
"learning_rate": 3.8810068649885584e-05,
"loss": 0.4426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1795242726802826,
"step": 425,
"valid_targets_mean": 2813.6,
"valid_targets_min": 1195
},
{
"epoch": 0.6891025641025641,
"grad_norm": 0.9209305153321826,
"learning_rate": 3.9267734553775745e-05,
"loss": 0.4429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22252072393894196,
"step": 430,
"valid_targets_mean": 1781.4,
"valid_targets_min": 1204
},
{
"epoch": 0.6971153846153846,
"grad_norm": 0.7008996722806253,
"learning_rate": 3.9725400457665905e-05,
"loss": 0.4391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22679556906223297,
"step": 435,
"valid_targets_mean": 3189.6,
"valid_targets_min": 1315
},
{
"epoch": 0.7051282051282052,
"grad_norm": 0.7933102403594852,
"learning_rate": 3.999997445219712e-05,
"loss": 0.4132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21799099445343018,
"step": 440,
"valid_targets_mean": 2205.4,
"valid_targets_min": 1392
},
{
"epoch": 0.7131410256410257,
"grad_norm": 0.71765578245187,
"learning_rate": 3.999968704016428e-05,
"loss": 0.4366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14643388986587524,
"step": 445,
"valid_targets_mean": 1829.5,
"valid_targets_min": 1227
},
{
"epoch": 0.7211538461538461,
"grad_norm": 0.7680275744504215,
"learning_rate": 3.9999080285949514e-05,
"loss": 0.4545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28415074944496155,
"step": 450,
"valid_targets_mean": 3113.9,
"valid_targets_min": 882
},
{
"epoch": 0.7291666666666666,
"grad_norm": 0.7819836110236925,
"learning_rate": 3.999815419924108e-05,
"loss": 0.4581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2930494546890259,
"step": 455,
"valid_targets_mean": 4082.2,
"valid_targets_min": 1368
},
{
"epoch": 0.7371794871794872,
"grad_norm": 0.7156988765066394,
"learning_rate": 3.999690879482614e-05,
"loss": 0.4458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22275188565254211,
"step": 460,
"valid_targets_mean": 2527.4,
"valid_targets_min": 1210
},
{
"epoch": 0.7451923076923077,
"grad_norm": 0.7545107849171728,
"learning_rate": 3.9995344092590506e-05,
"loss": 0.4569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17759068310260773,
"step": 465,
"valid_targets_mean": 2044.2,
"valid_targets_min": 865
},
{
"epoch": 0.7532051282051282,
"grad_norm": 0.85883814352422,
"learning_rate": 3.999346011751835e-05,
"loss": 0.4462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21038851141929626,
"step": 470,
"valid_targets_mean": 1835.1,
"valid_targets_min": 1147
},
{
"epoch": 0.7612179487179487,
"grad_norm": 0.8410031574243461,
"learning_rate": 3.999125689969176e-05,
"loss": 0.4415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17614567279815674,
"step": 475,
"valid_targets_mean": 1721.4,
"valid_targets_min": 1041
},
{
"epoch": 0.7692307692307693,
"grad_norm": 0.8789804427446964,
"learning_rate": 3.9988734474290324e-05,
"loss": 0.4357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21839639544487,
"step": 480,
"valid_targets_mean": 2227.9,
"valid_targets_min": 948
},
{
"epoch": 0.7772435897435898,
"grad_norm": 0.7384347806573924,
"learning_rate": 3.9985892881590513e-05,
"loss": 0.4596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15238994359970093,
"step": 485,
"valid_targets_mean": 2098.8,
"valid_targets_min": 991
},
{
"epoch": 0.7852564102564102,
"grad_norm": 0.8037359267266503,
"learning_rate": 3.9982732166965054e-05,
"loss": 0.4343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23122987151145935,
"step": 490,
"valid_targets_mean": 2579.4,
"valid_targets_min": 892
},
{
"epoch": 0.7932692307692307,
"grad_norm": 0.7584123950011441,
"learning_rate": 3.997925238088221e-05,
"loss": 0.4363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2352125495672226,
"step": 495,
"valid_targets_mean": 3186.1,
"valid_targets_min": 948
},
{
"epoch": 0.8012820512820513,
"grad_norm": 0.8416323300874318,
"learning_rate": 3.9975453578904975e-05,
"loss": 0.4351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2356817126274109,
"step": 500,
"valid_targets_mean": 1878.6,
"valid_targets_min": 472
},
{
"epoch": 0.8092948717948718,
"grad_norm": 0.7515584047530944,
"learning_rate": 3.997133582169018e-05,
"loss": 0.4142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19595301151275635,
"step": 505,
"valid_targets_mean": 2488.8,
"valid_targets_min": 1123
},
{
"epoch": 0.8173076923076923,
"grad_norm": 0.6570619580965038,
"learning_rate": 3.996689917498754e-05,
"loss": 0.4321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1813373565673828,
"step": 510,
"valid_targets_mean": 2813.6,
"valid_targets_min": 1393
},
{
"epoch": 0.8253205128205128,
"grad_norm": 0.7003686384566153,
"learning_rate": 3.9962143709638585e-05,
"loss": 0.4255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18100909888744354,
"step": 515,
"valid_targets_mean": 2194.2,
"valid_targets_min": 850
},
{
"epoch": 0.8333333333333334,
"grad_norm": 0.8533422308466821,
"learning_rate": 3.995706950157554e-05,
"loss": 0.4638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17890852689743042,
"step": 520,
"valid_targets_mean": 1537.5,
"valid_targets_min": 693
},
{
"epoch": 0.8413461538461539,
"grad_norm": 0.8025876920924326,
"learning_rate": 3.995167663182008e-05,
"loss": 0.415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2482287734746933,
"step": 525,
"valid_targets_mean": 2890.6,
"valid_targets_min": 500
},
{
"epoch": 0.8493589743589743,
"grad_norm": 0.817318210827593,
"learning_rate": 3.994596518648214e-05,
"loss": 0.437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18256166577339172,
"step": 530,
"valid_targets_mean": 2419.2,
"valid_targets_min": 1024
},
{
"epoch": 0.8573717948717948,
"grad_norm": 0.6865410812285857,
"learning_rate": 3.993993525675838e-05,
"loss": 0.4527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18624117970466614,
"step": 535,
"valid_targets_mean": 2568.6,
"valid_targets_min": 1364
},
{
"epoch": 0.8653846153846154,
"grad_norm": 0.8488382487153298,
"learning_rate": 3.993358693893086e-05,
"loss": 0.4254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2426677644252777,
"step": 540,
"valid_targets_mean": 1998.9,
"valid_targets_min": 1078
},
{
"epoch": 0.8733974358974359,
"grad_norm": 0.8652381079639015,
"learning_rate": 3.9926920334365457e-05,
"loss": 0.4183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.238864004611969,
"step": 545,
"valid_targets_mean": 2650.5,
"valid_targets_min": 359
},
{
"epoch": 0.8814102564102564,
"grad_norm": 0.7839796519999491,
"learning_rate": 3.991993554951023e-05,
"loss": 0.4423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22148996591567993,
"step": 550,
"valid_targets_mean": 2023.8,
"valid_targets_min": 1128
},
{
"epoch": 0.8894230769230769,
"grad_norm": 0.7542817185661378,
"learning_rate": 3.991263269589376e-05,
"loss": 0.4718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18125128746032715,
"step": 555,
"valid_targets_mean": 2083.8,
"valid_targets_min": 1150
},
{
"epoch": 0.8974358974358975,
"grad_norm": 0.741947108861436,
"learning_rate": 3.990501189012332e-05,
"loss": 0.4307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22753050923347473,
"step": 560,
"valid_targets_mean": 3070.9,
"valid_targets_min": 1628
},
{
"epoch": 0.905448717948718,
"grad_norm": 0.8420106848026391,
"learning_rate": 3.989707325388305e-05,
"loss": 0.4149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21152499318122864,
"step": 565,
"valid_targets_mean": 2034.4,
"valid_targets_min": 1006
},
{
"epoch": 0.9134615384615384,
"grad_norm": 0.725218798545047,
"learning_rate": 3.9888816913932016e-05,
"loss": 0.427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2168159782886505,
"step": 570,
"valid_targets_mean": 2498.5,
"valid_targets_min": 314
},
{
"epoch": 0.9214743589743589,
"grad_norm": 0.7551268498727862,
"learning_rate": 3.988024300210215e-05,
"loss": 0.4173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23235228657722473,
"step": 575,
"valid_targets_mean": 3109.9,
"valid_targets_min": 1392
},
{
"epoch": 0.9294871794871795,
"grad_norm": 0.8917469963673748,
"learning_rate": 3.987135165529618e-05,
"loss": 0.4279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2358158975839615,
"step": 580,
"valid_targets_mean": 2129.4,
"valid_targets_min": 738
},
{
"epoch": 0.9375,
"grad_norm": 0.7621556301152937,
"learning_rate": 3.9862143015485446e-05,
"loss": 0.4266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2662770450115204,
"step": 585,
"valid_targets_mean": 3289.5,
"valid_targets_min": 1743
},
{
"epoch": 0.9455128205128205,
"grad_norm": 0.700543068896193,
"learning_rate": 3.985261722970759e-05,
"loss": 0.4128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16867512464523315,
"step": 590,
"valid_targets_mean": 2218.5,
"valid_targets_min": 904
},
{
"epoch": 0.9535256410256411,
"grad_norm": 0.815970901264772,
"learning_rate": 3.984277445006426e-05,
"loss": 0.4353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22275325655937195,
"step": 595,
"valid_targets_mean": 1926.8,
"valid_targets_min": 978
},
{
"epoch": 0.9615384615384616,
"grad_norm": 0.8361593918244778,
"learning_rate": 3.9832614833718654e-05,
"loss": 0.4177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18687403202056885,
"step": 600,
"valid_targets_mean": 2228.1,
"valid_targets_min": 1269
},
{
"epoch": 0.969551282051282,
"grad_norm": 0.7613367304322403,
"learning_rate": 3.9822138542893005e-05,
"loss": 0.3947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23270726203918457,
"step": 605,
"valid_targets_mean": 2532.5,
"valid_targets_min": 677
},
{
"epoch": 0.9775641025641025,
"grad_norm": 0.8051775177601395,
"learning_rate": 3.9811345744866014e-05,
"loss": 0.4378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21936899423599243,
"step": 610,
"valid_targets_mean": 2139.5,
"valid_targets_min": 1092
},
{
"epoch": 0.9855769230769231,
"grad_norm": 0.9820300582408891,
"learning_rate": 3.980023661197016e-05,
"loss": 0.4396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2305496335029602,
"step": 615,
"valid_targets_mean": 1676.1,
"valid_targets_min": 1009
},
{
"epoch": 0.9935897435897436,
"grad_norm": 0.7251745500664333,
"learning_rate": 3.978881132158896e-05,
"loss": 0.4072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22141022980213165,
"step": 620,
"valid_targets_mean": 2821.9,
"valid_targets_min": 857
},
{
"epoch": 1.001602564102564,
"grad_norm": 0.7465984644079928,
"learning_rate": 3.9777070056154124e-05,
"loss": 0.4273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20381376147270203,
"step": 625,
"valid_targets_mean": 2395.4,
"valid_targets_min": 993
},
{
"epoch": 1.0096153846153846,
"grad_norm": 0.6090997256218228,
"learning_rate": 3.976501300314264e-05,
"loss": 0.3996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19216665625572205,
"step": 630,
"valid_targets_mean": 3795.2,
"valid_targets_min": 1148
},
{
"epoch": 1.017628205128205,
"grad_norm": 0.9887537640031723,
"learning_rate": 3.9752640355073825e-05,
"loss": 0.3934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19999739527702332,
"step": 635,
"valid_targets_mean": 2683.5,
"valid_targets_min": 1874
},
{
"epoch": 1.0256410256410255,
"grad_norm": 0.7712631721878844,
"learning_rate": 3.9739952309506175e-05,
"loss": 0.4294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1707819700241089,
"step": 640,
"valid_targets_mean": 2182.8,
"valid_targets_min": 612
},
{
"epoch": 1.0336538461538463,
"grad_norm": 0.7915294225622618,
"learning_rate": 3.972694906903427e-05,
"loss": 0.4052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1669417917728424,
"step": 645,
"valid_targets_mean": 2294.2,
"valid_targets_min": 1128
},
{
"epoch": 1.0416666666666667,
"grad_norm": 0.7030915254920559,
"learning_rate": 3.971363084128552e-05,
"loss": 0.3957,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2009146809577942,
"step": 650,
"valid_targets_mean": 3490.4,
"valid_targets_min": 260
},
{
"epoch": 1.0496794871794872,
"grad_norm": 0.8227935946585014,
"learning_rate": 3.969999783891685e-05,
"loss": 0.4199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2600316107273102,
"step": 655,
"valid_targets_mean": 2552.5,
"valid_targets_min": 1095
},
{
"epoch": 1.0576923076923077,
"grad_norm": 0.819150924957127,
"learning_rate": 3.96860502796113e-05,
"loss": 0.4009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22930988669395447,
"step": 660,
"valid_targets_mean": 2559.0,
"valid_targets_min": 904
},
{
"epoch": 1.0657051282051282,
"grad_norm": 0.8189973867037402,
"learning_rate": 3.967178838607456e-05,
"loss": 0.4129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15020707249641418,
"step": 665,
"valid_targets_mean": 1769.4,
"valid_targets_min": 1131
},
{
"epoch": 1.0737179487179487,
"grad_norm": 0.6455047256028397,
"learning_rate": 3.965721238603139e-05,
"loss": 0.3861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17924004793167114,
"step": 670,
"valid_targets_mean": 2953.0,
"valid_targets_min": 791
},
{
"epoch": 1.0817307692307692,
"grad_norm": 0.9974279650169392,
"learning_rate": 3.964232251222203e-05,
"loss": 0.4186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20407584309577942,
"step": 675,
"valid_targets_mean": 2472.5,
"valid_targets_min": 1522
},
{
"epoch": 1.0897435897435896,
"grad_norm": 0.6570532885048896,
"learning_rate": 3.962711900239844e-05,
"loss": 0.3995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2124699354171753,
"step": 680,
"valid_targets_mean": 3709.4,
"valid_targets_min": 1239
},
{
"epoch": 1.0977564102564104,
"grad_norm": 0.7966806502459381,
"learning_rate": 3.961160209932051e-05,
"loss": 0.3707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16343654692173004,
"step": 685,
"valid_targets_mean": 1613.4,
"valid_targets_min": 435
},
{
"epoch": 1.1057692307692308,
"grad_norm": 0.8141799386192287,
"learning_rate": 3.95957720507522e-05,
"loss": 0.3784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21225258708000183,
"step": 690,
"valid_targets_mean": 3180.0,
"valid_targets_min": 475
},
{
"epoch": 1.1137820512820513,
"grad_norm": 0.7663834307163272,
"learning_rate": 3.957962910945759e-05,
"loss": 0.3945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1471199244260788,
"step": 695,
"valid_targets_mean": 2677.8,
"valid_targets_min": 902
},
{
"epoch": 1.1217948717948718,
"grad_norm": 0.735440023679953,
"learning_rate": 3.9563173533196805e-05,
"loss": 0.4039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1359565705060959,
"step": 700,
"valid_targets_mean": 1893.1,
"valid_targets_min": 822
},
{
"epoch": 1.1298076923076923,
"grad_norm": 0.7634365465235168,
"learning_rate": 3.954640558472195e-05,
"loss": 0.4141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1666882336139679,
"step": 705,
"valid_targets_mean": 2108.0,
"valid_targets_min": 1599
},
{
"epoch": 1.1378205128205128,
"grad_norm": 0.7962658670444661,
"learning_rate": 3.952932553177287e-05,
"loss": 0.377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22097454965114594,
"step": 710,
"valid_targets_mean": 2968.0,
"valid_targets_min": 1200
},
{
"epoch": 1.1458333333333333,
"grad_norm": 0.9117502451013554,
"learning_rate": 3.95119336470729e-05,
"loss": 0.4146,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22754886746406555,
"step": 715,
"valid_targets_mean": 1757.2,
"valid_targets_min": 1269
},
{
"epoch": 1.1538461538461537,
"grad_norm": 0.8083486713374696,
"learning_rate": 3.949423020832451e-05,
"loss": 0.414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17627468705177307,
"step": 720,
"valid_targets_mean": 1481.2,
"valid_targets_min": 1051
},
{
"epoch": 1.1618589743589745,
"grad_norm": 0.7333098847473878,
"learning_rate": 3.947621549820485e-05,
"loss": 0.3805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18278644979000092,
"step": 725,
"valid_targets_mean": 2522.1,
"valid_targets_min": 1157
},
{
"epoch": 1.169871794871795,
"grad_norm": 0.7401713642953307,
"learning_rate": 3.945788980436129e-05,
"loss": 0.389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20542725920677185,
"step": 730,
"valid_targets_mean": 2958.4,
"valid_targets_min": 1348
},
{
"epoch": 1.1778846153846154,
"grad_norm": 0.8633291622977045,
"learning_rate": 3.943925341940673e-05,
"loss": 0.4114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16674403846263885,
"step": 735,
"valid_targets_mean": 1984.1,
"valid_targets_min": 315
},
{
"epoch": 1.185897435897436,
"grad_norm": 0.6862290281154118,
"learning_rate": 3.942030664091503e-05,
"loss": 0.3787,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1515948474407196,
"step": 740,
"valid_targets_mean": 2081.1,
"valid_targets_min": 1404
},
{
"epoch": 1.1939102564102564,
"grad_norm": 0.7517010622113833,
"learning_rate": 3.9401049771416214e-05,
"loss": 0.397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20460815727710724,
"step": 745,
"valid_targets_mean": 2555.0,
"valid_targets_min": 828
},
{
"epoch": 1.2019230769230769,
"grad_norm": 0.7701867921629503,
"learning_rate": 3.938148311839162e-05,
"loss": 0.4257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24021926522254944,
"step": 750,
"valid_targets_mean": 2868.4,
"valid_targets_min": 812
},
{
"epoch": 1.2099358974358974,
"grad_norm": 0.8053323182482374,
"learning_rate": 3.9361606994269014e-05,
"loss": 0.407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1931108832359314,
"step": 755,
"valid_targets_mean": 2227.1,
"valid_targets_min": 1148
},
{
"epoch": 1.217948717948718,
"grad_norm": 0.6874024005644546,
"learning_rate": 3.934142171641763e-05,
"loss": 0.3773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21617969870567322,
"step": 760,
"valid_targets_mean": 3691.2,
"valid_targets_min": 1327
},
{
"epoch": 1.2259615384615385,
"grad_norm": 0.803368730894559,
"learning_rate": 3.9320927607143003e-05,
"loss": 0.3977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23498323559761047,
"step": 765,
"valid_targets_mean": 2918.5,
"valid_targets_min": 1543
},
{
"epoch": 1.233974358974359,
"grad_norm": 0.6761209321682878,
"learning_rate": 3.9300124993681976e-05,
"loss": 0.4127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20131105184555054,
"step": 770,
"valid_targets_mean": 3544.6,
"valid_targets_min": 1438
},
{
"epoch": 1.2419871794871795,
"grad_norm": 0.8140029717837052,
"learning_rate": 3.9279014208197317e-05,
"loss": 0.3932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19266082346439362,
"step": 775,
"valid_targets_mean": 2522.5,
"valid_targets_min": 1147
},
{
"epoch": 1.25,
"grad_norm": 0.7819556286960125,
"learning_rate": 3.925759558777252e-05,
"loss": 0.3876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2085326910018921,
"step": 780,
"valid_targets_mean": 2123.0,
"valid_targets_min": 984
},
{
"epoch": 1.2580128205128205,
"grad_norm": 0.7378325645590994,
"learning_rate": 3.923586947440639e-05,
"loss": 0.4051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24526703357696533,
"step": 785,
"valid_targets_mean": 3333.6,
"valid_targets_min": 1216
},
{
"epoch": 1.266025641025641,
"grad_norm": 0.7617824513828749,
"learning_rate": 3.921383621500758e-05,
"loss": 0.3929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25414544343948364,
"step": 790,
"valid_targets_mean": 3125.8,
"valid_targets_min": 1466
},
{
"epoch": 1.2740384615384617,
"grad_norm": 0.827506556223389,
"learning_rate": 3.919149616138906e-05,
"loss": 0.4056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1815040558576584,
"step": 795,
"valid_targets_mean": 2285.4,
"valid_targets_min": 689
},
{
"epoch": 1.282051282051282,
"grad_norm": 0.8523188451016964,
"learning_rate": 3.916884967026246e-05,
"loss": 0.3955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19575875997543335,
"step": 800,
"valid_targets_mean": 2627.0,
"valid_targets_min": 1235
},
{
"epoch": 1.2900641025641026,
"grad_norm": 0.8602226407777478,
"learning_rate": 3.914589710323245e-05,
"loss": 0.3981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22027531266212463,
"step": 805,
"valid_targets_mean": 2483.4,
"valid_targets_min": 1320
},
{
"epoch": 1.2980769230769231,
"grad_norm": 0.7192846478140936,
"learning_rate": 3.912263882679091e-05,
"loss": 0.3709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12481571733951569,
"step": 810,
"valid_targets_mean": 1910.9,
"valid_targets_min": 737
},
{
"epoch": 1.3060897435897436,
"grad_norm": 0.7463244398063339,
"learning_rate": 3.9099075212311076e-05,
"loss": 0.3779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19425347447395325,
"step": 815,
"valid_targets_mean": 2349.6,
"valid_targets_min": 925
},
{
"epoch": 1.314102564102564,
"grad_norm": 0.7798070432766532,
"learning_rate": 3.9075206636041646e-05,
"loss": 0.3889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16809885203838348,
"step": 820,
"valid_targets_mean": 2378.0,
"valid_targets_min": 1186
},
{
"epoch": 1.3221153846153846,
"grad_norm": 0.7353506089603916,
"learning_rate": 3.905103347910075e-05,
"loss": 0.3846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14414098858833313,
"step": 825,
"valid_targets_mean": 1964.6,
"valid_targets_min": 984
},
{
"epoch": 1.330128205128205,
"grad_norm": 0.7469626524872656,
"learning_rate": 3.902655612746985e-05,
"loss": 0.3986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20464842021465302,
"step": 830,
"valid_targets_mean": 2803.6,
"valid_targets_min": 1178
},
{
"epoch": 1.3381410256410255,
"grad_norm": 0.8086127489461551,
"learning_rate": 3.900177497198761e-05,
"loss": 0.4059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2263430953025818,
"step": 835,
"valid_targets_mean": 2755.0,
"valid_targets_min": 1021
},
{
"epoch": 1.3461538461538463,
"grad_norm": 0.6460008366891428,
"learning_rate": 3.8976690408343635e-05,
"loss": 0.3958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16660919785499573,
"step": 840,
"valid_targets_mean": 3076.5,
"valid_targets_min": 1058
},
{
"epoch": 1.3541666666666667,
"grad_norm": 0.8460991987261154,
"learning_rate": 3.8951302837072165e-05,
"loss": 0.408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2518458068370819,
"step": 845,
"valid_targets_mean": 2448.0,
"valid_targets_min": 1097
},
{
"epoch": 1.3621794871794872,
"grad_norm": 0.821233295005827,
"learning_rate": 3.892561266354566e-05,
"loss": 0.4159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18111786246299744,
"step": 850,
"valid_targets_mean": 2694.5,
"valid_targets_min": 1012
},
{
"epoch": 1.3701923076923077,
"grad_norm": 0.7296441292083241,
"learning_rate": 3.889962029796833e-05,
"loss": 0.3896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17838101089000702,
"step": 855,
"valid_targets_mean": 2373.2,
"valid_targets_min": 1162
},
{
"epoch": 1.3782051282051282,
"grad_norm": 0.7026610730862972,
"learning_rate": 3.887332615536962e-05,
"loss": 0.4075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21002928912639618,
"step": 860,
"valid_targets_mean": 3131.4,
"valid_targets_min": 1406
},
{
"epoch": 1.3862179487179487,
"grad_norm": 1.0977711950424043,
"learning_rate": 3.8846730655597535e-05,
"loss": 0.4108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2301381528377533,
"step": 865,
"valid_targets_mean": 2209.1,
"valid_targets_min": 958
},
{
"epoch": 1.3942307692307692,
"grad_norm": 1.0677689487035835,
"learning_rate": 3.881983422331198e-05,
"loss": 0.405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22443720698356628,
"step": 870,
"valid_targets_mean": 1953.8,
"valid_targets_min": 1342
},
{
"epoch": 1.4022435897435899,
"grad_norm": 0.7984589627995452,
"learning_rate": 3.879263728797792e-05,
"loss": 0.3901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19039490818977356,
"step": 875,
"valid_targets_mean": 2250.5,
"valid_targets_min": 984
},
{
"epoch": 1.4102564102564101,
"grad_norm": 0.7610997708344249,
"learning_rate": 3.876514028385861e-05,
"loss": 0.3793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18667712807655334,
"step": 880,
"valid_targets_mean": 2457.6,
"valid_targets_min": 625
},
{
"epoch": 1.4182692307692308,
"grad_norm": 0.7660744650444555,
"learning_rate": 3.873734365000857e-05,
"loss": 0.3793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19710713624954224,
"step": 885,
"valid_targets_mean": 2400.2,
"valid_targets_min": 1439
},
{
"epoch": 1.4262820512820513,
"grad_norm": 0.9027867349808698,
"learning_rate": 3.870924783026663e-05,
"loss": 0.4044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25323033332824707,
"step": 890,
"valid_targets_mean": 2769.5,
"valid_targets_min": 1285
},
{
"epoch": 1.4342948717948718,
"grad_norm": 0.6655726580543196,
"learning_rate": 3.8680853273248826e-05,
"loss": 0.4161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24514815211296082,
"step": 895,
"valid_targets_mean": 3499.0,
"valid_targets_min": 994
},
{
"epoch": 1.4423076923076923,
"grad_norm": 0.7581770160173827,
"learning_rate": 3.865216043234126e-05,
"loss": 0.3768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21933013200759888,
"step": 900,
"valid_targets_mean": 3721.2,
"valid_targets_min": 998
},
{
"epoch": 1.4503205128205128,
"grad_norm": 0.7738042590711245,
"learning_rate": 3.862316976569281e-05,
"loss": 0.4284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30224043130874634,
"step": 905,
"valid_targets_mean": 3316.0,
"valid_targets_min": 1100
},
{
"epoch": 1.4583333333333333,
"grad_norm": 0.6155745043657496,
"learning_rate": 3.859388173620785e-05,
"loss": 0.3978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2257455587387085,
"step": 910,
"valid_targets_mean": 4074.5,
"valid_targets_min": 1359
},
{
"epoch": 1.4663461538461537,
"grad_norm": 0.6817808713104984,
"learning_rate": 3.8564296811538874e-05,
"loss": 0.4026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2565431594848633,
"step": 915,
"valid_targets_mean": 3401.1,
"valid_targets_min": 1271
},
{
"epoch": 1.4743589743589745,
"grad_norm": 0.7173177986914446,
"learning_rate": 3.853441546407898e-05,
"loss": 0.3924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24881017208099365,
"step": 920,
"valid_targets_mean": 3510.5,
"valid_targets_min": 994
},
{
"epoch": 1.482371794871795,
"grad_norm": 0.7945715980200994,
"learning_rate": 3.850423817095438e-05,
"loss": 0.3963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15524527430534363,
"step": 925,
"valid_targets_mean": 1850.6,
"valid_targets_min": 1284
},
{
"epoch": 1.4903846153846154,
"grad_norm": 0.7598949103076834,
"learning_rate": 3.847376541401674e-05,
"loss": 0.3804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16828379034996033,
"step": 930,
"valid_targets_mean": 1823.9,
"valid_targets_min": 1016
},
{
"epoch": 1.498397435897436,
"grad_norm": 0.7977097435862016,
"learning_rate": 3.844299767983551e-05,
"loss": 0.3995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20539097487926483,
"step": 935,
"valid_targets_mean": 2585.9,
"valid_targets_min": 447
},
{
"epoch": 1.5064102564102564,
"grad_norm": 0.7796806378947536,
"learning_rate": 3.841193545969015e-05,
"loss": 0.372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21690428256988525,
"step": 940,
"valid_targets_mean": 3070.1,
"valid_targets_min": 1298
},
{
"epoch": 1.5144230769230769,
"grad_norm": 0.795763049986929,
"learning_rate": 3.8380579249562265e-05,
"loss": 0.3871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21313318610191345,
"step": 945,
"valid_targets_mean": 2357.9,
"valid_targets_min": 1087
},
{
"epoch": 1.5224358974358974,
"grad_norm": 0.7856865708709738,
"learning_rate": 3.8348929550127734e-05,
"loss": 0.3934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21079853177070618,
"step": 950,
"valid_targets_mean": 2205.2,
"valid_targets_min": 1438
},
{
"epoch": 1.530448717948718,
"grad_norm": 0.7102354357674125,
"learning_rate": 3.831698686674866e-05,
"loss": 0.3864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1579192876815796,
"step": 955,
"valid_targets_mean": 2220.9,
"valid_targets_min": 1185
},
{
"epoch": 1.5384615384615383,
"grad_norm": 0.7397064308922544,
"learning_rate": 3.828475170946534e-05,
"loss": 0.4017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21521735191345215,
"step": 960,
"valid_targets_mean": 2871.2,
"valid_targets_min": 1032
},
{
"epoch": 1.546474358974359,
"grad_norm": 0.9957473984975943,
"learning_rate": 3.8252224592988087e-05,
"loss": 0.4178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19509410858154297,
"step": 965,
"valid_targets_mean": 1405.8,
"valid_targets_min": 972
},
{
"epoch": 1.5544871794871795,
"grad_norm": 0.804754542638096,
"learning_rate": 3.821940603668906e-05,
"loss": 0.3824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16173695027828217,
"step": 970,
"valid_targets_mean": 1865.6,
"valid_targets_min": 1015
},
{
"epoch": 1.5625,
"grad_norm": 0.7298059783039583,
"learning_rate": 3.8186296564593924e-05,
"loss": 0.3954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22694705426692963,
"step": 975,
"valid_targets_mean": 3259.4,
"valid_targets_min": 1155
},
{
"epoch": 1.5705128205128205,
"grad_norm": 0.7890833541271126,
"learning_rate": 3.815289670537351e-05,
"loss": 0.372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19712330400943756,
"step": 980,
"valid_targets_mean": 2654.9,
"valid_targets_min": 1281
},
{
"epoch": 1.578525641025641,
"grad_norm": 0.7721134490148664,
"learning_rate": 3.811920699233535e-05,
"loss": 0.3662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16013117134571075,
"step": 985,
"valid_targets_mean": 2404.1,
"valid_targets_min": 1045
},
{
"epoch": 1.5865384615384617,
"grad_norm": 0.7771772844437951,
"learning_rate": 3.8085227963415186e-05,
"loss": 0.3862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18366935849189758,
"step": 990,
"valid_targets_mean": 2047.1,
"valid_targets_min": 1234
},
{
"epoch": 1.594551282051282,
"grad_norm": 0.7263474584644822,
"learning_rate": 3.805096016116838e-05,
"loss": 0.4002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23366929590702057,
"step": 995,
"valid_targets_mean": 3505.8,
"valid_targets_min": 1170
},
{
"epoch": 1.6025641025641026,
"grad_norm": 0.7734401430489013,
"learning_rate": 3.801640413276121e-05,
"loss": 0.3876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18875086307525635,
"step": 1000,
"valid_targets_mean": 2440.6,
"valid_targets_min": 798
},
{
"epoch": 1.6105769230769231,
"grad_norm": 1.0978052948369825,
"learning_rate": 3.7981560429962204e-05,
"loss": 0.3848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19252219796180725,
"step": 1005,
"valid_targets_mean": 2162.2,
"valid_targets_min": 1507
},
{
"epoch": 1.6185897435897436,
"grad_norm": 0.8249891646453199,
"learning_rate": 3.7946429609133274e-05,
"loss": 0.3908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2153560221195221,
"step": 1010,
"valid_targets_mean": 1905.8,
"valid_targets_min": 991
},
{
"epoch": 1.626602564102564,
"grad_norm": 0.7433162943053611,
"learning_rate": 3.791101223122084e-05,
"loss": 0.3959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1687787026166916,
"step": 1015,
"valid_targets_mean": 1962.5,
"valid_targets_min": 974
},
{
"epoch": 1.6346153846153846,
"grad_norm": 0.7062532227721724,
"learning_rate": 3.787530886174688e-05,
"loss": 0.3808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14789080619812012,
"step": 1020,
"valid_targets_mean": 2009.1,
"valid_targets_min": 1159
},
{
"epoch": 1.6426282051282053,
"grad_norm": 0.7284286934878477,
"learning_rate": 3.783932007079992e-05,
"loss": 0.3724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1761750727891922,
"step": 1025,
"valid_targets_mean": 2278.1,
"valid_targets_min": 1055
},
{
"epoch": 1.6506410256410255,
"grad_norm": 0.6724344397247881,
"learning_rate": 3.7803046433025905e-05,
"loss": 0.3876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19518470764160156,
"step": 1030,
"valid_targets_mean": 2953.0,
"valid_targets_min": 1636
},
{
"epoch": 1.6586538461538463,
"grad_norm": 0.7306814326324378,
"learning_rate": 3.7766488527619024e-05,
"loss": 0.3828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2070809304714203,
"step": 1035,
"valid_targets_mean": 2797.0,
"valid_targets_min": 956
},
{
"epoch": 1.6666666666666665,
"grad_norm": 0.6966329661882152,
"learning_rate": 3.772964693831247e-05,
"loss": 0.3898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1665840744972229,
"step": 1040,
"valid_targets_mean": 2359.0,
"valid_targets_min": 1252
},
{
"epoch": 1.6746794871794872,
"grad_norm": 0.8183363093585437,
"learning_rate": 3.7692522253369136e-05,
"loss": 0.3856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20456507802009583,
"step": 1045,
"valid_targets_mean": 2110.2,
"valid_targets_min": 1108
},
{
"epoch": 1.6826923076923077,
"grad_norm": 0.7326066646720534,
"learning_rate": 3.7655115065572194e-05,
"loss": 0.3792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1852574348449707,
"step": 1050,
"valid_targets_mean": 2510.5,
"valid_targets_min": 1361
},
{
"epoch": 1.6907051282051282,
"grad_norm": 0.8179852635285826,
"learning_rate": 3.7617425972215626e-05,
"loss": 0.3651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18398068845272064,
"step": 1055,
"valid_targets_mean": 2575.1,
"valid_targets_min": 1176
},
{
"epoch": 1.6987179487179487,
"grad_norm": 0.7594138822240342,
"learning_rate": 3.757945557509472e-05,
"loss": 0.3976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2564973831176758,
"step": 1060,
"valid_targets_mean": 3293.5,
"valid_targets_min": 1092
},
{
"epoch": 1.7067307692307692,
"grad_norm": 0.7744891981574005,
"learning_rate": 3.7541204480496444e-05,
"loss": 0.436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2867600917816162,
"step": 1065,
"valid_targets_mean": 2808.5,
"valid_targets_min": 1224
},
{
"epoch": 1.7147435897435899,
"grad_norm": 0.6569368962525489,
"learning_rate": 3.7502673299189745e-05,
"loss": 0.3927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20591554045677185,
"step": 1070,
"valid_targets_mean": 3459.0,
"valid_targets_min": 1088
},
{
"epoch": 1.7227564102564101,
"grad_norm": 0.731504718928724,
"learning_rate": 3.746386264641583e-05,
"loss": 0.3947,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18665257096290588,
"step": 1075,
"valid_targets_mean": 2337.9,
"valid_targets_min": 885
},
{
"epoch": 1.7307692307692308,
"grad_norm": 0.7677480742647473,
"learning_rate": 3.7424773141878324e-05,
"loss": 0.4064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18656907975673676,
"step": 1080,
"valid_targets_mean": 2099.4,
"valid_targets_min": 1228
},
{
"epoch": 1.7387820512820513,
"grad_norm": 0.7989982560887274,
"learning_rate": 3.738540540973338e-05,
"loss": 0.3992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1916476935148239,
"step": 1085,
"valid_targets_mean": 2387.1,
"valid_targets_min": 1355
},
{
"epoch": 1.7467948717948718,
"grad_norm": 0.7713226972032743,
"learning_rate": 3.7345760078579695e-05,
"loss": 0.382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1601388305425644,
"step": 1090,
"valid_targets_mean": 1695.2,
"valid_targets_min": 269
},
{
"epoch": 1.7548076923076923,
"grad_norm": 0.7153583276085919,
"learning_rate": 3.730583778144852e-05,
"loss": 0.3881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24518054723739624,
"step": 1095,
"valid_targets_mean": 3535.8,
"valid_targets_min": 988
},
{
"epoch": 1.7628205128205128,
"grad_norm": 0.7238652347725764,
"learning_rate": 3.7265639155793494e-05,
"loss": 0.3776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15082888305187225,
"step": 1100,
"valid_targets_mean": 2375.6,
"valid_targets_min": 872
},
{
"epoch": 1.7708333333333335,
"grad_norm": 0.7597119444096863,
"learning_rate": 3.7225164843480503e-05,
"loss": 0.4042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18812818825244904,
"step": 1105,
"valid_targets_mean": 2196.5,
"valid_targets_min": 1162
},
{
"epoch": 1.7788461538461537,
"grad_norm": 0.8964624092632014,
"learning_rate": 3.7184415490777426e-05,
"loss": 0.372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.207992285490036,
"step": 1110,
"valid_targets_mean": 2188.0,
"valid_targets_min": 1124
},
{
"epoch": 1.7868589743589745,
"grad_norm": 0.6948514781192213,
"learning_rate": 3.714339174834379e-05,
"loss": 0.3726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18899385631084442,
"step": 1115,
"valid_targets_mean": 2110.8,
"valid_targets_min": 1174
},
{
"epoch": 1.7948717948717947,
"grad_norm": 0.7001908243752163,
"learning_rate": 3.710209427122044e-05,
"loss": 0.4312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19637015461921692,
"step": 1120,
"valid_targets_mean": 2747.2,
"valid_targets_min": 1109
},
{
"epoch": 1.8028846153846154,
"grad_norm": 0.6314682487629872,
"learning_rate": 3.7060523718819e-05,
"loss": 0.3815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19258755445480347,
"step": 1125,
"valid_targets_mean": 3663.5,
"valid_targets_min": 1600
},
{
"epoch": 1.810897435897436,
"grad_norm": 0.8124805310376293,
"learning_rate": 3.701868075491139e-05,
"loss": 0.4002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18830403685569763,
"step": 1130,
"valid_targets_mean": 2149.4,
"valid_targets_min": 1127
},
{
"epoch": 1.8189102564102564,
"grad_norm": 0.7453037484756837,
"learning_rate": 3.697656604761926e-05,
"loss": 0.3497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17239141464233398,
"step": 1135,
"valid_targets_mean": 2228.2,
"valid_targets_min": 1263
},
{
"epoch": 1.8269230769230769,
"grad_norm": 0.7597851188699107,
"learning_rate": 3.693418026940325e-05,
"loss": 0.3694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1435607373714447,
"step": 1140,
"valid_targets_mean": 1410.1,
"valid_targets_min": 446
},
{
"epoch": 1.8349358974358974,
"grad_norm": 0.6747261559800963,
"learning_rate": 3.689152409705229e-05,
"loss": 0.3834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1624498814344406,
"step": 1145,
"valid_targets_mean": 2713.1,
"valid_targets_min": 1090
},
{
"epoch": 1.842948717948718,
"grad_norm": 0.7735869483528329,
"learning_rate": 3.6848598211672794e-05,
"loss": 0.3872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2225751131772995,
"step": 1150,
"valid_targets_mean": 2196.0,
"valid_targets_min": 786
},
{
"epoch": 1.8509615384615383,
"grad_norm": 0.8104590197423858,
"learning_rate": 3.6805403298677797e-05,
"loss": 0.4101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1646331250667572,
"step": 1155,
"valid_targets_mean": 1976.8,
"valid_targets_min": 1181
},
{
"epoch": 1.858974358974359,
"grad_norm": 0.6609774232707526,
"learning_rate": 3.6761940047775966e-05,
"loss": 0.3791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1530018448829651,
"step": 1160,
"valid_targets_mean": 2702.2,
"valid_targets_min": 1064
},
{
"epoch": 1.8669871794871795,
"grad_norm": 0.8716057992411466,
"learning_rate": 3.671820915296063e-05,
"loss": 0.3935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22766408324241638,
"step": 1165,
"valid_targets_mean": 2449.6,
"valid_targets_min": 1228
},
{
"epoch": 1.875,
"grad_norm": 0.8210753368155098,
"learning_rate": 3.667421131249869e-05,
"loss": 0.4034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19551564753055573,
"step": 1170,
"valid_targets_mean": 1927.8,
"valid_targets_min": 1021
},
{
"epoch": 1.8830128205128205,
"grad_norm": 0.8627779649045554,
"learning_rate": 3.662994722891946e-05,
"loss": 0.3899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18560561537742615,
"step": 1175,
"valid_targets_mean": 1790.8,
"valid_targets_min": 1279
},
{
"epoch": 1.891025641025641,
"grad_norm": 0.6827904826786426,
"learning_rate": 3.658541760900344e-05,
"loss": 0.3562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19983141124248505,
"step": 1180,
"valid_targets_mean": 2813.4,
"valid_targets_min": 1533
},
{
"epoch": 1.8990384615384617,
"grad_norm": 0.6841910626255084,
"learning_rate": 3.654062316377106e-05,
"loss": 0.3845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17266666889190674,
"step": 1185,
"valid_targets_mean": 2745.6,
"valid_targets_min": 303
},
{
"epoch": 1.907051282051282,
"grad_norm": 0.8254813972995194,
"learning_rate": 3.649556460847131e-05,
"loss": 0.3928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15996776521205902,
"step": 1190,
"valid_targets_mean": 1754.0,
"valid_targets_min": 894
},
{
"epoch": 1.9150641025641026,
"grad_norm": 0.7291405879871701,
"learning_rate": 3.6450242662570314e-05,
"loss": 0.387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.192326158285141,
"step": 1195,
"valid_targets_mean": 2522.0,
"valid_targets_min": 1364
},
{
"epoch": 1.9230769230769231,
"grad_norm": 0.6684747033924835,
"learning_rate": 3.6404658049739854e-05,
"loss": 0.3701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12845301628112793,
"step": 1200,
"valid_targets_mean": 2355.8,
"valid_targets_min": 1434
},
{
"epoch": 1.9310897435897436,
"grad_norm": 0.7501902469595525,
"learning_rate": 3.63588114978458e-05,
"loss": 0.3906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20027633011341095,
"step": 1205,
"valid_targets_mean": 2796.9,
"valid_targets_min": 968
},
{
"epoch": 1.939102564102564,
"grad_norm": 0.8787778878398708,
"learning_rate": 3.6312703738936504e-05,
"loss": 0.3808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17389872670173645,
"step": 1210,
"valid_targets_mean": 1681.4,
"valid_targets_min": 1167
},
{
"epoch": 1.9471153846153846,
"grad_norm": 0.7032222031644281,
"learning_rate": 3.626633550923111e-05,
"loss": 0.3797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14461690187454224,
"step": 1215,
"valid_targets_mean": 1986.5,
"valid_targets_min": 977
},
{
"epoch": 1.9551282051282053,
"grad_norm": 0.7669477034061776,
"learning_rate": 3.621970754910778e-05,
"loss": 0.3969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.158382385969162,
"step": 1220,
"valid_targets_mean": 2008.5,
"valid_targets_min": 1022
},
{
"epoch": 1.9631410256410255,
"grad_norm": 0.7419304317666434,
"learning_rate": 3.6172820603091885e-05,
"loss": 0.3972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2039494663476944,
"step": 1225,
"valid_targets_mean": 2516.6,
"valid_targets_min": 870
},
{
"epoch": 1.9711538461538463,
"grad_norm": 0.6889071670417813,
"learning_rate": 3.612567541984413e-05,
"loss": 0.3967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14030852913856506,
"step": 1230,
"valid_targets_mean": 1680.6,
"valid_targets_min": 1042
},
{
"epoch": 1.9791666666666665,
"grad_norm": 0.7401744379682911,
"learning_rate": 3.6078272752148574e-05,
"loss": 0.3848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20165783166885376,
"step": 1235,
"valid_targets_mean": 2676.4,
"valid_targets_min": 1282
},
{
"epoch": 1.9871794871794872,
"grad_norm": 0.7127292270502633,
"learning_rate": 3.6030613356900635e-05,
"loss": 0.3778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2067841738462448,
"step": 1240,
"valid_targets_mean": 2912.0,
"valid_targets_min": 1089
},
{
"epoch": 1.9951923076923077,
"grad_norm": 0.6696204116089755,
"learning_rate": 3.598269799509498e-05,
"loss": 0.3925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.133599191904068,
"step": 1245,
"valid_targets_mean": 2193.4,
"valid_targets_min": 830
},
{
"epoch": 2.003205128205128,
"grad_norm": 0.7309611863815216,
"learning_rate": 3.5934527431813385e-05,
"loss": 0.3699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1557263731956482,
"step": 1250,
"valid_targets_mean": 2589.4,
"valid_targets_min": 1535
},
{
"epoch": 2.011217948717949,
"grad_norm": 0.7184249082256497,
"learning_rate": 3.5886102436212536e-05,
"loss": 0.3362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2098970264196396,
"step": 1255,
"valid_targets_mean": 3387.4,
"valid_targets_min": 1266
},
{
"epoch": 2.019230769230769,
"grad_norm": 0.818316424675812,
"learning_rate": 3.583742378151171e-05,
"loss": 0.3529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20294536650180817,
"step": 1260,
"valid_targets_mean": 2087.0,
"valid_targets_min": 1378
},
{
"epoch": 2.02724358974359,
"grad_norm": 0.8278234776817402,
"learning_rate": 3.5788492244980464e-05,
"loss": 0.3806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12976673245429993,
"step": 1265,
"valid_targets_mean": 1713.8,
"valid_targets_min": 1291
},
{
"epoch": 2.03525641025641,
"grad_norm": 0.6959655858741635,
"learning_rate": 3.573930860792621e-05,
"loss": 0.3472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15088346600532532,
"step": 1270,
"valid_targets_mean": 2264.1,
"valid_targets_min": 833
},
{
"epoch": 2.043269230769231,
"grad_norm": 0.7359135223433384,
"learning_rate": 3.568987365568173e-05,
"loss": 0.3635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21914812922477722,
"step": 1275,
"valid_targets_mean": 2839.2,
"valid_targets_min": 718
},
{
"epoch": 2.051282051282051,
"grad_norm": 0.7969244476786354,
"learning_rate": 3.564018817759266e-05,
"loss": 0.3536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17785009741783142,
"step": 1280,
"valid_targets_mean": 2738.1,
"valid_targets_min": 1117
},
{
"epoch": 2.059294871794872,
"grad_norm": 0.7000366520475035,
"learning_rate": 3.559025296700484e-05,
"loss": 0.3509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1585804522037506,
"step": 1285,
"valid_targets_mean": 2884.6,
"valid_targets_min": 1399
},
{
"epoch": 2.0673076923076925,
"grad_norm": 0.8302999135088763,
"learning_rate": 3.554006882125173e-05,
"loss": 0.346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1665937602519989,
"step": 1290,
"valid_targets_mean": 2208.9,
"valid_targets_min": 1027
},
{
"epoch": 2.0753205128205128,
"grad_norm": 0.6867619519062099,
"learning_rate": 3.5489636541641586e-05,
"loss": 0.3343,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1533121019601822,
"step": 1295,
"valid_targets_mean": 2485.8,
"valid_targets_min": 1319
},
{
"epoch": 2.0833333333333335,
"grad_norm": 0.7660992574595947,
"learning_rate": 3.543895693344472e-05,
"loss": 0.3459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2186858355998993,
"step": 1300,
"valid_targets_mean": 3234.2,
"valid_targets_min": 1875
},
{
"epoch": 2.0913461538461537,
"grad_norm": 0.7111187839614682,
"learning_rate": 3.538803080588063e-05,
"loss": 0.3338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1263820230960846,
"step": 1305,
"valid_targets_mean": 2168.0,
"valid_targets_min": 557
},
{
"epoch": 2.0993589743589745,
"grad_norm": 0.8189330742251553,
"learning_rate": 3.5336858972105076e-05,
"loss": 0.3724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17902137339115143,
"step": 1310,
"valid_targets_mean": 2206.6,
"valid_targets_min": 389
},
{
"epoch": 2.1073717948717947,
"grad_norm": 0.6791884046018158,
"learning_rate": 3.528544224919708e-05,
"loss": 0.3539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2036716639995575,
"step": 1315,
"valid_targets_mean": 3792.5,
"valid_targets_min": 807
},
{
"epoch": 2.1153846153846154,
"grad_norm": 0.7284182583266996,
"learning_rate": 3.5233781458145934e-05,
"loss": 0.3485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20440541207790375,
"step": 1320,
"valid_targets_mean": 3414.0,
"valid_targets_min": 989
},
{
"epoch": 2.123397435897436,
"grad_norm": 0.8141069191193862,
"learning_rate": 3.5181877423838034e-05,
"loss": 0.3478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12585687637329102,
"step": 1325,
"valid_targets_mean": 1891.8,
"valid_targets_min": 329
},
{
"epoch": 2.1314102564102564,
"grad_norm": 0.7779645588888344,
"learning_rate": 3.512973097504371e-05,
"loss": 0.348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19460856914520264,
"step": 1330,
"valid_targets_mean": 2242.0,
"valid_targets_min": 1178
},
{
"epoch": 2.139423076923077,
"grad_norm": 0.7927049005753485,
"learning_rate": 3.507734294440403e-05,
"loss": 0.3607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14881053566932678,
"step": 1335,
"valid_targets_mean": 1846.4,
"valid_targets_min": 1157
},
{
"epoch": 2.1474358974358974,
"grad_norm": 1.2475102978708894,
"learning_rate": 3.50247141684175e-05,
"loss": 0.344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17731156945228577,
"step": 1340,
"valid_targets_mean": 1948.9,
"valid_targets_min": 811
},
{
"epoch": 2.155448717948718,
"grad_norm": 0.8006723258352239,
"learning_rate": 3.497184548742667e-05,
"loss": 0.3328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14808142185211182,
"step": 1345,
"valid_targets_mean": 2546.2,
"valid_targets_min": 1636
},
{
"epoch": 2.1634615384615383,
"grad_norm": 0.7877170951828761,
"learning_rate": 3.491873774560473e-05,
"loss": 0.3593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15312331914901733,
"step": 1350,
"valid_targets_mean": 2226.0,
"valid_targets_min": 1151
},
{
"epoch": 2.171474358974359,
"grad_norm": 0.7625814945603144,
"learning_rate": 3.486539179094208e-05,
"loss": 0.3636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1644267737865448,
"step": 1355,
"valid_targets_mean": 2441.2,
"valid_targets_min": 1147
},
{
"epoch": 2.1794871794871793,
"grad_norm": 0.7774543384531808,
"learning_rate": 3.481180847523272e-05,
"loss": 0.3601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20621232688426971,
"step": 1360,
"valid_targets_mean": 2525.8,
"valid_targets_min": 884
},
{
"epoch": 2.1875,
"grad_norm": 0.7288588923791031,
"learning_rate": 3.4757988654060684e-05,
"loss": 0.341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20766200125217438,
"step": 1365,
"valid_targets_mean": 3249.2,
"valid_targets_min": 1425
},
{
"epoch": 2.1955128205128207,
"grad_norm": 0.8803087140032898,
"learning_rate": 3.470393318678637e-05,
"loss": 0.3466,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18664687871932983,
"step": 1370,
"valid_targets_mean": 1891.2,
"valid_targets_min": 1214
},
{
"epoch": 2.203525641025641,
"grad_norm": 0.9072383303435303,
"learning_rate": 3.4649642936532836e-05,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16699038445949554,
"step": 1375,
"valid_targets_mean": 2271.9,
"valid_targets_min": 1252
},
{
"epoch": 2.2115384615384617,
"grad_norm": 0.8374276049391025,
"learning_rate": 3.4595118770171984e-05,
"loss": 0.338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19499821960926056,
"step": 1380,
"valid_targets_mean": 2261.1,
"valid_targets_min": 921
},
{
"epoch": 2.219551282051282,
"grad_norm": 0.7110224511296612,
"learning_rate": 3.454036155831077e-05,
"loss": 0.3402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16453278064727783,
"step": 1385,
"valid_targets_mean": 3003.4,
"valid_targets_min": 984
},
{
"epoch": 2.2275641025641026,
"grad_norm": 0.8034598679262911,
"learning_rate": 3.4485372175277236e-05,
"loss": 0.339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21522057056427002,
"step": 1390,
"valid_targets_mean": 2669.6,
"valid_targets_min": 1629
},
{
"epoch": 2.235576923076923,
"grad_norm": 0.936818141069857,
"learning_rate": 3.44301514991066e-05,
"loss": 0.3514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18182526528835297,
"step": 1395,
"valid_targets_mean": 1872.4,
"valid_targets_min": 789
},
{
"epoch": 2.2435897435897436,
"grad_norm": 1.0145081834032068,
"learning_rate": 3.4374700411527225e-05,
"loss": 0.3338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18463921546936035,
"step": 1400,
"valid_targets_mean": 2367.8,
"valid_targets_min": 1028
},
{
"epoch": 2.251602564102564,
"grad_norm": 0.8485161257861278,
"learning_rate": 3.431901979794653e-05,
"loss": 0.3413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22386862337589264,
"step": 1405,
"valid_targets_mean": 2464.2,
"valid_targets_min": 1088
},
{
"epoch": 2.2596153846153846,
"grad_norm": 0.6648536661400917,
"learning_rate": 3.426311054743685e-05,
"loss": 0.3317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17803597450256348,
"step": 1410,
"valid_targets_mean": 2665.6,
"valid_targets_min": 663
},
{
"epoch": 2.2676282051282053,
"grad_norm": 0.8127131589772357,
"learning_rate": 3.420697355272127e-05,
"loss": 0.3681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18442665040493011,
"step": 1415,
"valid_targets_mean": 2133.6,
"valid_targets_min": 1183
},
{
"epoch": 2.2756410256410255,
"grad_norm": 0.7669669977387416,
"learning_rate": 3.415060971015933e-05,
"loss": 0.3398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14786052703857422,
"step": 1420,
"valid_targets_mean": 2188.1,
"valid_targets_min": 1065
},
{
"epoch": 2.2836538461538463,
"grad_norm": 0.6858864773705935,
"learning_rate": 3.4094019919732736e-05,
"loss": 0.3458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18889179825782776,
"step": 1425,
"valid_targets_mean": 3692.6,
"valid_targets_min": 1097
},
{
"epoch": 2.2916666666666665,
"grad_norm": 0.7713618046589539,
"learning_rate": 3.403720508503098e-05,
"loss": 0.3686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15971162915229797,
"step": 1430,
"valid_targets_mean": 2336.1,
"valid_targets_min": 416
},
{
"epoch": 2.2996794871794872,
"grad_norm": 0.929199437687356,
"learning_rate": 3.398016611323693e-05,
"loss": 0.3483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20525173842906952,
"step": 1435,
"valid_targets_mean": 2049.9,
"valid_targets_min": 1188
},
{
"epoch": 2.3076923076923075,
"grad_norm": 0.7351797681344957,
"learning_rate": 3.392290391511232e-05,
"loss": 0.362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19388672709465027,
"step": 1440,
"valid_targets_mean": 2718.4,
"valid_targets_min": 1272
},
{
"epoch": 2.315705128205128,
"grad_norm": 0.7830095585397322,
"learning_rate": 3.386541940498322e-05,
"loss": 0.3424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.200042262673378,
"step": 1445,
"valid_targets_mean": 2492.6,
"valid_targets_min": 1031
},
{
"epoch": 2.323717948717949,
"grad_norm": 0.7260002191823239,
"learning_rate": 3.380771350072543e-05,
"loss": 0.3463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20473235845565796,
"step": 1450,
"valid_targets_mean": 3114.0,
"valid_targets_min": 1678
},
{
"epoch": 2.331730769230769,
"grad_norm": 0.7003366188583651,
"learning_rate": 3.374978712374986e-05,
"loss": 0.3536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1109727993607521,
"step": 1455,
"valid_targets_mean": 1764.2,
"valid_targets_min": 853
},
{
"epoch": 2.33974358974359,
"grad_norm": 0.7556951896666148,
"learning_rate": 3.369164119898774e-05,
"loss": 0.3393,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17174313962459564,
"step": 1460,
"valid_targets_mean": 2113.0,
"valid_targets_min": 1189
},
{
"epoch": 2.34775641025641,
"grad_norm": 0.8200928309772625,
"learning_rate": 3.363327665487593e-05,
"loss": 0.3544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15979711711406708,
"step": 1465,
"valid_targets_mean": 2258.0,
"valid_targets_min": 1672
},
{
"epoch": 2.355769230769231,
"grad_norm": 0.8309370694493936,
"learning_rate": 3.357469442334206e-05,
"loss": 0.3346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14197608828544617,
"step": 1470,
"valid_targets_mean": 1783.0,
"valid_targets_min": 1057
},
{
"epoch": 2.363782051282051,
"grad_norm": 0.7797104980045181,
"learning_rate": 3.351589543978965e-05,
"loss": 0.3431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17039065062999725,
"step": 1475,
"valid_targets_mean": 2508.9,
"valid_targets_min": 1190
},
{
"epoch": 2.371794871794872,
"grad_norm": 0.7814917434524874,
"learning_rate": 3.345688064308317e-05,
"loss": 0.3274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15709833800792694,
"step": 1480,
"valid_targets_mean": 1788.9,
"valid_targets_min": 242
},
{
"epoch": 2.3798076923076925,
"grad_norm": 0.8902647624043396,
"learning_rate": 3.339765097553307e-05,
"loss": 0.376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1867244690656662,
"step": 1485,
"valid_targets_mean": 1679.9,
"valid_targets_min": 387
},
{
"epoch": 2.3878205128205128,
"grad_norm": 0.7346094387599812,
"learning_rate": 3.33382073828807e-05,
"loss": 0.3471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13888698816299438,
"step": 1490,
"valid_targets_mean": 2292.5,
"valid_targets_min": 1131
},
{
"epoch": 2.3958333333333335,
"grad_norm": 0.9446299732229079,
"learning_rate": 3.327855081428326e-05,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18648427724838257,
"step": 1495,
"valid_targets_mean": 2009.9,
"valid_targets_min": 953
},
{
"epoch": 2.4038461538461537,
"grad_norm": 0.9536703972245442,
"learning_rate": 3.3218682222298584e-05,
"loss": 0.354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1705888956785202,
"step": 1500,
"valid_targets_mean": 2930.1,
"valid_targets_min": 1317
},
{
"epoch": 2.4118589743589745,
"grad_norm": 0.7903036062618911,
"learning_rate": 3.315860256286996e-05,
"loss": 0.3293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13649359345436096,
"step": 1505,
"valid_targets_mean": 1522.0,
"valid_targets_min": 971
},
{
"epoch": 2.4198717948717947,
"grad_norm": 0.9511143375417098,
"learning_rate": 3.3098312795310894e-05,
"loss": 0.3604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16688911616802216,
"step": 1510,
"valid_targets_mean": 1994.0,
"valid_targets_min": 1433
},
{
"epoch": 2.4278846153846154,
"grad_norm": 0.7414997447826995,
"learning_rate": 3.303781388228974e-05,
"loss": 0.3339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19089877605438232,
"step": 1515,
"valid_targets_mean": 2811.2,
"valid_targets_min": 1503
},
{
"epoch": 2.435897435897436,
"grad_norm": 0.767828117255108,
"learning_rate": 3.297710678981435e-05,
"loss": 0.3574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14534533023834229,
"step": 1520,
"valid_targets_mean": 2010.8,
"valid_targets_min": 1053
},
{
"epoch": 2.4439102564102564,
"grad_norm": 0.7887402243405925,
"learning_rate": 3.291619248721667e-05,
"loss": 0.3573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18452662229537964,
"step": 1525,
"valid_targets_mean": 2406.5,
"valid_targets_min": 949
},
{
"epoch": 2.451923076923077,
"grad_norm": 0.8651403875034883,
"learning_rate": 3.285507194713724e-05,
"loss": 0.3432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21715617179870605,
"step": 1530,
"valid_targets_mean": 2057.1,
"valid_targets_min": 249
},
{
"epoch": 2.4599358974358974,
"grad_norm": 0.9068357442847398,
"learning_rate": 3.279374614550966e-05,
"loss": 0.3353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1632959544658661,
"step": 1535,
"valid_targets_mean": 1864.1,
"valid_targets_min": 500
},
{
"epoch": 2.467948717948718,
"grad_norm": 0.745269665162631,
"learning_rate": 3.2732216061545e-05,
"loss": 0.342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1703471690416336,
"step": 1540,
"valid_targets_mean": 2952.0,
"valid_targets_min": 508
},
{
"epoch": 2.4759615384615383,
"grad_norm": 0.7463621637326882,
"learning_rate": 3.2670482677716214e-05,
"loss": 0.3561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12429662048816681,
"step": 1545,
"valid_targets_mean": 1754.8,
"valid_targets_min": 868
},
{
"epoch": 2.483974358974359,
"grad_norm": 0.6632562787335162,
"learning_rate": 3.2608546979742394e-05,
"loss": 0.3604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.142435684800148,
"step": 1550,
"valid_targets_mean": 2705.5,
"valid_targets_min": 1315
},
{
"epoch": 2.4919871794871793,
"grad_norm": 1.0979260579943735,
"learning_rate": 3.254640995657307e-05,
"loss": 0.3423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17696614563465118,
"step": 1555,
"valid_targets_mean": 2757.8,
"valid_targets_min": 1335
},
{
"epoch": 2.5,
"grad_norm": 0.718451828389939,
"learning_rate": 3.248407260037239e-05,
"loss": 0.3522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17623674869537354,
"step": 1560,
"valid_targets_mean": 3102.8,
"valid_targets_min": 1101
},
{
"epoch": 2.5080128205128203,
"grad_norm": 0.5714615297855816,
"learning_rate": 3.24215359065033e-05,
"loss": 0.3451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11917003989219666,
"step": 1565,
"valid_targets_mean": 3913.8,
"valid_targets_min": 1852
},
{
"epoch": 2.516025641025641,
"grad_norm": 0.7253937767608349,
"learning_rate": 3.235880087351164e-05,
"loss": 0.3532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13781258463859558,
"step": 1570,
"valid_targets_mean": 2443.8,
"valid_targets_min": 1277
},
{
"epoch": 2.5240384615384617,
"grad_norm": 0.7141718259882394,
"learning_rate": 3.2295868503110184e-05,
"loss": 0.336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1570618599653244,
"step": 1575,
"valid_targets_mean": 2712.8,
"valid_targets_min": 1092
},
{
"epoch": 2.532051282051282,
"grad_norm": 0.7370659727178314,
"learning_rate": 3.22327398001627e-05,
"loss": 0.3498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16354694962501526,
"step": 1580,
"valid_targets_mean": 2248.0,
"valid_targets_min": 1015
},
{
"epoch": 2.5400641025641026,
"grad_norm": 0.8429155440531665,
"learning_rate": 3.216941577266783e-05,
"loss": 0.3389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18911314010620117,
"step": 1585,
"valid_targets_mean": 1692.5,
"valid_targets_min": 473
},
{
"epoch": 2.5480769230769234,
"grad_norm": 0.8850080126831343,
"learning_rate": 3.210589743174308e-05,
"loss": 0.376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25558894872665405,
"step": 1590,
"valid_targets_mean": 2742.9,
"valid_targets_min": 968
},
{
"epoch": 2.5560897435897436,
"grad_norm": 0.7791032617822178,
"learning_rate": 3.204218579160857e-05,
"loss": 0.3491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1383132040500641,
"step": 1595,
"valid_targets_mean": 2072.0,
"valid_targets_min": 1294
},
{
"epoch": 2.564102564102564,
"grad_norm": 0.8381378811245371,
"learning_rate": 3.197828186957094e-05,
"loss": 0.344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18840298056602478,
"step": 1600,
"valid_targets_mean": 1596.6,
"valid_targets_min": 338
},
{
"epoch": 2.5721153846153846,
"grad_norm": 0.8590646227884097,
"learning_rate": 3.191418668600705e-05,
"loss": 0.3538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16716593503952026,
"step": 1605,
"valid_targets_mean": 1956.9,
"valid_targets_min": 1305
},
{
"epoch": 2.5801282051282053,
"grad_norm": 0.827636937072311,
"learning_rate": 3.184990126434771e-05,
"loss": 0.3496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18711942434310913,
"step": 1610,
"valid_targets_mean": 2087.8,
"valid_targets_min": 941
},
{
"epoch": 2.5881410256410255,
"grad_norm": 0.7476429637498967,
"learning_rate": 3.178542663106131e-05,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1350896656513214,
"step": 1615,
"valid_targets_mean": 1842.0,
"valid_targets_min": 1224
},
{
"epoch": 2.5961538461538463,
"grad_norm": 0.6440604251073735,
"learning_rate": 3.172076381563748e-05,
"loss": 0.3368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1780594140291214,
"step": 1620,
"valid_targets_mean": 3939.6,
"valid_targets_min": 1489
},
{
"epoch": 2.6041666666666665,
"grad_norm": 0.8225690775334342,
"learning_rate": 3.165591385057058e-05,
"loss": 0.3391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13189071416854858,
"step": 1625,
"valid_targets_mean": 1886.9,
"valid_targets_min": 895
},
{
"epoch": 2.6121794871794872,
"grad_norm": 0.7321770207000557,
"learning_rate": 3.1590877771343316e-05,
"loss": 0.3349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2012443244457245,
"step": 1630,
"valid_targets_mean": 3346.5,
"valid_targets_min": 1084
},
{
"epoch": 2.6201923076923075,
"grad_norm": 0.7457391847366335,
"learning_rate": 3.152565661641008e-05,
"loss": 0.3506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17787332832813263,
"step": 1635,
"valid_targets_mean": 2177.1,
"valid_targets_min": 934
},
{
"epoch": 2.628205128205128,
"grad_norm": 0.7502464415879065,
"learning_rate": 3.1460251427180474e-05,
"loss": 0.3503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16391557455062866,
"step": 1640,
"valid_targets_mean": 2989.6,
"valid_targets_min": 997
},
{
"epoch": 2.636217948717949,
"grad_norm": 0.9095546327940534,
"learning_rate": 3.139466324800263e-05,
"loss": 0.3692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1844089925289154,
"step": 1645,
"valid_targets_mean": 1437.8,
"valid_targets_min": 792
},
{
"epoch": 2.644230769230769,
"grad_norm": 0.7167811943459642,
"learning_rate": 3.132889312614655e-05,
"loss": 0.325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1620154082775116,
"step": 1650,
"valid_targets_mean": 2718.0,
"valid_targets_min": 767
},
{
"epoch": 2.65224358974359,
"grad_norm": 0.7082837484361146,
"learning_rate": 3.126294211178737e-05,
"loss": 0.3712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22598208487033844,
"step": 1655,
"valid_targets_mean": 3451.8,
"valid_targets_min": 959
},
{
"epoch": 2.66025641025641,
"grad_norm": 0.7905440205287989,
"learning_rate": 3.1196811257988634e-05,
"loss": 0.3238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.166299968957901,
"step": 1660,
"valid_targets_mean": 2094.1,
"valid_targets_min": 882
},
{
"epoch": 2.668269230769231,
"grad_norm": 0.7476779090208169,
"learning_rate": 3.1130501620685394e-05,
"loss": 0.3436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13155703246593475,
"step": 1665,
"valid_targets_mean": 2074.2,
"valid_targets_min": 1097
},
{
"epoch": 2.676282051282051,
"grad_norm": 0.614252113316522,
"learning_rate": 3.106401425866745e-05,
"loss": 0.3477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11827291548252106,
"step": 1670,
"valid_targets_mean": 2858.2,
"valid_targets_min": 912
},
{
"epoch": 2.684294871794872,
"grad_norm": 0.8246290440439452,
"learning_rate": 3.099735023356236e-05,
"loss": 0.347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21760646998882294,
"step": 1675,
"valid_targets_mean": 2478.5,
"valid_targets_min": 1126
},
{
"epoch": 2.6923076923076925,
"grad_norm": 0.8477067106504065,
"learning_rate": 3.0930510609818564e-05,
"loss": 0.3248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18377399444580078,
"step": 1680,
"valid_targets_mean": 2193.5,
"valid_targets_min": 1098
},
{
"epoch": 2.7003205128205128,
"grad_norm": 0.743871662197125,
"learning_rate": 3.086349645468831e-05,
"loss": 0.3422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16777920722961426,
"step": 1685,
"valid_targets_mean": 2257.5,
"valid_targets_min": 958
},
{
"epoch": 2.7083333333333335,
"grad_norm": 0.8446130888099646,
"learning_rate": 3.079630883821067e-05,
"loss": 0.3332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1785382628440857,
"step": 1690,
"valid_targets_mean": 2225.0,
"valid_targets_min": 1133
},
{
"epoch": 2.7163461538461537,
"grad_norm": 0.7190320385340914,
"learning_rate": 3.0728948833194436e-05,
"loss": 0.3663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1873319000005722,
"step": 1695,
"valid_targets_mean": 3258.6,
"valid_targets_min": 1604
},
{
"epoch": 2.7243589743589745,
"grad_norm": 0.7955833242225298,
"learning_rate": 3.066141751520099e-05,
"loss": 0.3468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16164278984069824,
"step": 1700,
"valid_targets_mean": 2220.6,
"valid_targets_min": 948
},
{
"epoch": 2.7323717948717947,
"grad_norm": 0.8727727023841495,
"learning_rate": 3.059371596252712e-05,
"loss": 0.3399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1807830035686493,
"step": 1705,
"valid_targets_mean": 2360.4,
"valid_targets_min": 1186
},
{
"epoch": 2.7403846153846154,
"grad_norm": 0.8285434490328112,
"learning_rate": 3.0525845256187834e-05,
"loss": 0.3647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19549046456813812,
"step": 1710,
"valid_targets_mean": 2300.2,
"valid_targets_min": 1139
},
{
"epoch": 2.748397435897436,
"grad_norm": 0.6665940354235458,
"learning_rate": 3.0457806479899044e-05,
"loss": 0.3145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1639786660671234,
"step": 1715,
"valid_targets_mean": 3070.1,
"valid_targets_min": 1047
},
{
"epoch": 2.7564102564102564,
"grad_norm": 0.7400644302712954,
"learning_rate": 3.0389600720060318e-05,
"loss": 0.344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15920796990394592,
"step": 1720,
"valid_targets_mean": 2484.5,
"valid_targets_min": 1521
},
{
"epoch": 2.7644230769230766,
"grad_norm": 0.6529233923053657,
"learning_rate": 3.0321229065737522e-05,
"loss": 0.3434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15723413228988647,
"step": 1725,
"valid_targets_mean": 2664.8,
"valid_targets_min": 1180
},
{
"epoch": 2.7724358974358974,
"grad_norm": 0.9818917911509216,
"learning_rate": 3.0252692608645384e-05,
"loss": 0.3592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18439249694347382,
"step": 1730,
"valid_targets_mean": 1599.9,
"valid_targets_min": 931
},
{
"epoch": 2.780448717948718,
"grad_norm": 0.7429322400334534,
"learning_rate": 3.0183992443130127e-05,
"loss": 0.3221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1347109079360962,
"step": 1735,
"valid_targets_mean": 2627.2,
"valid_targets_min": 1023
},
{
"epoch": 2.7884615384615383,
"grad_norm": 0.825330415012023,
"learning_rate": 3.011512966615195e-05,
"loss": 0.3568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1733407974243164,
"step": 1740,
"valid_targets_mean": 2149.0,
"valid_targets_min": 991
},
{
"epoch": 2.796474358974359,
"grad_norm": 0.7695789184189072,
"learning_rate": 3.0046105377267523e-05,
"loss": 0.3452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13556677103042603,
"step": 1745,
"valid_targets_mean": 2014.4,
"valid_targets_min": 1220
},
{
"epoch": 2.8044871794871797,
"grad_norm": 0.7365188240450388,
"learning_rate": 2.9976920678612456e-05,
"loss": 0.3379,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19936934113502502,
"step": 1750,
"valid_targets_mean": 3110.4,
"valid_targets_min": 1290
},
{
"epoch": 2.8125,
"grad_norm": 0.7010220729446671,
"learning_rate": 2.9907576674883664e-05,
"loss": 0.3527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14287908375263214,
"step": 1755,
"valid_targets_mean": 2108.6,
"valid_targets_min": 1171
},
{
"epoch": 2.8205128205128203,
"grad_norm": 1.0422014811559845,
"learning_rate": 2.983807447332174e-05,
"loss": 0.3366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19687989354133606,
"step": 1760,
"valid_targets_mean": 2476.4,
"valid_targets_min": 828
},
{
"epoch": 2.828525641025641,
"grad_norm": 0.7770747301590775,
"learning_rate": 2.9768415183693293e-05,
"loss": 0.3622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19372722506523132,
"step": 1765,
"valid_targets_mean": 2394.9,
"valid_targets_min": 577
},
{
"epoch": 2.8365384615384617,
"grad_norm": 0.7422438539405928,
"learning_rate": 2.9698599918273197e-05,
"loss": 0.3448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1415659487247467,
"step": 1770,
"valid_targets_mean": 1877.5,
"valid_targets_min": 836
},
{
"epoch": 2.844551282051282,
"grad_norm": 0.8216346096786719,
"learning_rate": 2.962862979182686e-05,
"loss": 0.3372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17512428760528564,
"step": 1775,
"valid_targets_mean": 2119.5,
"valid_targets_min": 1289
},
{
"epoch": 2.8525641025641026,
"grad_norm": 0.6864990682783045,
"learning_rate": 2.95585059215924e-05,
"loss": 0.3494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14896155893802643,
"step": 1780,
"valid_targets_mean": 2570.9,
"valid_targets_min": 1166
},
{
"epoch": 2.8605769230769234,
"grad_norm": 0.7673674716714654,
"learning_rate": 2.948822942726284e-05,
"loss": 0.3436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1696726679801941,
"step": 1785,
"valid_targets_mean": 2115.2,
"valid_targets_min": 1126
},
{
"epoch": 2.8685897435897436,
"grad_norm": 0.787999238286826,
"learning_rate": 2.941780143096817e-05,
"loss": 0.3485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23070955276489258,
"step": 1790,
"valid_targets_mean": 2714.6,
"valid_targets_min": 1237
},
{
"epoch": 2.876602564102564,
"grad_norm": 0.6927465574387711,
"learning_rate": 2.9347223057257505e-05,
"loss": 0.3081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15984871983528137,
"step": 1795,
"valid_targets_mean": 2840.6,
"valid_targets_min": 1456
},
{
"epoch": 2.8846153846153846,
"grad_norm": 0.7229524925061765,
"learning_rate": 2.927649543308106e-05,
"loss": 0.3195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1824902594089508,
"step": 1800,
"valid_targets_mean": 2636.5,
"valid_targets_min": 1155
},
{
"epoch": 2.8926282051282053,
"grad_norm": 0.9207234756930798,
"learning_rate": 2.9205619687772212e-05,
"loss": 0.3468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.194568932056427,
"step": 1805,
"valid_targets_mean": 2309.9,
"valid_targets_min": 1418
},
{
"epoch": 2.9006410256410255,
"grad_norm": 0.8484173433057807,
"learning_rate": 2.9134596953029413e-05,
"loss": 0.3508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18519386649131775,
"step": 1810,
"valid_targets_mean": 1788.4,
"valid_targets_min": 1265
},
{
"epoch": 2.9086538461538463,
"grad_norm": 0.8106235389071998,
"learning_rate": 2.9063428362898168e-05,
"loss": 0.3538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18934476375579834,
"step": 1815,
"valid_targets_mean": 2666.2,
"valid_targets_min": 1363
},
{
"epoch": 2.9166666666666665,
"grad_norm": 0.8083685538552774,
"learning_rate": 2.8992115053752905e-05,
"loss": 0.336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21094626188278198,
"step": 1820,
"valid_targets_mean": 2983.9,
"valid_targets_min": 859
},
{
"epoch": 2.9246794871794872,
"grad_norm": 0.683223511020343,
"learning_rate": 2.8920658164278816e-05,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19165866076946259,
"step": 1825,
"valid_targets_mean": 3494.6,
"valid_targets_min": 1391
},
{
"epoch": 2.9326923076923075,
"grad_norm": 0.7022396849802295,
"learning_rate": 2.884905883545373e-05,
"loss": 0.3389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1804656982421875,
"step": 1830,
"valid_targets_mean": 2772.4,
"valid_targets_min": 1289
},
{
"epoch": 2.940705128205128,
"grad_norm": 0.699550022589993,
"learning_rate": 2.877731821052981e-05,
"loss": 0.3475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15796631574630737,
"step": 1835,
"valid_targets_mean": 2599.6,
"valid_targets_min": 985
},
{
"epoch": 2.948717948717949,
"grad_norm": 0.7457851430690988,
"learning_rate": 2.8705437435015375e-05,
"loss": 0.3592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1569703370332718,
"step": 1840,
"valid_targets_mean": 2262.1,
"valid_targets_min": 1235
},
{
"epoch": 2.956730769230769,
"grad_norm": 0.8448740229638224,
"learning_rate": 2.8633417656656566e-05,
"loss": 0.3345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19404947757720947,
"step": 1845,
"valid_targets_mean": 1978.1,
"valid_targets_min": 909
},
{
"epoch": 2.96474358974359,
"grad_norm": 0.8042048534440943,
"learning_rate": 2.8561260025419036e-05,
"loss": 0.3377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18623505532741547,
"step": 1850,
"valid_targets_mean": 2426.5,
"valid_targets_min": 980
},
{
"epoch": 2.97275641025641,
"grad_norm": 0.7147551803870944,
"learning_rate": 2.8488965693469583e-05,
"loss": 0.328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19029518961906433,
"step": 1855,
"valid_targets_mean": 2745.0,
"valid_targets_min": 1748
},
{
"epoch": 2.980769230769231,
"grad_norm": 0.7361534209295404,
"learning_rate": 2.8416535815157763e-05,
"loss": 0.3141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1878901571035385,
"step": 1860,
"valid_targets_mean": 2995.4,
"valid_targets_min": 1033
},
{
"epoch": 2.988782051282051,
"grad_norm": 0.7658891299385264,
"learning_rate": 2.8343971546997434e-05,
"loss": 0.3467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16783340275287628,
"step": 1865,
"valid_targets_mean": 2798.8,
"valid_targets_min": 383
},
{
"epoch": 2.996794871794872,
"grad_norm": 0.7446832022601828,
"learning_rate": 2.827127404764831e-05,
"loss": 0.3496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16190892457962036,
"step": 1870,
"valid_targets_mean": 2053.6,
"valid_targets_min": 895
},
{
"epoch": 3.0048076923076925,
"grad_norm": 0.7325957115374676,
"learning_rate": 2.8198444477897467e-05,
"loss": 0.3039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1726066768169403,
"step": 1875,
"valid_targets_mean": 2703.5,
"valid_targets_min": 321
},
{
"epoch": 3.0128205128205128,
"grad_norm": 0.8146787211464528,
"learning_rate": 2.8125484000640787e-05,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14417630434036255,
"step": 1880,
"valid_targets_mean": 2497.8,
"valid_targets_min": 1203
},
{
"epoch": 3.0208333333333335,
"grad_norm": 0.8406399733518674,
"learning_rate": 2.8052393780864394e-05,
"loss": 0.3054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1478326916694641,
"step": 1885,
"valid_targets_mean": 2281.6,
"valid_targets_min": 1267
},
{
"epoch": 3.0288461538461537,
"grad_norm": 0.7160031702370862,
"learning_rate": 2.797917498562607e-05,
"loss": 0.294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13371425867080688,
"step": 1890,
"valid_targets_mean": 3478.1,
"valid_targets_min": 2443
},
{
"epoch": 3.0368589743589745,
"grad_norm": 0.7856133018379108,
"learning_rate": 2.7905828784036596e-05,
"loss": 0.2932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19632607698440552,
"step": 1895,
"valid_targets_mean": 3087.1,
"valid_targets_min": 1181
},
{
"epoch": 3.0448717948717947,
"grad_norm": 0.947660312509705,
"learning_rate": 2.78323563472411e-05,
"loss": 0.3186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13372501730918884,
"step": 1900,
"valid_targets_mean": 1653.9,
"valid_targets_min": 1072
},
{
"epoch": 3.0528846153846154,
"grad_norm": 0.9400847917635448,
"learning_rate": 2.7758758848400354e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1144673079252243,
"step": 1905,
"valid_targets_mean": 1697.1,
"valid_targets_min": 859
},
{
"epoch": 3.0608974358974357,
"grad_norm": 0.7027648710059686,
"learning_rate": 2.7685037462672043e-05,
"loss": 0.3216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10471771657466888,
"step": 1910,
"valid_targets_mean": 2158.2,
"valid_targets_min": 1249
},
{
"epoch": 3.0689102564102564,
"grad_norm": 0.9402109201312709,
"learning_rate": 2.7611193367191993e-05,
"loss": 0.3119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21580298244953156,
"step": 1915,
"valid_targets_mean": 2296.0,
"valid_targets_min": 1001
},
{
"epoch": 3.076923076923077,
"grad_norm": 0.9572841906462561,
"learning_rate": 2.7537227741055378e-05,
"loss": 0.3104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1641775518655777,
"step": 1920,
"valid_targets_mean": 1653.5,
"valid_targets_min": 1161
},
{
"epoch": 3.0849358974358974,
"grad_norm": 0.729963052156269,
"learning_rate": 2.746314176529791e-05,
"loss": 0.2922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14104565978050232,
"step": 1925,
"valid_targets_mean": 2807.6,
"valid_targets_min": 1764
},
{
"epoch": 3.092948717948718,
"grad_norm": 0.7748643309949854,
"learning_rate": 2.7388936622876957e-05,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1505746990442276,
"step": 1930,
"valid_targets_mean": 2144.5,
"valid_targets_min": 960
},
{
"epoch": 3.1009615384615383,
"grad_norm": 0.7762780237813749,
"learning_rate": 2.7314613498652663e-05,
"loss": 0.2857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17231060564517975,
"step": 1935,
"valid_targets_mean": 3336.2,
"valid_targets_min": 1030
},
{
"epoch": 3.108974358974359,
"grad_norm": 0.6722190788058807,
"learning_rate": 2.7240173579369025e-05,
"loss": 0.2833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14252430200576782,
"step": 1940,
"valid_targets_mean": 3849.6,
"valid_targets_min": 1573
},
{
"epoch": 3.1169871794871793,
"grad_norm": 0.9430632446810732,
"learning_rate": 2.7165618053634962e-05,
"loss": 0.3255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1814703643321991,
"step": 1945,
"valid_targets_mean": 2009.1,
"valid_targets_min": 1026
},
{
"epoch": 3.125,
"grad_norm": 0.7277451337056141,
"learning_rate": 2.7090948111905304e-05,
"loss": 0.283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15981590747833252,
"step": 1950,
"valid_targets_mean": 3229.4,
"valid_targets_min": 979
},
{
"epoch": 3.1330128205128207,
"grad_norm": 0.8461152648042034,
"learning_rate": 2.701616494646183e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1708703637123108,
"step": 1955,
"valid_targets_mean": 2370.4,
"valid_targets_min": 1092
},
{
"epoch": 3.141025641025641,
"grad_norm": 0.8759130229646693,
"learning_rate": 2.6941269751394174e-05,
"loss": 0.3199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1723184883594513,
"step": 1960,
"valid_targets_mean": 2504.0,
"valid_targets_min": 929
},
{
"epoch": 3.1490384615384617,
"grad_norm": 0.8760804346780584,
"learning_rate": 2.686626372258081e-05,
"loss": 0.3108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1883678436279297,
"step": 1965,
"valid_targets_mean": 2763.2,
"valid_targets_min": 1438
},
{
"epoch": 3.157051282051282,
"grad_norm": 0.7824998399362582,
"learning_rate": 2.6791148057669913e-05,
"loss": 0.3121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14598461985588074,
"step": 1970,
"valid_targets_mean": 1893.1,
"valid_targets_min": 811
},
{
"epoch": 3.1650641025641026,
"grad_norm": 0.7207162402545875,
"learning_rate": 2.671592395606027e-05,
"loss": 0.2963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1699347198009491,
"step": 1975,
"valid_targets_mean": 3550.0,
"valid_targets_min": 1056
},
{
"epoch": 3.173076923076923,
"grad_norm": 0.8392526596294367,
"learning_rate": 2.6640592618882114e-05,
"loss": 0.2851,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12137892842292786,
"step": 1980,
"valid_targets_mean": 2289.5,
"valid_targets_min": 1066
},
{
"epoch": 3.1810897435897436,
"grad_norm": 0.6882637569568384,
"learning_rate": 2.656515524897795e-05,
"loss": 0.317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19221651554107666,
"step": 1985,
"valid_targets_mean": 3759.4,
"valid_targets_min": 1478
},
{
"epoch": 3.189102564102564,
"grad_norm": 0.9801416336913753,
"learning_rate": 2.6489613050883343e-05,
"loss": 0.3079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15233540534973145,
"step": 1990,
"valid_targets_mean": 1970.0,
"valid_targets_min": 1294
},
{
"epoch": 3.1971153846153846,
"grad_norm": 0.7453903933538132,
"learning_rate": 2.6413967230807677e-05,
"loss": 0.2709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16587764024734497,
"step": 1995,
"valid_targets_mean": 3308.9,
"valid_targets_min": 1813
},
{
"epoch": 3.2051282051282053,
"grad_norm": 0.7841224659830258,
"learning_rate": 2.6338218996614924e-05,
"loss": 0.3102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12263019382953644,
"step": 2000,
"valid_targets_mean": 2472.6,
"valid_targets_min": 925
},
{
"epoch": 3.2131410256410255,
"grad_norm": 0.9039563479812038,
"learning_rate": 2.6262369557804325e-05,
"loss": 0.3313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1826220154762268,
"step": 2005,
"valid_targets_mean": 2237.0,
"valid_targets_min": 999
},
{
"epoch": 3.2211538461538463,
"grad_norm": 0.8416860751127145,
"learning_rate": 2.6186420125491094e-05,
"loss": 0.3029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1301402747631073,
"step": 2010,
"valid_targets_mean": 2353.5,
"valid_targets_min": 925
},
{
"epoch": 3.2291666666666665,
"grad_norm": 0.8526043964264228,
"learning_rate": 2.6110371912387083e-05,
"loss": 0.3157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14723050594329834,
"step": 2015,
"valid_targets_mean": 1859.8,
"valid_targets_min": 880
},
{
"epoch": 3.2371794871794872,
"grad_norm": 0.7157138595622383,
"learning_rate": 2.6034226132781407e-05,
"loss": 0.2923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1483040452003479,
"step": 2020,
"valid_targets_mean": 3164.2,
"valid_targets_min": 1033
},
{
"epoch": 3.2451923076923075,
"grad_norm": 0.8354355862763577,
"learning_rate": 2.5957984002521066e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.151239812374115,
"step": 2025,
"valid_targets_mean": 1905.2,
"valid_targets_min": 816
},
{
"epoch": 3.253205128205128,
"grad_norm": 0.8549380234850392,
"learning_rate": 2.588164673899151e-05,
"loss": 0.3203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14034335315227509,
"step": 2030,
"valid_targets_mean": 1982.0,
"valid_targets_min": 1465
},
{
"epoch": 3.261217948717949,
"grad_norm": 0.6918270014906354,
"learning_rate": 2.580521556109724e-05,
"loss": 0.3121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1363942176103592,
"step": 2035,
"valid_targets_mean": 2749.0,
"valid_targets_min": 1295
},
{
"epoch": 3.269230769230769,
"grad_norm": 1.0174666576501485,
"learning_rate": 2.57286916892423e-05,
"loss": 0.3029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18560458719730377,
"step": 2040,
"valid_targets_mean": 1905.9,
"valid_targets_min": 1423
},
{
"epoch": 3.27724358974359,
"grad_norm": 0.9140763921901908,
"learning_rate": 2.5652076345310822e-05,
"loss": 0.3259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14916765689849854,
"step": 2045,
"valid_targets_mean": 1814.0,
"valid_targets_min": 1239
},
{
"epoch": 3.28525641025641,
"grad_norm": 0.6748799927803247,
"learning_rate": 2.5575370752647507e-05,
"loss": 0.2976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12936852872371674,
"step": 2050,
"valid_targets_mean": 2390.4,
"valid_targets_min": 1174
},
{
"epoch": 3.293269230769231,
"grad_norm": 0.7156103482993798,
"learning_rate": 2.5498576136038077e-05,
"loss": 0.32,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1080101728439331,
"step": 2055,
"valid_targets_mean": 1998.4,
"valid_targets_min": 1159
},
{
"epoch": 3.301282051282051,
"grad_norm": 0.703655239658459,
"learning_rate": 2.542169372168976e-05,
"loss": 0.3054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12107835710048676,
"step": 2060,
"valid_targets_mean": 2706.5,
"valid_targets_min": 653
},
{
"epoch": 3.309294871794872,
"grad_norm": 0.739225948183899,
"learning_rate": 2.5344724737211646e-05,
"loss": 0.3064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09956350922584534,
"step": 2065,
"valid_targets_mean": 1626.0,
"valid_targets_min": 1021
},
{
"epoch": 3.3173076923076925,
"grad_norm": 2.2757640724713064,
"learning_rate": 2.5267670411595152e-05,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1255197525024414,
"step": 2070,
"valid_targets_mean": 2971.5,
"valid_targets_min": 1132
},
{
"epoch": 3.3253205128205128,
"grad_norm": 0.7500910233878659,
"learning_rate": 2.5190531975194345e-05,
"loss": 0.3003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14343443512916565,
"step": 2075,
"valid_targets_mean": 3160.2,
"valid_targets_min": 1641
},
{
"epoch": 3.3333333333333335,
"grad_norm": 0.7428850119831736,
"learning_rate": 2.5113310659706322e-05,
"loss": 0.3057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1660858690738678,
"step": 2080,
"valid_targets_mean": 3558.9,
"valid_targets_min": 988
},
{
"epoch": 3.3413461538461537,
"grad_norm": 0.805327734018275,
"learning_rate": 2.5036007698151553e-05,
"loss": 0.2945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11538653075695038,
"step": 2085,
"valid_targets_mean": 2320.5,
"valid_targets_min": 990
},
{
"epoch": 3.3493589743589745,
"grad_norm": 0.8271835600858624,
"learning_rate": 2.4958624324854185e-05,
"loss": 0.3124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1344335377216339,
"step": 2090,
"valid_targets_mean": 1865.6,
"valid_targets_min": 958
},
{
"epoch": 3.3573717948717947,
"grad_norm": 0.7768125076129313,
"learning_rate": 2.4881161775422303e-05,
"loss": 0.288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16174614429473877,
"step": 2095,
"valid_targets_mean": 2769.1,
"valid_targets_min": 233
},
{
"epoch": 3.3653846153846154,
"grad_norm": 0.8892991278143192,
"learning_rate": 2.480362128672824e-05,
"loss": 0.3083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1573309600353241,
"step": 2100,
"valid_targets_mean": 2051.8,
"valid_targets_min": 878
},
{
"epoch": 3.373397435897436,
"grad_norm": 0.8378062536549976,
"learning_rate": 2.4726004096888817e-05,
"loss": 0.302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20106950402259827,
"step": 2105,
"valid_targets_mean": 3109.9,
"valid_targets_min": 1101
},
{
"epoch": 3.3814102564102564,
"grad_norm": 0.8230359694097013,
"learning_rate": 2.4648311445245558e-05,
"loss": 0.3226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2123335748910904,
"step": 2110,
"valid_targets_mean": 2667.5,
"valid_targets_min": 1020
},
{
"epoch": 3.389423076923077,
"grad_norm": 0.9290568558607065,
"learning_rate": 2.457054457234493e-05,
"loss": 0.3193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18395236134529114,
"step": 2115,
"valid_targets_mean": 2331.6,
"valid_targets_min": 281
},
{
"epoch": 3.3974358974358974,
"grad_norm": 0.7670991635073626,
"learning_rate": 2.4492704719918497e-05,
"loss": 0.3027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15496304631233215,
"step": 2120,
"valid_targets_mean": 2392.4,
"valid_targets_min": 888
},
{
"epoch": 3.405448717948718,
"grad_norm": 0.782240421451244,
"learning_rate": 2.4414793130863134e-05,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18173784017562866,
"step": 2125,
"valid_targets_mean": 3618.1,
"valid_targets_min": 708
},
{
"epoch": 3.4134615384615383,
"grad_norm": 0.7322971407666778,
"learning_rate": 2.433681104922114e-05,
"loss": 0.3136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.117400161921978,
"step": 2130,
"valid_targets_mean": 2565.1,
"valid_targets_min": 1052
},
{
"epoch": 3.421474358974359,
"grad_norm": 0.6489435534494313,
"learning_rate": 2.4258759720160412e-05,
"loss": 0.3057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13403040170669556,
"step": 2135,
"valid_targets_mean": 3160.1,
"valid_targets_min": 1714
},
{
"epoch": 3.4294871794871793,
"grad_norm": 0.7779796344498587,
"learning_rate": 2.4180640389954534e-05,
"loss": 0.3,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15386280417442322,
"step": 2140,
"valid_targets_mean": 2593.6,
"valid_targets_min": 1072
},
{
"epoch": 3.4375,
"grad_norm": 0.8296585482152623,
"learning_rate": 2.4102454305962892e-05,
"loss": 0.3107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1341044306755066,
"step": 2145,
"valid_targets_mean": 1699.1,
"valid_targets_min": 361
},
{
"epoch": 3.4455128205128207,
"grad_norm": 0.7714401323308417,
"learning_rate": 2.402420271661076e-05,
"loss": 0.2962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14644163846969604,
"step": 2150,
"valid_targets_mean": 3023.0,
"valid_targets_min": 942
},
{
"epoch": 3.453525641025641,
"grad_norm": 0.7696698896813144,
"learning_rate": 2.3945886871369338e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16718119382858276,
"step": 2155,
"valid_targets_mean": 3139.9,
"valid_targets_min": 1343
},
{
"epoch": 3.4615384615384617,
"grad_norm": 0.8050270640705677,
"learning_rate": 2.3867508020735865e-05,
"loss": 0.3004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13597774505615234,
"step": 2160,
"valid_targets_mean": 2135.0,
"valid_targets_min": 1281
},
{
"epoch": 3.469551282051282,
"grad_norm": 0.880792188264717,
"learning_rate": 2.3789067416213568e-05,
"loss": 0.2981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.134599506855011,
"step": 2165,
"valid_targets_mean": 2303.0,
"valid_targets_min": 1009
},
{
"epoch": 3.4775641025641026,
"grad_norm": 0.7868422040472738,
"learning_rate": 2.3710566310291733e-05,
"loss": 0.3001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13010697066783905,
"step": 2170,
"valid_targets_mean": 2357.6,
"valid_targets_min": 896
},
{
"epoch": 3.485576923076923,
"grad_norm": 0.8317296109067873,
"learning_rate": 2.36320059564257e-05,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17702716588974,
"step": 2175,
"valid_targets_mean": 2804.6,
"valid_targets_min": 1479
},
{
"epoch": 3.4935897435897436,
"grad_norm": 0.7742404251072617,
"learning_rate": 2.3553387609016833e-05,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.146556094288826,
"step": 2180,
"valid_targets_mean": 2264.8,
"valid_targets_min": 1623
},
{
"epoch": 3.501602564102564,
"grad_norm": 0.8147300113930734,
"learning_rate": 2.347471252339252e-05,
"loss": 0.3077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1777869015932083,
"step": 2185,
"valid_targets_mean": 2804.1,
"valid_targets_min": 1277
},
{
"epoch": 3.5096153846153846,
"grad_norm": 0.848117651346152,
"learning_rate": 2.339598195578608e-05,
"loss": 0.3088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14068767428398132,
"step": 2190,
"valid_targets_mean": 1880.0,
"valid_targets_min": 895
},
{
"epoch": 3.5176282051282053,
"grad_norm": 0.7692448440855282,
"learning_rate": 2.3317197163316757e-05,
"loss": 0.3181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13899481296539307,
"step": 2195,
"valid_targets_mean": 2212.0,
"valid_targets_min": 853
},
{
"epoch": 3.5256410256410255,
"grad_norm": 0.8800744946825352,
"learning_rate": 2.3238359403969608e-05,
"loss": 0.3115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16469797492027283,
"step": 2200,
"valid_targets_mean": 2316.8,
"valid_targets_min": 443
},
{
"epoch": 3.5336538461538463,
"grad_norm": 0.9037287807197032,
"learning_rate": 2.315946993657543e-05,
"loss": 0.3168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15300291776657104,
"step": 2205,
"valid_targets_mean": 1937.8,
"valid_targets_min": 1433
},
{
"epoch": 3.5416666666666665,
"grad_norm": 0.7352963329157969,
"learning_rate": 2.3080530020790673e-05,
"loss": 0.3352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12197897583246231,
"step": 2210,
"valid_targets_mean": 2205.6,
"valid_targets_min": 577
},
{
"epoch": 3.5496794871794872,
"grad_norm": 0.7829030632859258,
"learning_rate": 2.300154091707731e-05,
"loss": 0.299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14087346196174622,
"step": 2215,
"valid_targets_mean": 2687.8,
"valid_targets_min": 1060
},
{
"epoch": 3.5576923076923075,
"grad_norm": 0.6539140626498782,
"learning_rate": 2.2922503886682706e-05,
"loss": 0.3002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12677669525146484,
"step": 2220,
"valid_targets_mean": 3135.9,
"valid_targets_min": 1455
},
{
"epoch": 3.565705128205128,
"grad_norm": 0.8014167728473969,
"learning_rate": 2.28434201916195e-05,
"loss": 0.3065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13969087600708008,
"step": 2225,
"valid_targets_mean": 2349.4,
"valid_targets_min": 1233
},
{
"epoch": 3.573717948717949,
"grad_norm": 0.6940618273966738,
"learning_rate": 2.2764291094645446e-05,
"loss": 0.3283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17305408418178558,
"step": 2230,
"valid_targets_mean": 2655.8,
"valid_targets_min": 1173
},
{
"epoch": 3.581730769230769,
"grad_norm": 0.8317185277984226,
"learning_rate": 2.2685117859243223e-05,
"loss": 0.312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1836153119802475,
"step": 2235,
"valid_targets_mean": 2955.6,
"valid_targets_min": 385
},
{
"epoch": 3.58974358974359,
"grad_norm": 0.9360794306661345,
"learning_rate": 2.2605901749600312e-05,
"loss": 0.2841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13323697447776794,
"step": 2240,
"valid_targets_mean": 1700.8,
"valid_targets_min": 1044
},
{
"epoch": 3.59775641025641,
"grad_norm": 0.9575442006291623,
"learning_rate": 2.2526644030588764e-05,
"loss": 0.3219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1550298035144806,
"step": 2245,
"valid_targets_mean": 1732.8,
"valid_targets_min": 830
},
{
"epoch": 3.605769230769231,
"grad_norm": 0.7439293011806408,
"learning_rate": 2.2447345967745036e-05,
"loss": 0.3063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18119588494300842,
"step": 2250,
"valid_targets_mean": 3019.4,
"valid_targets_min": 1185
},
{
"epoch": 3.613782051282051,
"grad_norm": 0.7521495969910179,
"learning_rate": 2.2368008827249756e-05,
"loss": 0.3091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16421186923980713,
"step": 2255,
"valid_targets_mean": 2975.4,
"valid_targets_min": 1097
},
{
"epoch": 3.621794871794872,
"grad_norm": 0.8618091844527409,
"learning_rate": 2.228863387590752e-05,
"loss": 0.3061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13043256103992462,
"step": 2260,
"valid_targets_mean": 1935.0,
"valid_targets_min": 1235
},
{
"epoch": 3.6298076923076925,
"grad_norm": 0.9418809259129349,
"learning_rate": 2.2209222381126687e-05,
"loss": 0.312,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18692129850387573,
"step": 2265,
"valid_targets_mean": 3238.5,
"valid_targets_min": 1272
},
{
"epoch": 3.6378205128205128,
"grad_norm": 1.2669863904356735,
"learning_rate": 2.212977561089908e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11323244869709015,
"step": 2270,
"valid_targets_mean": 1818.8,
"valid_targets_min": 947
},
{
"epoch": 3.6458333333333335,
"grad_norm": 0.7178438925925271,
"learning_rate": 2.20502948337798e-05,
"loss": 0.3093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14442986249923706,
"step": 2275,
"valid_targets_mean": 2371.1,
"valid_targets_min": 1153
},
{
"epoch": 3.6538461538461537,
"grad_norm": 0.8569782259230551,
"learning_rate": 2.1970781318866953e-05,
"loss": 0.3256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19485518336296082,
"step": 2280,
"valid_targets_mean": 2588.1,
"valid_targets_min": 1005
},
{
"epoch": 3.6618589743589745,
"grad_norm": 2.112497526405271,
"learning_rate": 2.1891236335781363e-05,
"loss": 0.3152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12906664609909058,
"step": 2285,
"valid_targets_mean": 2045.6,
"valid_targets_min": 1078
},
{
"epoch": 3.6698717948717947,
"grad_norm": 1.2177253686979004,
"learning_rate": 2.1811661154646332e-05,
"loss": 0.3239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1536482274532318,
"step": 2290,
"valid_targets_mean": 1866.0,
"valid_targets_min": 1053
},
{
"epoch": 3.6778846153846154,
"grad_norm": 0.7181600618276615,
"learning_rate": 2.173205704606735e-05,
"loss": 0.3128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16137897968292236,
"step": 2295,
"valid_targets_mean": 3668.9,
"valid_targets_min": 1970
},
{
"epoch": 3.685897435897436,
"grad_norm": 0.7682172069784419,
"learning_rate": 2.1652425281111785e-05,
"loss": 0.2944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11456585675477982,
"step": 2300,
"valid_targets_mean": 2416.9,
"valid_targets_min": 1804
},
{
"epoch": 3.6939102564102564,
"grad_norm": 0.894927579310415,
"learning_rate": 2.1572767131288607e-05,
"loss": 0.2982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12253161519765854,
"step": 2305,
"valid_targets_mean": 2175.1,
"valid_targets_min": 1301
},
{
"epoch": 3.7019230769230766,
"grad_norm": 0.9030443572331698,
"learning_rate": 2.1493083868528095e-05,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16637665033340454,
"step": 2310,
"valid_targets_mean": 1787.1,
"valid_targets_min": 909
},
{
"epoch": 3.7099358974358974,
"grad_norm": 0.8709845006870474,
"learning_rate": 2.141337676516151e-05,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14325791597366333,
"step": 2315,
"valid_targets_mean": 2471.1,
"valid_targets_min": 1252
},
{
"epoch": 3.717948717948718,
"grad_norm": 0.7117739613765913,
"learning_rate": 2.1333647093900772e-05,
"loss": 0.3006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1770605444908142,
"step": 2320,
"valid_targets_mean": 3549.5,
"valid_targets_min": 958
},
{
"epoch": 3.7259615384615383,
"grad_norm": 0.7878345355183604,
"learning_rate": 2.1253896127818175e-05,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0999627634882927,
"step": 2325,
"valid_targets_mean": 1936.6,
"valid_targets_min": 1035
},
{
"epoch": 3.733974358974359,
"grad_norm": 0.886615512563476,
"learning_rate": 2.1174125140326013e-05,
"loss": 0.2965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15225833654403687,
"step": 2330,
"valid_targets_mean": 2917.9,
"valid_targets_min": 902
},
{
"epoch": 3.7419871794871797,
"grad_norm": 0.7335716261401273,
"learning_rate": 2.1094335405156277e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13625505566596985,
"step": 2335,
"valid_targets_mean": 2365.8,
"valid_targets_min": 1204
},
{
"epoch": 3.75,
"grad_norm": 0.8029433347399508,
"learning_rate": 2.1014528196340316e-05,
"loss": 0.3038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17654207348823547,
"step": 2340,
"valid_targets_mean": 3089.9,
"valid_targets_min": 1638
},
{
"epoch": 3.7580128205128203,
"grad_norm": 0.813979444044512,
"learning_rate": 2.093470478818847e-05,
"loss": 0.3084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17776831984519958,
"step": 2345,
"valid_targets_mean": 2865.4,
"valid_targets_min": 1878
},
{
"epoch": 3.766025641025641,
"grad_norm": 1.0704643578025568,
"learning_rate": 2.0854866455269756e-05,
"loss": 0.2992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11565354466438293,
"step": 2350,
"valid_targets_mean": 2172.4,
"valid_targets_min": 824
},
{
"epoch": 3.7740384615384617,
"grad_norm": 0.767664259998352,
"learning_rate": 2.0775014472391496e-05,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13974158465862274,
"step": 2355,
"valid_targets_mean": 2264.8,
"valid_targets_min": 383
},
{
"epoch": 3.782051282051282,
"grad_norm": 0.8116983946381069,
"learning_rate": 2.0695150114578958e-05,
"loss": 0.3101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17401279509067535,
"step": 2360,
"valid_targets_mean": 2502.2,
"valid_targets_min": 997
},
{
"epoch": 3.7900641025641026,
"grad_norm": 0.838756392734306,
"learning_rate": 2.061527465705502e-05,
"loss": 0.3042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1414027363061905,
"step": 2365,
"valid_targets_mean": 1893.6,
"valid_targets_min": 1012
},
{
"epoch": 3.7980769230769234,
"grad_norm": 0.8116104628684938,
"learning_rate": 2.0535389375219773e-05,
"loss": 0.2978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1255178451538086,
"step": 2370,
"valid_targets_mean": 1870.0,
"valid_targets_min": 1031
},
{
"epoch": 3.8060897435897436,
"grad_norm": 0.8119638624612898,
"learning_rate": 2.045549554463019e-05,
"loss": 0.3111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1506079137325287,
"step": 2375,
"valid_targets_mean": 2428.9,
"valid_targets_min": 868
},
{
"epoch": 3.814102564102564,
"grad_norm": 0.9284702930461602,
"learning_rate": 2.0375594440979744e-05,
"loss": 0.303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18719634413719177,
"step": 2380,
"valid_targets_mean": 2382.8,
"valid_targets_min": 1713
},
{
"epoch": 3.8221153846153846,
"grad_norm": 0.6769878780139562,
"learning_rate": 2.0295687340078037e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14017589390277863,
"step": 2385,
"valid_targets_mean": 2623.1,
"valid_targets_min": 1183
},
{
"epoch": 3.8301282051282053,
"grad_norm": 0.7732324489152704,
"learning_rate": 2.0215775517830437e-05,
"loss": 0.3015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14514802396297455,
"step": 2390,
"valid_targets_mean": 2283.8,
"valid_targets_min": 1304
},
{
"epoch": 3.8381410256410255,
"grad_norm": 0.7064375534961691,
"learning_rate": 2.013586025021769e-05,
"loss": 0.3033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11343707889318466,
"step": 2395,
"valid_targets_mean": 2805.6,
"valid_targets_min": 1879
},
{
"epoch": 3.8461538461538463,
"grad_norm": 0.8985980622999645,
"learning_rate": 2.0055942813275564e-05,
"loss": 0.3196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16325703263282776,
"step": 2400,
"valid_targets_mean": 2028.1,
"valid_targets_min": 975
},
{
"epoch": 3.8541666666666665,
"grad_norm": 0.794562051071232,
"learning_rate": 1.9976024483074456e-05,
"loss": 0.31,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.168821781873703,
"step": 2405,
"valid_targets_mean": 3017.8,
"valid_targets_min": 1367
},
{
"epoch": 3.8621794871794872,
"grad_norm": 0.7169752500616591,
"learning_rate": 1.9896106535699025e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15249863266944885,
"step": 2410,
"valid_targets_mean": 3116.9,
"valid_targets_min": 1162
},
{
"epoch": 3.8701923076923075,
"grad_norm": 1.2976110140884907,
"learning_rate": 1.9816190247227834e-05,
"loss": 0.3032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1410829871892929,
"step": 2415,
"valid_targets_mean": 3285.1,
"valid_targets_min": 1013
},
{
"epoch": 3.878205128205128,
"grad_norm": 0.7918220393027592,
"learning_rate": 1.9736276893712954e-05,
"loss": 0.2845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17646968364715576,
"step": 2420,
"valid_targets_mean": 2813.5,
"valid_targets_min": 1461
},
{
"epoch": 3.886217948717949,
"grad_norm": 0.9353419692330223,
"learning_rate": 1.9656367751159565e-05,
"loss": 0.3385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12920579314231873,
"step": 2425,
"valid_targets_mean": 1474.0,
"valid_targets_min": 314
},
{
"epoch": 3.894230769230769,
"grad_norm": 0.8471014654076914,
"learning_rate": 1.957646409550565e-05,
"loss": 0.3067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16839198768138885,
"step": 2430,
"valid_targets_mean": 2648.2,
"valid_targets_min": 1082
},
{
"epoch": 3.90224358974359,
"grad_norm": 0.805711000015817,
"learning_rate": 1.9496567202601545e-05,
"loss": 0.3216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1253741979598999,
"step": 2435,
"valid_targets_mean": 1789.8,
"valid_targets_min": 1029
},
{
"epoch": 3.91025641025641,
"grad_norm": 0.7373986082126022,
"learning_rate": 1.9416678348189627e-05,
"loss": 0.2949,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10667409002780914,
"step": 2440,
"valid_targets_mean": 2386.0,
"valid_targets_min": 928
},
{
"epoch": 3.918269230769231,
"grad_norm": 0.7887849161507996,
"learning_rate": 1.9336798807883907e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14934706687927246,
"step": 2445,
"valid_targets_mean": 2199.2,
"valid_targets_min": 315
},
{
"epoch": 3.926282051282051,
"grad_norm": 0.7530765328540372,
"learning_rate": 1.9256929857149686e-05,
"loss": 0.3012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12907078862190247,
"step": 2450,
"valid_targets_mean": 2505.1,
"valid_targets_min": 1049
},
{
"epoch": 3.934294871794872,
"grad_norm": 0.7605153269941574,
"learning_rate": 1.9177072771283167e-05,
"loss": 0.3209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18549108505249023,
"step": 2455,
"valid_targets_mean": 3427.1,
"valid_targets_min": 931
},
{
"epoch": 3.9423076923076925,
"grad_norm": 0.7187662676386029,
"learning_rate": 1.9097228825391087e-05,
"loss": 0.3087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18586839735507965,
"step": 2460,
"valid_targets_mean": 3050.5,
"valid_targets_min": 1382
},
{
"epoch": 3.9503205128205128,
"grad_norm": 0.801030836461524,
"learning_rate": 1.9017399294370413e-05,
"loss": 0.3008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1393556445837021,
"step": 2465,
"valid_targets_mean": 2522.4,
"valid_targets_min": 1126
},
{
"epoch": 3.9583333333333335,
"grad_norm": 0.7125978880537887,
"learning_rate": 1.893758545288791e-05,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12806084752082825,
"step": 2470,
"valid_targets_mean": 2649.1,
"valid_targets_min": 956
},
{
"epoch": 3.9663461538461537,
"grad_norm": 0.733573562499821,
"learning_rate": 1.8857788575359847e-05,
"loss": 0.3127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16902223229408264,
"step": 2475,
"valid_targets_mean": 2976.0,
"valid_targets_min": 1443
},
{
"epoch": 3.9743589743589745,
"grad_norm": 0.8286725638748283,
"learning_rate": 1.87780099359316e-05,
"loss": 0.3069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15555858612060547,
"step": 2480,
"valid_targets_mean": 2136.1,
"valid_targets_min": 325
},
{
"epoch": 3.9823717948717947,
"grad_norm": 0.8013127483982946,
"learning_rate": 1.869825080845734e-05,
"loss": 0.3007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11979212611913681,
"step": 2485,
"valid_targets_mean": 1891.2,
"valid_targets_min": 1063
},
{
"epoch": 3.9903846153846154,
"grad_norm": 1.1755524488770757,
"learning_rate": 1.8618512466479686e-05,
"loss": 0.3176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11900055408477783,
"step": 2490,
"valid_targets_mean": 1870.2,
"valid_targets_min": 879
},
{
"epoch": 3.998397435897436,
"grad_norm": 0.7228754958110429,
"learning_rate": 1.8538796183209373e-05,
"loss": 0.3068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18811742961406708,
"step": 2495,
"valid_targets_mean": 3598.2,
"valid_targets_min": 2064
},
{
"epoch": 4.006410256410256,
"grad_norm": 0.8107216208175523,
"learning_rate": 1.845910323150491e-05,
"loss": 0.2849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10420330613851547,
"step": 2500,
"valid_targets_mean": 1475.4,
"valid_targets_min": 693
},
{
"epoch": 4.014423076923077,
"grad_norm": 0.7289801458879988,
"learning_rate": 1.8379434883852255e-05,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1149950623512268,
"step": 2505,
"valid_targets_mean": 2478.2,
"valid_targets_min": 1065
},
{
"epoch": 4.022435897435898,
"grad_norm": 0.6172941964344577,
"learning_rate": 1.8299792412344524e-05,
"loss": 0.2635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09197504073381424,
"step": 2510,
"valid_targets_mean": 2993.5,
"valid_targets_min": 827
},
{
"epoch": 4.030448717948718,
"grad_norm": 0.924056863546892,
"learning_rate": 1.8220177088661635e-05,
"loss": 0.2846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11417260766029358,
"step": 2515,
"valid_targets_mean": 2422.9,
"valid_targets_min": 1248
},
{
"epoch": 4.038461538461538,
"grad_norm": 0.7599373898282045,
"learning_rate": 1.814059018405004e-05,
"loss": 0.267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1344180405139923,
"step": 2520,
"valid_targets_mean": 2648.2,
"valid_targets_min": 1827
},
{
"epoch": 4.046474358974359,
"grad_norm": 0.847954527866217,
"learning_rate": 1.806103296930243e-05,
"loss": 0.2749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16294752061367035,
"step": 2525,
"valid_targets_mean": 2578.5,
"valid_targets_min": 1032
},
{
"epoch": 4.05448717948718,
"grad_norm": 0.7840662540311333,
"learning_rate": 1.7981506714737392e-05,
"loss": 0.2809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1518925577402115,
"step": 2530,
"valid_targets_mean": 2867.4,
"valid_targets_min": 972
},
{
"epoch": 4.0625,
"grad_norm": 1.0308185743550442,
"learning_rate": 1.7902012690179188e-05,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14089523255825043,
"step": 2535,
"valid_targets_mean": 1825.4,
"valid_targets_min": 972
},
{
"epoch": 4.07051282051282,
"grad_norm": 1.0080791319366573,
"learning_rate": 1.7822552164937437e-05,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15818694233894348,
"step": 2540,
"valid_targets_mean": 2121.5,
"valid_targets_min": 1100
},
{
"epoch": 4.078525641025641,
"grad_norm": 0.7700047605910827,
"learning_rate": 1.7743126407786873e-05,
"loss": 0.2431,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11398568749427795,
"step": 2545,
"valid_targets_mean": 2395.9,
"valid_targets_min": 877
},
{
"epoch": 4.086538461538462,
"grad_norm": 0.8996747224204145,
"learning_rate": 1.766373668694707e-05,
"loss": 0.2679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19166290760040283,
"step": 2550,
"valid_targets_mean": 2388.6,
"valid_targets_min": 358
},
{
"epoch": 4.094551282051282,
"grad_norm": 0.6926397629736457,
"learning_rate": 1.7584384270062195e-05,
"loss": 0.2503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14995482563972473,
"step": 2555,
"valid_targets_mean": 3620.6,
"valid_targets_min": 995
},
{
"epoch": 4.102564102564102,
"grad_norm": 0.9135167791555272,
"learning_rate": 1.7505070424180772e-05,
"loss": 0.2773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13266316056251526,
"step": 2560,
"valid_targets_mean": 1995.1,
"valid_targets_min": 399
},
{
"epoch": 4.110576923076923,
"grad_norm": 0.6987226388783631,
"learning_rate": 1.7425796415735454e-05,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14873361587524414,
"step": 2565,
"valid_targets_mean": 4161.2,
"valid_targets_min": 1467
},
{
"epoch": 4.118589743589744,
"grad_norm": 0.9300152796838081,
"learning_rate": 1.7346563510522783e-05,
"loss": 0.2666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14323440194129944,
"step": 2570,
"valid_targets_mean": 2504.5,
"valid_targets_min": 956
},
{
"epoch": 4.126602564102564,
"grad_norm": 0.9032919810067497,
"learning_rate": 1.7267372973682998e-05,
"loss": 0.2556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14378081262111664,
"step": 2575,
"valid_targets_mean": 1905.8,
"valid_targets_min": 1172
},
{
"epoch": 4.134615384615385,
"grad_norm": 0.738179906420384,
"learning_rate": 1.7188226069679834e-05,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16808360815048218,
"step": 2580,
"valid_targets_mean": 3544.9,
"valid_targets_min": 1459
},
{
"epoch": 4.142628205128205,
"grad_norm": 0.8642444098290127,
"learning_rate": 1.7109124062280307e-05,
"loss": 0.2668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13248826563358307,
"step": 2585,
"valid_targets_mean": 2062.6,
"valid_targets_min": 807
},
{
"epoch": 4.1506410256410255,
"grad_norm": 0.8868230221130139,
"learning_rate": 1.7030068214534567e-05,
"loss": 0.273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12323059141635895,
"step": 2590,
"valid_targets_mean": 2625.6,
"valid_targets_min": 1143
},
{
"epoch": 4.158653846153846,
"grad_norm": 0.8464117069340547,
"learning_rate": 1.695105978875572e-05,
"loss": 0.2783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1996307373046875,
"step": 2595,
"valid_targets_mean": 3468.2,
"valid_targets_min": 1515
},
{
"epoch": 4.166666666666667,
"grad_norm": 0.8256615333687891,
"learning_rate": 1.687210004649965e-05,
"loss": 0.272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13181278109550476,
"step": 2600,
"valid_targets_mean": 3212.9,
"valid_targets_min": 1089
},
{
"epoch": 4.174679487179487,
"grad_norm": 0.8870269434095935,
"learning_rate": 1.679319024854491e-05,
"loss": 0.2826,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1275901198387146,
"step": 2605,
"valid_targets_mean": 1700.0,
"valid_targets_min": 840
},
{
"epoch": 4.1826923076923075,
"grad_norm": 0.7677929822500646,
"learning_rate": 1.6714331654872564e-05,
"loss": 0.2655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13212555646896362,
"step": 2610,
"valid_targets_mean": 3407.5,
"valid_targets_min": 1222
},
{
"epoch": 4.190705128205128,
"grad_norm": 0.903137572181981,
"learning_rate": 1.663552552464609e-05,
"loss": 0.2715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18511812388896942,
"step": 2615,
"valid_targets_mean": 2890.0,
"valid_targets_min": 430
},
{
"epoch": 4.198717948717949,
"grad_norm": 0.8198954378497408,
"learning_rate": 1.6556773116191257e-05,
"loss": 0.2644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11871003359556198,
"step": 2620,
"valid_targets_mean": 2507.9,
"valid_targets_min": 1272
},
{
"epoch": 4.206730769230769,
"grad_norm": 0.8935891481944647,
"learning_rate": 1.647807568697603e-05,
"loss": 0.2895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1254265010356903,
"step": 2625,
"valid_targets_mean": 2132.4,
"valid_targets_min": 1236
},
{
"epoch": 4.214743589743589,
"grad_norm": 0.806136169949257,
"learning_rate": 1.6399434493590524e-05,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1111583337187767,
"step": 2630,
"valid_targets_mean": 2298.0,
"valid_targets_min": 455
},
{
"epoch": 4.222756410256411,
"grad_norm": 0.8129392813125258,
"learning_rate": 1.6320850791726884e-05,
"loss": 0.2888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11087336391210556,
"step": 2635,
"valid_targets_mean": 2346.0,
"valid_targets_min": 1047
},
{
"epoch": 4.230769230769231,
"grad_norm": 0.7954597693417139,
"learning_rate": 1.6242325836159304e-05,
"loss": 0.2696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12124334275722504,
"step": 2640,
"valid_targets_mean": 2325.2,
"valid_targets_min": 1332
},
{
"epoch": 4.238782051282051,
"grad_norm": 0.7994370389318457,
"learning_rate": 1.6163860880723923e-05,
"loss": 0.2633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11619360744953156,
"step": 2645,
"valid_targets_mean": 2158.5,
"valid_targets_min": 993
},
{
"epoch": 4.246794871794872,
"grad_norm": 1.3081684100190851,
"learning_rate": 1.6085457178298866e-05,
"loss": 0.273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15662749111652374,
"step": 2650,
"valid_targets_mean": 2542.2,
"valid_targets_min": 1074
},
{
"epoch": 4.2548076923076925,
"grad_norm": 0.9133168019792289,
"learning_rate": 1.6007115980784182e-05,
"loss": 0.2696,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14592257142066956,
"step": 2655,
"valid_targets_mean": 2387.5,
"valid_targets_min": 896
},
{
"epoch": 4.262820512820513,
"grad_norm": 0.853360669593718,
"learning_rate": 1.592883853908188e-05,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12176774442195892,
"step": 2660,
"valid_targets_mean": 2206.1,
"valid_targets_min": 328
},
{
"epoch": 4.270833333333333,
"grad_norm": 0.7599368635884864,
"learning_rate": 1.585062610307599e-05,
"loss": 0.2694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1838086098432541,
"step": 2665,
"valid_targets_mean": 3465.8,
"valid_targets_min": 1081
},
{
"epoch": 4.278846153846154,
"grad_norm": 0.8525433719634645,
"learning_rate": 1.5772479921612543e-05,
"loss": 0.2756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14185798168182373,
"step": 2670,
"valid_targets_mean": 2654.0,
"valid_targets_min": 1737
},
{
"epoch": 4.2868589743589745,
"grad_norm": 0.7462684034862797,
"learning_rate": 1.5694401242479677e-05,
"loss": 0.2653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14972269535064697,
"step": 2675,
"valid_targets_mean": 3185.0,
"valid_targets_min": 1101
},
{
"epoch": 4.294871794871795,
"grad_norm": 1.0578925215532613,
"learning_rate": 1.5616391312387683e-05,
"loss": 0.2805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13549691438674927,
"step": 2680,
"valid_targets_mean": 2258.2,
"valid_targets_min": 1204
},
{
"epoch": 4.302884615384615,
"grad_norm": 0.8648608606389229,
"learning_rate": 1.5538451376949106e-05,
"loss": 0.2864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1298896223306656,
"step": 2685,
"valid_targets_mean": 2905.2,
"valid_targets_min": 1248
},
{
"epoch": 4.310897435897436,
"grad_norm": 0.8938045422851925,
"learning_rate": 1.5460582680658888e-05,
"loss": 0.287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16241608560085297,
"step": 2690,
"valid_targets_mean": 1907.6,
"valid_targets_min": 1285
},
{
"epoch": 4.318910256410256,
"grad_norm": 0.8098362846204934,
"learning_rate": 1.5382786466874446e-05,
"loss": 0.2712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11088044941425323,
"step": 2695,
"valid_targets_mean": 2425.4,
"valid_targets_min": 1100
},
{
"epoch": 4.326923076923077,
"grad_norm": 0.7618680406015733,
"learning_rate": 1.5305063977795856e-05,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10798428952693939,
"step": 2700,
"valid_targets_mean": 2501.0,
"valid_targets_min": 1152
},
{
"epoch": 4.334935897435898,
"grad_norm": 0.8771021903966155,
"learning_rate": 1.5227416454445995e-05,
"loss": 0.2763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12293270230293274,
"step": 2705,
"valid_targets_mean": 1854.9,
"valid_targets_min": 955
},
{
"epoch": 4.342948717948718,
"grad_norm": 0.8902232258682791,
"learning_rate": 1.5149845136650748e-05,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17401179671287537,
"step": 2710,
"valid_targets_mean": 2398.9,
"valid_targets_min": 1217
},
{
"epoch": 4.350961538461538,
"grad_norm": 0.7400416574631132,
"learning_rate": 1.5072351263019177e-05,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13317830860614777,
"step": 2715,
"valid_targets_mean": 2971.4,
"valid_targets_min": 367
},
{
"epoch": 4.358974358974359,
"grad_norm": 0.8323847921657985,
"learning_rate": 1.4994936070923784e-05,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11686371266841888,
"step": 2720,
"valid_targets_mean": 2373.9,
"valid_targets_min": 1433
},
{
"epoch": 4.36698717948718,
"grad_norm": 0.8564853210865073,
"learning_rate": 1.4917600796480745e-05,
"loss": 0.2657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.154568150639534,
"step": 2725,
"valid_targets_mean": 3047.5,
"valid_targets_min": 1192
},
{
"epoch": 4.375,
"grad_norm": 4.516311351290841,
"learning_rate": 1.4840346674530122e-05,
"loss": 0.2779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10477745532989502,
"step": 2730,
"valid_targets_mean": 1647.8,
"valid_targets_min": 577
},
{
"epoch": 4.38301282051282,
"grad_norm": 0.8773956755455364,
"learning_rate": 1.4763174938616232e-05,
"loss": 0.2868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12866738438606262,
"step": 2735,
"valid_targets_mean": 1814.0,
"valid_targets_min": 1064
},
{
"epoch": 4.391025641025641,
"grad_norm": 0.862173024576601,
"learning_rate": 1.4686086820967865e-05,
"loss": 0.2803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10677969455718994,
"step": 2740,
"valid_targets_mean": 2018.1,
"valid_targets_min": 1167
},
{
"epoch": 4.399038461538462,
"grad_norm": 0.7936422088513276,
"learning_rate": 1.460908355247868e-05,
"loss": 0.268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0854073315858841,
"step": 2745,
"valid_targets_mean": 1962.6,
"valid_targets_min": 344
},
{
"epoch": 4.407051282051282,
"grad_norm": 0.7666993392738055,
"learning_rate": 1.4532166362687507e-05,
"loss": 0.2848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09944554418325424,
"step": 2750,
"valid_targets_mean": 2318.1,
"valid_targets_min": 886
},
{
"epoch": 4.415064102564102,
"grad_norm": 0.8829285662230825,
"learning_rate": 1.445533647975871e-05,
"loss": 0.2702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1385907530784607,
"step": 2755,
"valid_targets_mean": 2788.9,
"valid_targets_min": 949
},
{
"epoch": 4.423076923076923,
"grad_norm": 0.9272776009807071,
"learning_rate": 1.437859513046263e-05,
"loss": 0.2863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12871670722961426,
"step": 2760,
"valid_targets_mean": 1785.0,
"valid_targets_min": 1228
},
{
"epoch": 4.431089743589744,
"grad_norm": 0.8347503928560401,
"learning_rate": 1.4301943540155914e-05,
"loss": 0.2887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12505707144737244,
"step": 2765,
"valid_targets_mean": 2583.8,
"valid_targets_min": 1438
},
{
"epoch": 4.439102564102564,
"grad_norm": 0.9069365982168227,
"learning_rate": 1.4225382932762033e-05,
"loss": 0.2655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16004319489002228,
"step": 2770,
"valid_targets_mean": 2442.6,
"valid_targets_min": 906
},
{
"epoch": 4.447115384615385,
"grad_norm": 1.0573384285454255,
"learning_rate": 1.4148914530751681e-05,
"loss": 0.2858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17709983885288239,
"step": 2775,
"valid_targets_mean": 1901.5,
"valid_targets_min": 880
},
{
"epoch": 4.455128205128205,
"grad_norm": 0.9369049788177093,
"learning_rate": 1.4072539555123292e-05,
"loss": 0.2803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1579183042049408,
"step": 2780,
"valid_targets_mean": 2392.0,
"valid_targets_min": 839
},
{
"epoch": 4.4631410256410255,
"grad_norm": 0.8913049677040563,
"learning_rate": 1.3996259225383514e-05,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1293807029724121,
"step": 2785,
"valid_targets_mean": 2368.1,
"valid_targets_min": 1251
},
{
"epoch": 4.471153846153846,
"grad_norm": 0.88256947286605,
"learning_rate": 1.3920074759527737e-05,
"loss": 0.29,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14929986000061035,
"step": 2790,
"valid_targets_mean": 2416.9,
"valid_targets_min": 1440
},
{
"epoch": 4.479166666666667,
"grad_norm": 0.8160206288790809,
"learning_rate": 1.3843987374020689e-05,
"loss": 0.3178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14964623749256134,
"step": 2795,
"valid_targets_mean": 2870.5,
"valid_targets_min": 721
},
{
"epoch": 4.487179487179487,
"grad_norm": 0.8428944555480611,
"learning_rate": 1.376799828377696e-05,
"loss": 0.2659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1721874475479126,
"step": 2800,
"valid_targets_mean": 2782.9,
"valid_targets_min": 1694
},
{
"epoch": 4.4951923076923075,
"grad_norm": 0.8871852280382094,
"learning_rate": 1.3692108702141642e-05,
"loss": 0.2688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12747956812381744,
"step": 2805,
"valid_targets_mean": 1721.0,
"valid_targets_min": 338
},
{
"epoch": 4.503205128205128,
"grad_norm": 0.9872908843916991,
"learning_rate": 1.361631984087091e-05,
"loss": 0.2752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15744715929031372,
"step": 2810,
"valid_targets_mean": 1939.6,
"valid_targets_min": 1134
},
{
"epoch": 4.511217948717949,
"grad_norm": 0.8580567465549157,
"learning_rate": 1.354063291011273e-05,
"loss": 0.2632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.130362868309021,
"step": 2815,
"valid_targets_mean": 2308.5,
"valid_targets_min": 1237
},
{
"epoch": 4.519230769230769,
"grad_norm": 0.7644493527586255,
"learning_rate": 1.3465049118387486e-05,
"loss": 0.2674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13236522674560547,
"step": 2820,
"valid_targets_mean": 2896.8,
"valid_targets_min": 1084
},
{
"epoch": 4.527243589743589,
"grad_norm": 0.9667014319508634,
"learning_rate": 1.3389569672568707e-05,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12788935005664825,
"step": 2825,
"valid_targets_mean": 2036.5,
"valid_targets_min": 324
},
{
"epoch": 4.535256410256411,
"grad_norm": 0.8421523844856508,
"learning_rate": 1.331419577786381e-05,
"loss": 0.2553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.109443299472332,
"step": 2830,
"valid_targets_mean": 1979.4,
"valid_targets_min": 1006
},
{
"epoch": 4.543269230769231,
"grad_norm": 0.744928564210247,
"learning_rate": 1.3238928637794816e-05,
"loss": 0.2639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11254187673330307,
"step": 2835,
"valid_targets_mean": 2626.8,
"valid_targets_min": 753
},
{
"epoch": 4.551282051282051,
"grad_norm": 0.975086466256904,
"learning_rate": 1.3163769454179183e-05,
"loss": 0.2768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1786927580833435,
"step": 2840,
"valid_targets_mean": 2314.1,
"valid_targets_min": 1070
},
{
"epoch": 4.559294871794872,
"grad_norm": 0.7209383245592558,
"learning_rate": 1.3088719427110552e-05,
"loss": 0.266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08105504512786865,
"step": 2845,
"valid_targets_mean": 2961.5,
"valid_targets_min": 1371
},
{
"epoch": 4.5673076923076925,
"grad_norm": 0.7810108736494066,
"learning_rate": 1.3013779754939666e-05,
"loss": 0.2735,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14913949370384216,
"step": 2850,
"valid_targets_mean": 2757.1,
"valid_targets_min": 1361
},
{
"epoch": 4.575320512820513,
"grad_norm": 0.8254385625250282,
"learning_rate": 1.2938951634255164e-05,
"loss": 0.2989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1645059883594513,
"step": 2855,
"valid_targets_mean": 3087.0,
"valid_targets_min": 1169
},
{
"epoch": 4.583333333333333,
"grad_norm": 0.7306018923704536,
"learning_rate": 1.2864236259864495e-05,
"loss": 0.2603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11817409098148346,
"step": 2860,
"valid_targets_mean": 2937.9,
"valid_targets_min": 371
},
{
"epoch": 4.591346153846154,
"grad_norm": 0.7477590617323558,
"learning_rate": 1.2789634824774887e-05,
"loss": 0.2722,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12819048762321472,
"step": 2865,
"valid_targets_mean": 2968.5,
"valid_targets_min": 1499
},
{
"epoch": 4.5993589743589745,
"grad_norm": 0.728894279788435,
"learning_rate": 1.2715148520174206e-05,
"loss": 0.2687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12905170023441315,
"step": 2870,
"valid_targets_mean": 3541.0,
"valid_targets_min": 1720
},
{
"epoch": 4.607371794871795,
"grad_norm": 0.744918036805367,
"learning_rate": 1.2640778535412036e-05,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10740716010332108,
"step": 2875,
"valid_targets_mean": 2260.5,
"valid_targets_min": 879
},
{
"epoch": 4.615384615384615,
"grad_norm": 0.8997924981650226,
"learning_rate": 1.2566526057980608e-05,
"loss": 0.2517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1263289749622345,
"step": 2880,
"valid_targets_mean": 2141.9,
"valid_targets_min": 979
},
{
"epoch": 4.623397435897436,
"grad_norm": 0.7732205590951574,
"learning_rate": 1.2492392273495879e-05,
"loss": 0.2626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1344079226255417,
"step": 2885,
"valid_targets_mean": 3042.1,
"valid_targets_min": 1931
},
{
"epoch": 4.631410256410256,
"grad_norm": 0.9244368747106443,
"learning_rate": 1.2418378365678612e-05,
"loss": 0.2776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18506968021392822,
"step": 2890,
"valid_targets_mean": 2340.2,
"valid_targets_min": 1257
},
{
"epoch": 4.639423076923077,
"grad_norm": 0.981906856635814,
"learning_rate": 1.234448551633542e-05,
"loss": 0.2707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11560280621051788,
"step": 2895,
"valid_targets_mean": 1585.2,
"valid_targets_min": 1039
},
{
"epoch": 4.647435897435898,
"grad_norm": 0.9031224981302811,
"learning_rate": 1.2270714905339969e-05,
"loss": 0.2716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11820649355649948,
"step": 2900,
"valid_targets_mean": 2263.9,
"valid_targets_min": 482
},
{
"epoch": 4.655448717948718,
"grad_norm": 0.8745154308021823,
"learning_rate": 1.2197067710614075e-05,
"loss": 0.2798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09645086526870728,
"step": 2905,
"valid_targets_mean": 1823.5,
"valid_targets_min": 945
},
{
"epoch": 4.663461538461538,
"grad_norm": 0.8245554409210525,
"learning_rate": 1.2123545108108943e-05,
"loss": 0.2887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12594664096832275,
"step": 2910,
"valid_targets_mean": 2744.8,
"valid_targets_min": 865
},
{
"epoch": 4.671474358974359,
"grad_norm": 0.829115549908771,
"learning_rate": 1.2050148271786348e-05,
"loss": 0.2912,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15721480548381805,
"step": 2915,
"valid_targets_mean": 3267.1,
"valid_targets_min": 1111
},
{
"epoch": 4.67948717948718,
"grad_norm": 0.846511250803801,
"learning_rate": 1.1976878373599928e-05,
"loss": 0.2866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14120858907699585,
"step": 2920,
"valid_targets_mean": 2450.1,
"valid_targets_min": 1375
},
{
"epoch": 4.6875,
"grad_norm": 0.7975341835970318,
"learning_rate": 1.1903736583476441e-05,
"loss": 0.2745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14211896061897278,
"step": 2925,
"valid_targets_mean": 2471.6,
"valid_targets_min": 1047
},
{
"epoch": 4.69551282051282,
"grad_norm": 0.9078900951131141,
"learning_rate": 1.1830724069297106e-05,
"loss": 0.2676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13938596844673157,
"step": 2930,
"valid_targets_mean": 2080.9,
"valid_targets_min": 1256
},
{
"epoch": 4.703525641025641,
"grad_norm": 0.8028681041530895,
"learning_rate": 1.1757841996878957e-05,
"loss": 0.287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11330582201480865,
"step": 2935,
"valid_targets_mean": 2032.8,
"valid_targets_min": 1029
},
{
"epoch": 4.711538461538462,
"grad_norm": 0.8363540894412191,
"learning_rate": 1.1685091529956187e-05,
"loss": 0.2676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15411382913589478,
"step": 2940,
"valid_targets_mean": 2787.2,
"valid_targets_min": 1093
},
{
"epoch": 4.719551282051282,
"grad_norm": 0.912460705122893,
"learning_rate": 1.161247383016163e-05,
"loss": 0.2818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16072651743888855,
"step": 2945,
"valid_targets_mean": 2128.5,
"valid_targets_min": 966
},
{
"epoch": 4.727564102564102,
"grad_norm": 0.7499400173047096,
"learning_rate": 1.1539990057008166e-05,
"loss": 0.285,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10620361566543579,
"step": 2950,
"valid_targets_mean": 2388.1,
"valid_targets_min": 1203
},
{
"epoch": 4.735576923076923,
"grad_norm": 0.9237353949311389,
"learning_rate": 1.1467641367870198e-05,
"loss": 0.2644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11121618747711182,
"step": 2955,
"valid_targets_mean": 1521.9,
"valid_targets_min": 937
},
{
"epoch": 4.743589743589744,
"grad_norm": 0.8205670496593648,
"learning_rate": 1.1395428917965239e-05,
"loss": 0.2633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14764776825904846,
"step": 2960,
"valid_targets_mean": 2725.4,
"valid_targets_min": 923
},
{
"epoch": 4.751602564102564,
"grad_norm": 0.9098777718387225,
"learning_rate": 1.1323353860335385e-05,
"loss": 0.2838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15366676449775696,
"step": 2965,
"valid_targets_mean": 2146.5,
"valid_targets_min": 1034
},
{
"epoch": 4.759615384615385,
"grad_norm": 0.8551265905437225,
"learning_rate": 1.1251417345828962e-05,
"loss": 0.2948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20508478581905365,
"step": 2970,
"valid_targets_mean": 3284.0,
"valid_targets_min": 1291
},
{
"epoch": 4.767628205128205,
"grad_norm": 0.8632459584174168,
"learning_rate": 1.1179620523082107e-05,
"loss": 0.278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15938019752502441,
"step": 2975,
"valid_targets_mean": 2744.9,
"valid_targets_min": 1368
},
{
"epoch": 4.7756410256410255,
"grad_norm": 0.8257591086160776,
"learning_rate": 1.110796453850047e-05,
"loss": 0.2649,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13130192458629608,
"step": 2980,
"valid_targets_mean": 2265.9,
"valid_targets_min": 1378
},
{
"epoch": 4.783653846153846,
"grad_norm": 0.8559905279176463,
"learning_rate": 1.1036450536240877e-05,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14812210202217102,
"step": 2985,
"valid_targets_mean": 2335.5,
"valid_targets_min": 403
},
{
"epoch": 4.791666666666667,
"grad_norm": 0.7527787079235052,
"learning_rate": 1.0965079658193068e-05,
"loss": 0.2754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13627628982067108,
"step": 2990,
"valid_targets_mean": 3166.6,
"valid_targets_min": 966
},
{
"epoch": 4.799679487179487,
"grad_norm": 0.9363191867774112,
"learning_rate": 1.0893853043961475e-05,
"loss": 0.2661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15567584335803986,
"step": 2995,
"valid_targets_mean": 2027.8,
"valid_targets_min": 872
},
{
"epoch": 4.8076923076923075,
"grad_norm": 0.8073681066642808,
"learning_rate": 1.0822771830847011e-05,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09198524802923203,
"step": 3000,
"valid_targets_mean": 1890.8,
"valid_targets_min": 218
},
{
"epoch": 4.815705128205128,
"grad_norm": 0.988773013105684,
"learning_rate": 1.0751837153828926e-05,
"loss": 0.2683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13376572728157043,
"step": 3005,
"valid_targets_mean": 1561.8,
"valid_targets_min": 1034
},
{
"epoch": 4.823717948717949,
"grad_norm": 0.9762413699290895,
"learning_rate": 1.0681050145546666e-05,
"loss": 0.2865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14275820553302765,
"step": 3010,
"valid_targets_mean": 2047.4,
"valid_targets_min": 1062
},
{
"epoch": 4.831730769230769,
"grad_norm": 0.9275506661578156,
"learning_rate": 1.0610411936281801e-05,
"loss": 0.281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15121185779571533,
"step": 3015,
"valid_targets_mean": 2387.4,
"valid_targets_min": 1138
},
{
"epoch": 4.839743589743589,
"grad_norm": 1.186762101396794,
"learning_rate": 1.0539923653939978e-05,
"loss": 0.2635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14785534143447876,
"step": 3020,
"valid_targets_mean": 2331.1,
"valid_targets_min": 260
},
{
"epoch": 4.847756410256411,
"grad_norm": 0.7972641980595226,
"learning_rate": 1.0469586424032903e-05,
"loss": 0.278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11366459727287292,
"step": 3025,
"valid_targets_mean": 2833.2,
"valid_targets_min": 1378
},
{
"epoch": 4.855769230769231,
"grad_norm": 0.787773519783044,
"learning_rate": 1.0399401369660369e-05,
"loss": 0.2588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12477640807628632,
"step": 3030,
"valid_targets_mean": 2976.5,
"valid_targets_min": 1412
},
{
"epoch": 4.863782051282051,
"grad_norm": 1.077467606380259,
"learning_rate": 1.0329369611492334e-05,
"loss": 0.2799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13085028529167175,
"step": 3035,
"valid_targets_mean": 1301.2,
"valid_targets_min": 903
},
{
"epoch": 4.871794871794872,
"grad_norm": 0.779085250047778,
"learning_rate": 1.0259492267751022e-05,
"loss": 0.2683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09794454276561737,
"step": 3040,
"valid_targets_mean": 2191.4,
"valid_targets_min": 872
},
{
"epoch": 4.8798076923076925,
"grad_norm": 0.772242896624771,
"learning_rate": 1.0189770454193052e-05,
"loss": 0.2655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09873206913471222,
"step": 3045,
"valid_targets_mean": 1930.6,
"valid_targets_min": 998
},
{
"epoch": 4.887820512820513,
"grad_norm": 0.9599867450295364,
"learning_rate": 1.0120205284091673e-05,
"loss": 0.2858,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11163206398487091,
"step": 3050,
"valid_targets_mean": 1916.6,
"valid_targets_min": 1115
},
{
"epoch": 4.895833333333333,
"grad_norm": 0.7918817935809193,
"learning_rate": 1.0050797868218907e-05,
"loss": 0.2591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1077142059803009,
"step": 3055,
"valid_targets_mean": 2029.9,
"valid_targets_min": 1202
},
{
"epoch": 4.903846153846154,
"grad_norm": 1.0640408645767745,
"learning_rate": 9.981549314827876e-06,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15119090676307678,
"step": 3060,
"valid_targets_mean": 2257.6,
"valid_targets_min": 1607
},
{
"epoch": 4.9118589743589745,
"grad_norm": 0.9302729531429398,
"learning_rate": 9.912460729635097e-06,
"loss": 0.2607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1315920054912567,
"step": 3065,
"valid_targets_mean": 2105.0,
"valid_targets_min": 1408
},
{
"epoch": 4.919871794871795,
"grad_norm": 0.9369289493805716,
"learning_rate": 9.843533215802796e-06,
"loss": 0.2706,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15253514051437378,
"step": 3070,
"valid_targets_mean": 2191.6,
"valid_targets_min": 1061
},
{
"epoch": 4.927884615384615,
"grad_norm": 0.844646606230592,
"learning_rate": 9.774767873921357e-06,
"loss": 0.2723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.137139230966568,
"step": 3075,
"valid_targets_mean": 2565.4,
"valid_targets_min": 974
},
{
"epoch": 4.935897435897436,
"grad_norm": 2.329062257750856,
"learning_rate": 9.706165801991651e-06,
"loss": 0.2711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13304753601551056,
"step": 3080,
"valid_targets_mean": 1838.1,
"valid_targets_min": 795
},
{
"epoch": 4.943910256410256,
"grad_norm": 0.853413187103336,
"learning_rate": 9.637728095407593e-06,
"loss": 0.2421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12307369709014893,
"step": 3085,
"valid_targets_mean": 2275.2,
"valid_targets_min": 991
},
{
"epoch": 4.951923076923077,
"grad_norm": 0.8149656643934992,
"learning_rate": 9.56945584693861e-06,
"loss": 0.2665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14071014523506165,
"step": 3090,
"valid_targets_mean": 2706.8,
"valid_targets_min": 1006
},
{
"epoch": 4.959935897435898,
"grad_norm": 0.8879281552541326,
"learning_rate": 9.501350146712193e-06,
"loss": 0.2833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16927888989448547,
"step": 3095,
"valid_targets_mean": 2713.2,
"valid_targets_min": 836
},
{
"epoch": 4.967948717948718,
"grad_norm": 0.8421674616911554,
"learning_rate": 9.433412082196527e-06,
"loss": 0.278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15744885802268982,
"step": 3100,
"valid_targets_mean": 2638.9,
"valid_targets_min": 966
},
{
"epoch": 4.975961538461538,
"grad_norm": 0.8600840077890818,
"learning_rate": 9.365642738183044e-06,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.104631707072258,
"step": 3105,
"valid_targets_mean": 1865.5,
"valid_targets_min": 447
},
{
"epoch": 4.983974358974359,
"grad_norm": 0.8348297609388227,
"learning_rate": 9.298043196769217e-06,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13417679071426392,
"step": 3110,
"valid_targets_mean": 2495.9,
"valid_targets_min": 1227
},
{
"epoch": 4.99198717948718,
"grad_norm": 9.580138479223857,
"learning_rate": 9.230614537341167e-06,
"loss": 0.2797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1282835602760315,
"step": 3115,
"valid_targets_mean": 2251.1,
"valid_targets_min": 1236
},
{
"epoch": 5.0,
"grad_norm": 0.8722530383797718,
"learning_rate": 9.163357836556498e-06,
"loss": 0.2589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1430858075618744,
"step": 3120,
"valid_targets_mean": 2250.0,
"valid_targets_min": 360
},
{
"epoch": 5.00801282051282,
"grad_norm": 0.760262997035743,
"learning_rate": 9.096274168327122e-06,
"loss": 0.2711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11211199313402176,
"step": 3125,
"valid_targets_mean": 2454.6,
"valid_targets_min": 1559
},
{
"epoch": 5.016025641025641,
"grad_norm": 0.8081201546727087,
"learning_rate": 9.029364603802017e-06,
"loss": 0.2593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12468785047531128,
"step": 3130,
"valid_targets_mean": 2825.5,
"valid_targets_min": 964
},
{
"epoch": 5.024038461538462,
"grad_norm": 0.9144227586011615,
"learning_rate": 8.962630211350248e-06,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11245831847190857,
"step": 3135,
"valid_targets_mean": 2072.0,
"valid_targets_min": 1201
},
{
"epoch": 5.032051282051282,
"grad_norm": 0.8415836808622785,
"learning_rate": 8.89607205654378e-06,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21187756955623627,
"step": 3140,
"valid_targets_mean": 3681.8,
"valid_targets_min": 1378
},
{
"epoch": 5.040064102564102,
"grad_norm": 1.0690915033438144,
"learning_rate": 8.829691202140591e-06,
"loss": 0.2566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0969729870557785,
"step": 3145,
"valid_targets_mean": 1514.1,
"valid_targets_min": 498
},
{
"epoch": 5.048076923076923,
"grad_norm": 0.888331771783694,
"learning_rate": 8.763488708067604e-06,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12027233839035034,
"step": 3150,
"valid_targets_mean": 2255.6,
"valid_targets_min": 955
},
{
"epoch": 5.056089743589744,
"grad_norm": 0.8115419127246998,
"learning_rate": 8.69746563140379e-06,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13751327991485596,
"step": 3155,
"valid_targets_mean": 3138.2,
"valid_targets_min": 925
},
{
"epoch": 5.064102564102564,
"grad_norm": 0.880802924767822,
"learning_rate": 8.631623026363331e-06,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09337887912988663,
"step": 3160,
"valid_targets_mean": 1815.4,
"valid_targets_min": 725
},
{
"epoch": 5.072115384615385,
"grad_norm": 0.8526126585543974,
"learning_rate": 8.56596194427873e-06,
"loss": 0.2534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10085926949977875,
"step": 3165,
"valid_targets_mean": 1936.5,
"valid_targets_min": 1147
},
{
"epoch": 5.080128205128205,
"grad_norm": 0.865864615519599,
"learning_rate": 8.500483433584054e-06,
"loss": 0.247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11514122039079666,
"step": 3170,
"valid_targets_mean": 2888.1,
"valid_targets_min": 1666
},
{
"epoch": 5.0881410256410255,
"grad_norm": 0.8633744921019645,
"learning_rate": 8.435188539798187e-06,
"loss": 0.2695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16413256525993347,
"step": 3175,
"valid_targets_mean": 3507.0,
"valid_targets_min": 1585
},
{
"epoch": 5.096153846153846,
"grad_norm": 0.7489172858590697,
"learning_rate": 8.370078305508136e-06,
"loss": 0.2302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1103079617023468,
"step": 3180,
"valid_targets_mean": 3308.8,
"valid_targets_min": 1774
},
{
"epoch": 5.104166666666667,
"grad_norm": 0.7761189735769272,
"learning_rate": 8.305153770352384e-06,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10959683358669281,
"step": 3185,
"valid_targets_mean": 3496.6,
"valid_targets_min": 958
},
{
"epoch": 5.112179487179487,
"grad_norm": 0.953121153374897,
"learning_rate": 8.240415971004285e-06,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14587818086147308,
"step": 3190,
"valid_targets_mean": 2079.8,
"valid_targets_min": 1043
},
{
"epoch": 5.1201923076923075,
"grad_norm": 0.8994783360343982,
"learning_rate": 8.175865941155525e-06,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11071066558361053,
"step": 3195,
"valid_targets_mean": 2350.0,
"valid_targets_min": 1123
},
{
"epoch": 5.128205128205128,
"grad_norm": 0.8639406630796981,
"learning_rate": 8.111504711499598e-06,
"loss": 0.2537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15387535095214844,
"step": 3200,
"valid_targets_mean": 3171.8,
"valid_targets_min": 1809
},
{
"epoch": 5.136217948717949,
"grad_norm": 0.8743544692197517,
"learning_rate": 8.04733330971536e-06,
"loss": 0.2608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12671324610710144,
"step": 3205,
"valid_targets_mean": 2485.6,
"valid_targets_min": 1268
},
{
"epoch": 5.144230769230769,
"grad_norm": 0.9582632299000284,
"learning_rate": 7.983352760450618e-06,
"loss": 0.2571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11250822991132736,
"step": 3210,
"valid_targets_mean": 1896.8,
"valid_targets_min": 554
},
{
"epoch": 5.152243589743589,
"grad_norm": 0.9124958970924283,
"learning_rate": 7.919564085305768e-06,
"loss": 0.2553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11880991607904434,
"step": 3215,
"valid_targets_mean": 2402.8,
"valid_targets_min": 1805
},
{
"epoch": 5.160256410256411,
"grad_norm": 0.809203448407432,
"learning_rate": 7.855968302817487e-06,
"loss": 0.2553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1249704360961914,
"step": 3220,
"valid_targets_mean": 2293.9,
"valid_targets_min": 314
},
{
"epoch": 5.168269230769231,
"grad_norm": 1.0224736881905714,
"learning_rate": 7.792566428442456e-06,
"loss": 0.2552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1433626413345337,
"step": 3225,
"valid_targets_mean": 2055.8,
"valid_targets_min": 818
},
{
"epoch": 5.176282051282051,
"grad_norm": 0.828565366523305,
"learning_rate": 7.729359474541168e-06,
"loss": 0.2411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12695926427841187,
"step": 3230,
"valid_targets_mean": 3304.5,
"valid_targets_min": 1022
},
{
"epoch": 5.184294871794872,
"grad_norm": 1.0703527171317921,
"learning_rate": 7.666348450361737e-06,
"loss": 0.2423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17552143335342407,
"step": 3235,
"valid_targets_mean": 2147.1,
"valid_targets_min": 922
},
{
"epoch": 5.1923076923076925,
"grad_norm": 0.8629077122279247,
"learning_rate": 7.60353436202381e-06,
"loss": 0.2335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12918856739997864,
"step": 3240,
"valid_targets_mean": 2890.6,
"valid_targets_min": 1021
},
{
"epoch": 5.200320512820513,
"grad_norm": 0.7496627630060603,
"learning_rate": 7.540918212502479e-06,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11419525742530823,
"step": 3245,
"valid_targets_mean": 3239.9,
"valid_targets_min": 903
},
{
"epoch": 5.208333333333333,
"grad_norm": 0.9516986948209849,
"learning_rate": 7.478501001612281e-06,
"loss": 0.2642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10599060356616974,
"step": 3250,
"valid_targets_mean": 2018.6,
"valid_targets_min": 1264
},
{
"epoch": 5.216346153846154,
"grad_norm": 0.8786538617105409,
"learning_rate": 7.416283725991229e-06,
"loss": 0.2442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13649001717567444,
"step": 3255,
"valid_targets_mean": 2654.9,
"valid_targets_min": 974
},
{
"epoch": 5.2243589743589745,
"grad_norm": 0.7547164045773196,
"learning_rate": 7.354267379084896e-06,
"loss": 0.2375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11847176402807236,
"step": 3260,
"valid_targets_mean": 3161.9,
"valid_targets_min": 1418
},
{
"epoch": 5.232371794871795,
"grad_norm": 0.8827711281808431,
"learning_rate": 7.292452951130548e-06,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11796671152114868,
"step": 3265,
"valid_targets_mean": 2813.1,
"valid_targets_min": 849
},
{
"epoch": 5.240384615384615,
"grad_norm": 0.991683934378518,
"learning_rate": 7.230841429141347e-06,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11138557642698288,
"step": 3270,
"valid_targets_mean": 1707.8,
"valid_targets_min": 779
},
{
"epoch": 5.248397435897436,
"grad_norm": 0.8413292996210097,
"learning_rate": 7.169433796890595e-06,
"loss": 0.2585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11664022505283356,
"step": 3275,
"valid_targets_mean": 2805.9,
"valid_targets_min": 1887
},
{
"epoch": 5.256410256410256,
"grad_norm": 0.8481142716287121,
"learning_rate": 7.108231034895976e-06,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12616068124771118,
"step": 3280,
"valid_targets_mean": 2882.4,
"valid_targets_min": 1045
},
{
"epoch": 5.264423076923077,
"grad_norm": 0.7422363717208107,
"learning_rate": 7.047234120403972e-06,
"loss": 0.2453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07960276305675507,
"step": 3285,
"valid_targets_mean": 2813.0,
"valid_targets_min": 830
},
{
"epoch": 5.272435897435898,
"grad_norm": 0.9631783328404132,
"learning_rate": 6.986444027374211e-06,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10581400245428085,
"step": 3290,
"valid_targets_mean": 1969.2,
"valid_targets_min": 473
},
{
"epoch": 5.280448717948718,
"grad_norm": 0.9641249779597492,
"learning_rate": 6.925861726463919e-06,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12430629134178162,
"step": 3295,
"valid_targets_mean": 2351.1,
"valid_targets_min": 1181
},
{
"epoch": 5.288461538461538,
"grad_norm": 0.9412615692571877,
"learning_rate": 6.865488185012464e-06,
"loss": 0.2898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1612430363893509,
"step": 3300,
"valid_targets_mean": 2558.1,
"valid_targets_min": 1309
},
{
"epoch": 5.296474358974359,
"grad_norm": 1.0509911379396097,
"learning_rate": 6.805324367025825e-06,
"loss": 0.2505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11822021007537842,
"step": 3305,
"valid_targets_mean": 1644.9,
"valid_targets_min": 299
},
{
"epoch": 5.30448717948718,
"grad_norm": 0.8553682205085341,
"learning_rate": 6.745371233161309e-06,
"loss": 0.249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13173708319664001,
"step": 3310,
"valid_targets_mean": 2514.2,
"valid_targets_min": 548
},
{
"epoch": 5.3125,
"grad_norm": 0.7609829443446366,
"learning_rate": 6.685629740712103e-06,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1069406270980835,
"step": 3315,
"valid_targets_mean": 2430.6,
"valid_targets_min": 1418
},
{
"epoch": 5.32051282051282,
"grad_norm": 0.8915994872025942,
"learning_rate": 6.6261008435920605e-06,
"loss": 0.2464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11810167878866196,
"step": 3320,
"valid_targets_mean": 2207.5,
"valid_targets_min": 1348
},
{
"epoch": 5.328525641025641,
"grad_norm": 0.9796125193027324,
"learning_rate": 6.566785492320471e-06,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13730502128601074,
"step": 3325,
"valid_targets_mean": 1870.9,
"valid_targets_min": 1223
},
{
"epoch": 5.336538461538462,
"grad_norm": 0.8717267812917334,
"learning_rate": 6.507684634006815e-06,
"loss": 0.2306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1494694948196411,
"step": 3330,
"valid_targets_mean": 2862.1,
"valid_targets_min": 1343
},
{
"epoch": 5.344551282051282,
"grad_norm": 0.7268347262067547,
"learning_rate": 6.448799212335734e-06,
"loss": 0.2438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09736894816160202,
"step": 3335,
"valid_targets_mean": 3054.6,
"valid_targets_min": 979
},
{
"epoch": 5.352564102564102,
"grad_norm": 0.9759718449339392,
"learning_rate": 6.390130167551869e-06,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11273542046546936,
"step": 3340,
"valid_targets_mean": 1938.5,
"valid_targets_min": 1000
},
{
"epoch": 5.360576923076923,
"grad_norm": 0.9594102043664786,
"learning_rate": 6.331678436444939e-06,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13123399019241333,
"step": 3345,
"valid_targets_mean": 2063.9,
"valid_targets_min": 994
},
{
"epoch": 5.368589743589744,
"grad_norm": 1.1783899265802422,
"learning_rate": 6.273444952334713e-06,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1367177963256836,
"step": 3350,
"valid_targets_mean": 1565.1,
"valid_targets_min": 945
},
{
"epoch": 5.376602564102564,
"grad_norm": 0.9688205506455062,
"learning_rate": 6.2154306450561175e-06,
"loss": 0.2452,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14453257620334625,
"step": 3355,
"valid_targets_mean": 2148.6,
"valid_targets_min": 1155
},
{
"epoch": 5.384615384615385,
"grad_norm": 0.8744646444334985,
"learning_rate": 6.157636440944445e-06,
"loss": 0.2412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11924951523542404,
"step": 3360,
"valid_targets_mean": 2748.2,
"valid_targets_min": 870
},
{
"epoch": 5.392628205128205,
"grad_norm": 0.9862735226573559,
"learning_rate": 6.100063262820474e-06,
"loss": 0.2568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15304933488368988,
"step": 3365,
"valid_targets_mean": 2384.2,
"valid_targets_min": 851
},
{
"epoch": 5.4006410256410255,
"grad_norm": 0.9764993056093113,
"learning_rate": 6.0427120299758236e-06,
"loss": 0.2421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1572096198797226,
"step": 3370,
"valid_targets_mean": 2534.1,
"valid_targets_min": 1192
},
{
"epoch": 5.408653846153846,
"grad_norm": 0.8959864428190588,
"learning_rate": 5.985583658158212e-06,
"loss": 0.2409,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12945888936519623,
"step": 3375,
"valid_targets_mean": 2567.4,
"valid_targets_min": 1399
},
{
"epoch": 5.416666666666667,
"grad_norm": 0.8552778775133383,
"learning_rate": 5.928679059556852e-06,
"loss": 0.2424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12539073824882507,
"step": 3380,
"valid_targets_mean": 2832.4,
"valid_targets_min": 1346
},
{
"epoch": 5.424679487179487,
"grad_norm": 0.8025920436996826,
"learning_rate": 5.871999142787908e-06,
"loss": 0.2327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13345125317573547,
"step": 3385,
"valid_targets_mean": 3709.1,
"valid_targets_min": 907
},
{
"epoch": 5.4326923076923075,
"grad_norm": 0.8911055708140087,
"learning_rate": 5.815544812879936e-06,
"loss": 0.2465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11404845118522644,
"step": 3390,
"valid_targets_mean": 2082.8,
"valid_targets_min": 615
},
{
"epoch": 5.440705128205128,
"grad_norm": 0.8366878051977619,
"learning_rate": 5.759316971259503e-06,
"loss": 0.2484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10606566071510315,
"step": 3395,
"valid_targets_mean": 2823.0,
"valid_targets_min": 1201
},
{
"epoch": 5.448717948717949,
"grad_norm": 0.8888192039843411,
"learning_rate": 5.703316515736734e-06,
"loss": 0.2548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09152843058109283,
"step": 3400,
"valid_targets_mean": 1674.8,
"valid_targets_min": 946
},
{
"epoch": 5.456730769230769,
"grad_norm": 0.8827382632913743,
"learning_rate": 5.647544340491007e-06,
"loss": 0.2562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13417841494083405,
"step": 3405,
"valid_targets_mean": 2341.6,
"valid_targets_min": 950
},
{
"epoch": 5.464743589743589,
"grad_norm": 0.9348158913522076,
"learning_rate": 5.592001336056659e-06,
"loss": 0.2599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11661595851182938,
"step": 3410,
"valid_targets_mean": 2148.5,
"valid_targets_min": 1151
},
{
"epoch": 5.472756410256411,
"grad_norm": 0.899463165773569,
"learning_rate": 5.536688389308782e-06,
"loss": 0.2133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11449143290519714,
"step": 3415,
"valid_targets_mean": 2986.8,
"valid_targets_min": 1542
},
{
"epoch": 5.480769230769231,
"grad_norm": 1.0221840707566308,
"learning_rate": 5.4816063834490496e-06,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11448987573385239,
"step": 3420,
"valid_targets_mean": 2707.9,
"valid_targets_min": 1385
},
{
"epoch": 5.488782051282051,
"grad_norm": 0.8886976079403867,
"learning_rate": 5.426756197991625e-06,
"loss": 0.2578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12407940626144409,
"step": 3425,
"valid_targets_mean": 2182.8,
"valid_targets_min": 1171
},
{
"epoch": 5.496794871794872,
"grad_norm": 0.9145768030794514,
"learning_rate": 5.372138708749104e-06,
"loss": 0.2468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1369701325893402,
"step": 3430,
"valid_targets_mean": 2594.4,
"valid_targets_min": 1301
},
{
"epoch": 5.5048076923076925,
"grad_norm": 1.009581529355524,
"learning_rate": 5.3177547878185436e-06,
"loss": 0.2506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14793305099010468,
"step": 3435,
"valid_targets_mean": 2712.1,
"valid_targets_min": 1151
},
{
"epoch": 5.512820512820513,
"grad_norm": 0.9955589264699403,
"learning_rate": 5.263605303567532e-06,
"loss": 0.2457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07715998589992523,
"step": 3440,
"valid_targets_mean": 1472.5,
"valid_targets_min": 880
},
{
"epoch": 5.520833333333333,
"grad_norm": 0.9208751898365475,
"learning_rate": 5.20969112062032e-06,
"loss": 0.2693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1354086697101593,
"step": 3445,
"valid_targets_mean": 2418.8,
"valid_targets_min": 730
},
{
"epoch": 5.528846153846154,
"grad_norm": 0.9221623243176863,
"learning_rate": 5.156013099844017e-06,
"loss": 0.247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12082527577877045,
"step": 3450,
"valid_targets_mean": 2732.0,
"valid_targets_min": 682
},
{
"epoch": 5.5368589743589745,
"grad_norm": 0.8920903965938275,
"learning_rate": 5.1025720983348544e-06,
"loss": 0.2383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08986526727676392,
"step": 3455,
"valid_targets_mean": 1880.8,
"valid_targets_min": 358
},
{
"epoch": 5.544871794871795,
"grad_norm": 0.9181262406318845,
"learning_rate": 5.049368969404484e-06,
"loss": 0.2468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16663578152656555,
"step": 3460,
"valid_targets_mean": 2500.4,
"valid_targets_min": 233
},
{
"epoch": 5.552884615384615,
"grad_norm": 0.8756777064811084,
"learning_rate": 4.99640456256636e-06,
"loss": 0.2373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12099698930978775,
"step": 3465,
"valid_targets_mean": 2159.5,
"valid_targets_min": 1234
},
{
"epoch": 5.560897435897436,
"grad_norm": 0.7964295070270689,
"learning_rate": 4.9436797235221814e-06,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1270281970500946,
"step": 3470,
"valid_targets_mean": 3533.8,
"valid_targets_min": 1714
},
{
"epoch": 5.568910256410256,
"grad_norm": 0.8852318618982599,
"learning_rate": 4.891195294148376e-06,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13869354128837585,
"step": 3475,
"valid_targets_mean": 2751.9,
"valid_targets_min": 950
},
{
"epoch": 5.576923076923077,
"grad_norm": 0.9337792028669593,
"learning_rate": 4.838952112482671e-06,
"loss": 0.2423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11898134648799896,
"step": 3480,
"valid_targets_mean": 2228.0,
"valid_targets_min": 981
},
{
"epoch": 5.584935897435898,
"grad_norm": 0.9715871230675452,
"learning_rate": 4.786951012710699e-06,
"loss": 0.2491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11031315475702286,
"step": 3485,
"valid_targets_mean": 1735.4,
"valid_targets_min": 716
},
{
"epoch": 5.592948717948718,
"grad_norm": 1.098570377613153,
"learning_rate": 4.735192825152686e-06,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14487780630588531,
"step": 3490,
"valid_targets_mean": 2629.0,
"valid_targets_min": 1579
},
{
"epoch": 5.600961538461538,
"grad_norm": 1.103661958195554,
"learning_rate": 4.683678376250189e-06,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13785336911678314,
"step": 3495,
"valid_targets_mean": 2487.4,
"valid_targets_min": 718
},
{
"epoch": 5.608974358974359,
"grad_norm": 0.8912416531320945,
"learning_rate": 4.6324084885529086e-06,
"loss": 0.2572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14532919228076935,
"step": 3500,
"valid_targets_mean": 2370.6,
"valid_targets_min": 1463
},
{
"epoch": 5.61698717948718,
"grad_norm": 0.853809946943463,
"learning_rate": 4.581383980705538e-06,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11753176897764206,
"step": 3505,
"valid_targets_mean": 2203.1,
"valid_targets_min": 1053
},
{
"epoch": 5.625,
"grad_norm": 1.0148749521455824,
"learning_rate": 4.530605667434727e-06,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11378777027130127,
"step": 3510,
"valid_targets_mean": 1813.6,
"valid_targets_min": 907
},
{
"epoch": 5.63301282051282,
"grad_norm": 0.8809216737162711,
"learning_rate": 4.480074359536013e-06,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09223954379558563,
"step": 3515,
"valid_targets_mean": 2177.4,
"valid_targets_min": 1163
},
{
"epoch": 5.641025641025641,
"grad_norm": 0.7735268513204762,
"learning_rate": 4.429790863860934e-06,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09695015102624893,
"step": 3520,
"valid_targets_mean": 3094.4,
"valid_targets_min": 1022
},
{
"epoch": 5.649038461538462,
"grad_norm": 0.842148140258802,
"learning_rate": 4.3797559833041146e-06,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19254657626152039,
"step": 3525,
"valid_targets_mean": 4331.0,
"valid_targets_min": 849
},
{
"epoch": 5.657051282051282,
"grad_norm": 0.9672571755633537,
"learning_rate": 4.329970516790447e-06,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08324987441301346,
"step": 3530,
"valid_targets_mean": 1956.8,
"valid_targets_min": 911
},
{
"epoch": 5.665064102564102,
"grad_norm": 0.8246469423610661,
"learning_rate": 4.280435259262363e-06,
"loss": 0.2509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09709151834249496,
"step": 3535,
"valid_targets_mean": 2326.0,
"valid_targets_min": 1127
},
{
"epoch": 5.673076923076923,
"grad_norm": 1.1471517807706315,
"learning_rate": 4.231151001667077e-06,
"loss": 0.2477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12982910871505737,
"step": 3540,
"valid_targets_mean": 2151.2,
"valid_targets_min": 874
},
{
"epoch": 5.681089743589744,
"grad_norm": 0.9991407058243512,
"learning_rate": 4.182118530944044e-06,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1193799376487732,
"step": 3545,
"valid_targets_mean": 1818.6,
"valid_targets_min": 890
},
{
"epoch": 5.689102564102564,
"grad_norm": 1.0600994797819268,
"learning_rate": 4.133338630012307e-06,
"loss": 0.2387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12433040142059326,
"step": 3550,
"valid_targets_mean": 1742.8,
"valid_targets_min": 389
},
{
"epoch": 5.697115384615385,
"grad_norm": 0.9556963156284349,
"learning_rate": 4.0848120777580554e-06,
"loss": 0.2398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1410602331161499,
"step": 3555,
"valid_targets_mean": 2916.0,
"valid_targets_min": 1039
},
{
"epoch": 5.705128205128205,
"grad_norm": 0.9434224405006304,
"learning_rate": 4.036539649022182e-06,
"loss": 0.2604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1809200495481491,
"step": 3560,
"valid_targets_mean": 2309.0,
"valid_targets_min": 958
},
{
"epoch": 5.7131410256410255,
"grad_norm": 0.8716920870064443,
"learning_rate": 3.988522114587865e-06,
"loss": 0.2519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12875115871429443,
"step": 3565,
"valid_targets_mean": 2863.0,
"valid_targets_min": 1614
},
{
"epoch": 5.721153846153846,
"grad_norm": 1.0458563586692415,
"learning_rate": 3.940760241168331e-06,
"loss": 0.2509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11806829273700714,
"step": 3570,
"valid_targets_mean": 1454.2,
"valid_targets_min": 1001
},
{
"epoch": 5.729166666666667,
"grad_norm": 0.9062406947995726,
"learning_rate": 3.893254791394541e-06,
"loss": 0.2395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11536668241024017,
"step": 3575,
"valid_targets_mean": 2212.8,
"valid_targets_min": 1612
},
{
"epoch": 5.737179487179487,
"grad_norm": 1.330022131278515,
"learning_rate": 3.846006523803074e-06,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12758204340934753,
"step": 3580,
"valid_targets_mean": 2525.5,
"valid_targets_min": 1242
},
{
"epoch": 5.7451923076923075,
"grad_norm": 0.8835904952970588,
"learning_rate": 3.799016192823981e-06,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09581005573272705,
"step": 3585,
"valid_targets_mean": 1695.1,
"valid_targets_min": 338
},
{
"epoch": 5.753205128205128,
"grad_norm": 0.9420105033129872,
"learning_rate": 3.7522845487687276e-06,
"loss": 0.2415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14770177006721497,
"step": 3590,
"valid_targets_mean": 2628.4,
"valid_targets_min": 1034
},
{
"epoch": 5.761217948717949,
"grad_norm": 0.8676921782417414,
"learning_rate": 3.7058123378182664e-06,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08950576186180115,
"step": 3595,
"valid_targets_mean": 2229.5,
"valid_targets_min": 812
},
{
"epoch": 5.769230769230769,
"grad_norm": 1.0067847303064097,
"learning_rate": 3.6596003020110636e-06,
"loss": 0.2686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12687063217163086,
"step": 3600,
"valid_targets_mean": 1829.5,
"valid_targets_min": 1329
},
{
"epoch": 5.777243589743589,
"grad_norm": 0.9462956235007977,
"learning_rate": 3.613649179231287e-06,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12175004184246063,
"step": 3605,
"valid_targets_mean": 2789.6,
"valid_targets_min": 1053
},
{
"epoch": 5.785256410256411,
"grad_norm": 0.9538550126840127,
"learning_rate": 3.5679597031970017e-06,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11191975325345993,
"step": 3610,
"valid_targets_mean": 1783.1,
"valid_targets_min": 1165
},
{
"epoch": 5.793269230769231,
"grad_norm": 0.9448665396902267,
"learning_rate": 3.5225326034484764e-06,
"loss": 0.2259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11258763074874878,
"step": 3615,
"valid_targets_mean": 2813.6,
"valid_targets_min": 1010
},
{
"epoch": 5.801282051282051,
"grad_norm": 1.1921602754723932,
"learning_rate": 3.4773686053365197e-06,
"loss": 0.2547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.108152374625206,
"step": 3620,
"valid_targets_mean": 1980.9,
"valid_targets_min": 1051
},
{
"epoch": 5.809294871794872,
"grad_norm": 0.9389437871542158,
"learning_rate": 3.4324684300109003e-06,
"loss": 0.2454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12262805551290512,
"step": 3625,
"valid_targets_mean": 2210.5,
"valid_targets_min": 1501
},
{
"epoch": 5.8173076923076925,
"grad_norm": 0.8936446524664393,
"learning_rate": 3.387832794408832e-06,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11695268750190735,
"step": 3630,
"valid_targets_mean": 2020.8,
"valid_targets_min": 677
},
{
"epoch": 5.825320512820513,
"grad_norm": 0.9701527092625535,
"learning_rate": 3.3434624112435342e-06,
"loss": 0.2494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1281004697084427,
"step": 3635,
"valid_targets_mean": 2187.0,
"valid_targets_min": 1121
},
{
"epoch": 5.833333333333333,
"grad_norm": 0.8743840128057639,
"learning_rate": 3.2993579889928397e-06,
"loss": 0.2543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16947509348392487,
"step": 3640,
"valid_targets_mean": 3233.1,
"valid_targets_min": 1260
},
{
"epoch": 5.841346153846154,
"grad_norm": 1.098032928845481,
"learning_rate": 3.25552023188789e-06,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08012664318084717,
"step": 3645,
"valid_targets_mean": 1645.8,
"valid_targets_min": 299
},
{
"epoch": 5.8493589743589745,
"grad_norm": 0.800014973443817,
"learning_rate": 3.211949839901889e-06,
"loss": 0.2328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13721336424350739,
"step": 3650,
"valid_targets_mean": 3545.6,
"valid_targets_min": 1813
},
{
"epoch": 5.857371794871795,
"grad_norm": 0.8357203359294402,
"learning_rate": 3.168647508738927e-06,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13685111701488495,
"step": 3655,
"valid_targets_mean": 2689.5,
"valid_targets_min": 1076
},
{
"epoch": 5.865384615384615,
"grad_norm": 0.8044023365786744,
"learning_rate": 3.125613929822866e-06,
"loss": 0.2333,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11675594747066498,
"step": 3660,
"valid_targets_mean": 2676.8,
"valid_targets_min": 1320
},
{
"epoch": 5.873397435897436,
"grad_norm": 0.9867169190192657,
"learning_rate": 3.0828497902863106e-06,
"loss": 0.2405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13692760467529297,
"step": 3665,
"valid_targets_mean": 2082.4,
"valid_targets_min": 738
},
{
"epoch": 5.881410256410256,
"grad_norm": 1.033716028166094,
"learning_rate": 3.0403557729596267e-06,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08903215825557709,
"step": 3670,
"valid_targets_mean": 1578.8,
"valid_targets_min": 338
},
{
"epoch": 5.889423076923077,
"grad_norm": 0.9281432052223707,
"learning_rate": 2.998132556360038e-06,
"loss": 0.2475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1471833884716034,
"step": 3675,
"valid_targets_mean": 1990.5,
"valid_targets_min": 991
},
{
"epoch": 5.897435897435898,
"grad_norm": 0.9371734995128413,
"learning_rate": 2.9561808146808068e-06,
"loss": 0.2724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13200689852237701,
"step": 3680,
"valid_targets_mean": 2243.6,
"valid_targets_min": 997
},
{
"epoch": 5.905448717948718,
"grad_norm": 1.0373083841003878,
"learning_rate": 2.9145012177804476e-06,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1324290782213211,
"step": 3685,
"valid_targets_mean": 2374.5,
"valid_targets_min": 386
},
{
"epoch": 5.913461538461538,
"grad_norm": 1.2898842869596276,
"learning_rate": 2.8730944311720454e-06,
"loss": 0.2317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.140394926071167,
"step": 3690,
"valid_targets_mean": 2749.2,
"valid_targets_min": 1277
},
{
"epoch": 5.921474358974359,
"grad_norm": 0.9019036941814247,
"learning_rate": 2.8319611160126226e-06,
"loss": 0.2501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07446151226758957,
"step": 3695,
"valid_targets_mean": 1745.6,
"valid_targets_min": 879
},
{
"epoch": 5.92948717948718,
"grad_norm": 0.8839791385323709,
"learning_rate": 2.791101929092592e-06,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11784940958023071,
"step": 3700,
"valid_targets_mean": 2234.2,
"valid_targets_min": 1195
},
{
"epoch": 5.9375,
"grad_norm": 0.8330181151771336,
"learning_rate": 2.750517522825251e-06,
"loss": 0.25,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13366447389125824,
"step": 3705,
"valid_targets_mean": 2719.9,
"valid_targets_min": 1104
},
{
"epoch": 5.94551282051282,
"grad_norm": 0.9377041217700914,
"learning_rate": 2.710208545236397e-06,
"loss": 0.236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.133009672164917,
"step": 3710,
"valid_targets_mean": 2508.2,
"valid_targets_min": 929
},
{
"epoch": 5.953525641025641,
"grad_norm": 0.9820403258442009,
"learning_rate": 2.670175639953929e-06,
"loss": 0.2568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11438588798046112,
"step": 3715,
"valid_targets_mean": 2220.0,
"valid_targets_min": 1251
},
{
"epoch": 5.961538461538462,
"grad_norm": 0.7615622545783344,
"learning_rate": 2.6304194461976207e-06,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14797644317150116,
"step": 3720,
"valid_targets_mean": 3764.2,
"valid_targets_min": 1940
},
{
"epoch": 5.969551282051282,
"grad_norm": 1.3057101203774155,
"learning_rate": 2.5909405987688896e-06,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12257261574268341,
"step": 3725,
"valid_targets_mean": 2614.1,
"valid_targets_min": 1414
},
{
"epoch": 5.977564102564102,
"grad_norm": 0.9546669568666493,
"learning_rate": 2.5517397280406565e-06,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1352090984582901,
"step": 3730,
"valid_targets_mean": 1989.8,
"valid_targets_min": 1115
},
{
"epoch": 5.985576923076923,
"grad_norm": 0.8381510959729745,
"learning_rate": 2.512817459947312e-06,
"loss": 0.255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1442822366952896,
"step": 3735,
"valid_targets_mean": 2502.4,
"valid_targets_min": 303
},
{
"epoch": 5.993589743589744,
"grad_norm": 0.8381879679213633,
"learning_rate": 2.4741744159746618e-06,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1361812949180603,
"step": 3740,
"valid_targets_mean": 2932.0,
"valid_targets_min": 1390
},
{
"epoch": 6.001602564102564,
"grad_norm": 0.8973578582889672,
"learning_rate": 2.435811213150079e-06,
"loss": 0.2243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11854055523872375,
"step": 3745,
"valid_targets_mean": 2506.2,
"valid_targets_min": 1387
},
{
"epoch": 6.009615384615385,
"grad_norm": 0.8534114522962257,
"learning_rate": 2.3977284640325805e-06,
"loss": 0.2357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10698527097702026,
"step": 3750,
"valid_targets_mean": 2164.8,
"valid_targets_min": 1463
},
{
"epoch": 6.017628205128205,
"grad_norm": 1.0624803521960697,
"learning_rate": 2.359926776703092e-06,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16178178787231445,
"step": 3755,
"valid_targets_mean": 1912.1,
"valid_targets_min": 1224
},
{
"epoch": 6.0256410256410255,
"grad_norm": 0.9211420738337137,
"learning_rate": 2.3224067547547357e-06,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1036263182759285,
"step": 3760,
"valid_targets_mean": 1760.0,
"valid_targets_min": 351
},
{
"epoch": 6.033653846153846,
"grad_norm": 0.9051511202364992,
"learning_rate": 2.2851689972831536e-06,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11598742753267288,
"step": 3765,
"valid_targets_mean": 2061.2,
"valid_targets_min": 618
},
{
"epoch": 6.041666666666667,
"grad_norm": 0.9418108298812553,
"learning_rate": 2.248214098877002e-06,
"loss": 0.2336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10721792280673981,
"step": 3770,
"valid_targets_mean": 1872.5,
"valid_targets_min": 314
},
{
"epoch": 6.049679487179487,
"grad_norm": 0.9797618243041817,
"learning_rate": 2.2115426496083958e-06,
"loss": 0.2498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11505149304866791,
"step": 3775,
"valid_targets_mean": 1678.6,
"valid_targets_min": 303
},
{
"epoch": 6.0576923076923075,
"grad_norm": 0.993599072618345,
"learning_rate": 2.175155235023536e-06,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11126979440450668,
"step": 3780,
"valid_targets_mean": 1965.8,
"valid_targets_min": 395
},
{
"epoch": 6.065705128205129,
"grad_norm": 1.2166175998444293,
"learning_rate": 2.1390524361333355e-06,
"loss": 0.2055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11817347258329391,
"step": 3785,
"valid_targets_mean": 2711.9,
"valid_targets_min": 1262
},
{
"epoch": 6.073717948717949,
"grad_norm": 1.0184639512858285,
"learning_rate": 2.1032348294041305e-06,
"loss": 0.243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10550463944673538,
"step": 3790,
"valid_targets_mean": 2176.2,
"valid_targets_min": 413
},
{
"epoch": 6.081730769230769,
"grad_norm": 0.8816372867971991,
"learning_rate": 2.067702986748521e-06,
"loss": 0.2356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13984540104866028,
"step": 3795,
"valid_targets_mean": 2715.6,
"valid_targets_min": 1046
},
{
"epoch": 6.089743589743589,
"grad_norm": 0.856756363743796,
"learning_rate": 2.0324574755161764e-06,
"loss": 0.2158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11478455364704132,
"step": 3800,
"valid_targets_mean": 3045.0,
"valid_targets_min": 1110
},
{
"epoch": 6.097756410256411,
"grad_norm": 1.014237638787344,
"learning_rate": 1.9974988584848385e-06,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15924817323684692,
"step": 3805,
"valid_targets_mean": 2288.0,
"valid_targets_min": 552
},
{
"epoch": 6.105769230769231,
"grad_norm": 0.7358071224075459,
"learning_rate": 1.96282769385129e-06,
"loss": 0.2368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16144993901252747,
"step": 3810,
"valid_targets_mean": 3920.1,
"valid_targets_min": 1087
},
{
"epoch": 6.113782051282051,
"grad_norm": 0.8095160537437991,
"learning_rate": 1.9284445352224625e-06,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12894617021083832,
"step": 3815,
"valid_targets_mean": 4050.4,
"valid_targets_min": 1416
},
{
"epoch": 6.121794871794871,
"grad_norm": 0.8248147276134351,
"learning_rate": 1.894349931606596e-06,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10038469731807709,
"step": 3820,
"valid_targets_mean": 2216.5,
"valid_targets_min": 1070
},
{
"epoch": 6.1298076923076925,
"grad_norm": 0.9659691832090724,
"learning_rate": 1.8605444274044493e-06,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13512755930423737,
"step": 3825,
"valid_targets_mean": 3244.0,
"valid_targets_min": 1432
},
{
"epoch": 6.137820512820513,
"grad_norm": 1.0862713671449233,
"learning_rate": 1.827028562400659e-06,
"loss": 0.238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09466798603534698,
"step": 3830,
"valid_targets_mean": 1761.5,
"valid_targets_min": 1029
},
{
"epoch": 6.145833333333333,
"grad_norm": 0.8998914205168546,
"learning_rate": 1.793802871755066e-06,
"loss": 0.2381,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13006693124771118,
"step": 3835,
"valid_targets_mean": 2522.0,
"valid_targets_min": 892
},
{
"epoch": 6.153846153846154,
"grad_norm": 0.9432779658728595,
"learning_rate": 1.760867885994202e-06,
"loss": 0.2438,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1070912778377533,
"step": 3840,
"valid_targets_mean": 1912.8,
"valid_targets_min": 898
},
{
"epoch": 6.1618589743589745,
"grad_norm": 0.9338261525659013,
"learning_rate": 1.7282241310028047e-06,
"loss": 0.2407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0991261750459671,
"step": 3845,
"valid_targets_mean": 1827.0,
"valid_targets_min": 816
},
{
"epoch": 6.169871794871795,
"grad_norm": 0.8125279588220881,
"learning_rate": 1.6958721280154232e-06,
"loss": 0.2384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09734629094600677,
"step": 3850,
"valid_targets_mean": 2683.1,
"valid_targets_min": 1626
},
{
"epoch": 6.177884615384615,
"grad_norm": 0.8247615418877465,
"learning_rate": 1.6638123936081085e-06,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10162614285945892,
"step": 3855,
"valid_targets_mean": 3007.8,
"valid_targets_min": 1285
},
{
"epoch": 6.185897435897436,
"grad_norm": 1.054167152401939,
"learning_rate": 1.6320454396901463e-06,
"loss": 0.2522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17180277407169342,
"step": 3860,
"valid_targets_mean": 2394.8,
"valid_targets_min": 835
},
{
"epoch": 6.193910256410256,
"grad_norm": 0.861439666599418,
"learning_rate": 1.6005717734958914e-06,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10443761199712753,
"step": 3865,
"valid_targets_mean": 2728.1,
"valid_targets_min": 1162
},
{
"epoch": 6.201923076923077,
"grad_norm": 1.1126631206428137,
"learning_rate": 1.569391897576671e-06,
"loss": 0.2305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13118451833724976,
"step": 3870,
"valid_targets_mean": 3325.9,
"valid_targets_min": 1334
},
{
"epoch": 6.209935897435898,
"grad_norm": 1.1962641290378953,
"learning_rate": 1.5385063097927533e-06,
"loss": 0.2458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15093114972114563,
"step": 3875,
"valid_targets_mean": 1901.5,
"valid_targets_min": 717
},
{
"epoch": 6.217948717948718,
"grad_norm": 0.8163609568748574,
"learning_rate": 1.5079155033054104e-06,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12418213486671448,
"step": 3880,
"valid_targets_mean": 3363.8,
"valid_targets_min": 1873
},
{
"epoch": 6.225961538461538,
"grad_norm": 0.8700233982216152,
"learning_rate": 1.4776199665690239e-06,
"loss": 0.2315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14278334379196167,
"step": 3885,
"valid_targets_mean": 2949.2,
"valid_targets_min": 2107
},
{
"epoch": 6.233974358974359,
"grad_norm": 0.9683775134031113,
"learning_rate": 1.4476201833233084e-06,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1428484171628952,
"step": 3890,
"valid_targets_mean": 2313.9,
"valid_targets_min": 904
},
{
"epoch": 6.24198717948718,
"grad_norm": 0.8620465618712795,
"learning_rate": 1.4179166325855676e-06,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10901591181755066,
"step": 3895,
"valid_targets_mean": 2681.1,
"valid_targets_min": 1417
},
{
"epoch": 6.25,
"grad_norm": 1.0173933841157816,
"learning_rate": 1.3885097886430599e-06,
"loss": 0.2307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11926823854446411,
"step": 3900,
"valid_targets_mean": 1679.1,
"valid_targets_min": 776
},
{
"epoch": 6.25801282051282,
"grad_norm": 0.9589762435954294,
"learning_rate": 1.35940012104542e-06,
"loss": 0.229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11792376637458801,
"step": 3905,
"valid_targets_mean": 2086.9,
"valid_targets_min": 1173
},
{
"epoch": 6.266025641025641,
"grad_norm": 0.8272561272888953,
"learning_rate": 1.3305880945971583e-06,
"loss": 0.2197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11362828314304352,
"step": 3910,
"valid_targets_mean": 2718.2,
"valid_targets_min": 1210
},
{
"epoch": 6.274038461538462,
"grad_norm": 0.874758503329499,
"learning_rate": 1.3020741693502403e-06,
"loss": 0.2244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11108657717704773,
"step": 3915,
"valid_targets_mean": 2434.9,
"valid_targets_min": 876
},
{
"epoch": 6.282051282051282,
"grad_norm": 0.9079477576801739,
"learning_rate": 1.27385880059675e-06,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12969839572906494,
"step": 3920,
"valid_targets_mean": 2454.9,
"valid_targets_min": 1137
},
{
"epoch": 6.290064102564102,
"grad_norm": 2.0808279255459916,
"learning_rate": 1.245942438861607e-06,
"loss": 0.2313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14092810451984406,
"step": 3925,
"valid_targets_mean": 4037.8,
"valid_targets_min": 1906
},
{
"epoch": 6.298076923076923,
"grad_norm": 0.899393114401227,
"learning_rate": 1.2183255298953788e-06,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11960645020008087,
"step": 3930,
"valid_targets_mean": 2517.6,
"valid_targets_min": 294
},
{
"epoch": 6.306089743589744,
"grad_norm": 0.8903825930436158,
"learning_rate": 1.1910085146671645e-06,
"loss": 0.2335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09993119537830353,
"step": 3935,
"valid_targets_mean": 2103.9,
"valid_targets_min": 947
},
{
"epoch": 6.314102564102564,
"grad_norm": 0.954308249771596,
"learning_rate": 1.1639918293575492e-06,
"loss": 0.2362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10835768282413483,
"step": 3940,
"valid_targets_mean": 2119.8,
"valid_targets_min": 872
},
{
"epoch": 6.322115384615385,
"grad_norm": 0.7514063558774706,
"learning_rate": 1.1372759053516536e-06,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07814587652683258,
"step": 3945,
"valid_targets_mean": 1868.4,
"valid_targets_min": 1116
},
{
"epoch": 6.330128205128205,
"grad_norm": 1.2072460679937176,
"learning_rate": 1.1108611692322157e-06,
"loss": 0.2302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12843677401542664,
"step": 3950,
"valid_targets_mean": 2542.8,
"valid_targets_min": 1621
},
{
"epoch": 6.3381410256410255,
"grad_norm": 1.0878840127555423,
"learning_rate": 1.0847480427728142e-06,
"loss": 0.2446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1504746973514557,
"step": 3955,
"valid_targets_mean": 2188.8,
"valid_targets_min": 1581
},
{
"epoch": 6.346153846153846,
"grad_norm": 0.9562102985761943,
"learning_rate": 1.0589369429311125e-06,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13461454212665558,
"step": 3960,
"valid_targets_mean": 2561.5,
"valid_targets_min": 1333
},
{
"epoch": 6.354166666666667,
"grad_norm": 0.9752919981880385,
"learning_rate": 1.0334282818422037e-06,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1450095921754837,
"step": 3965,
"valid_targets_mean": 2425.1,
"valid_targets_min": 1062
},
{
"epoch": 6.362179487179487,
"grad_norm": 1.5311355387380936,
"learning_rate": 1.008222466812041e-06,
"loss": 0.2553,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07920059561729431,
"step": 3970,
"valid_targets_mean": 2347.8,
"valid_targets_min": 966
},
{
"epoch": 6.3701923076923075,
"grad_norm": 1.0924705252685218,
"learning_rate": 9.83319900310915e-07,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12321265786886215,
"step": 3975,
"valid_targets_mean": 2116.4,
"valid_targets_min": 1230
},
{
"epoch": 6.378205128205128,
"grad_norm": 0.9640948057385402,
"learning_rate": 9.587209799670495e-07,
"loss": 0.2377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11751890182495117,
"step": 3980,
"valid_targets_mean": 2322.9,
"valid_targets_min": 1085
},
{
"epoch": 6.386217948717949,
"grad_norm": 1.079236125695824,
"learning_rate": 9.344260985602327e-07,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16698667407035828,
"step": 3985,
"valid_targets_mean": 1949.1,
"valid_targets_min": 812
},
{
"epoch": 6.394230769230769,
"grad_norm": 1.0803656519063216,
"learning_rate": 9.104356440155526e-07,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.140387624502182,
"step": 3990,
"valid_targets_mean": 2234.5,
"valid_targets_min": 1183
},
{
"epoch": 6.402243589743589,
"grad_norm": 0.8456195863558014,
"learning_rate": 8.867499993972162e-07,
"loss": 0.2328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13046512007713318,
"step": 3995,
"valid_targets_mean": 3625.6,
"valid_targets_min": 979
},
{
"epoch": 6.410256410256411,
"grad_norm": 0.8977134484616605,
"learning_rate": 8.633695429024058e-07,
"loss": 0.2384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10581670701503754,
"step": 4000,
"valid_targets_mean": 2741.9,
"valid_targets_min": 921
},
{
"epoch": 6.418269230769231,
"grad_norm": 0.7948378106951604,
"learning_rate": 8.402946478552732e-07,
"loss": 0.2253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09752516448497772,
"step": 4005,
"valid_targets_mean": 3156.9,
"valid_targets_min": 473
},
{
"epoch": 6.426282051282051,
"grad_norm": 0.8443688864845404,
"learning_rate": 8.175256827009392e-07,
"loss": 0.2344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10218418389558792,
"step": 4010,
"valid_targets_mean": 2307.0,
"valid_targets_min": 1029
},
{
"epoch": 6.434294871794872,
"grad_norm": 1.7792482258762818,
"learning_rate": 7.95063010999646e-07,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09822884202003479,
"step": 4015,
"valid_targets_mean": 1924.8,
"valid_targets_min": 981
},
{
"epoch": 6.4423076923076925,
"grad_norm": 0.926606896282617,
"learning_rate": 7.729069914209409e-07,
"loss": 0.2308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11828078329563141,
"step": 4020,
"valid_targets_mean": 2529.9,
"valid_targets_min": 1042
},
{
"epoch": 6.450320512820513,
"grad_norm": 1.0827086250732898,
"learning_rate": 7.510579777379345e-07,
"loss": 0.2326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10486094653606415,
"step": 4025,
"valid_targets_mean": 1429.4,
"valid_targets_min": 297
},
{
"epoch": 6.458333333333333,
"grad_norm": 0.9839272238313078,
"learning_rate": 7.295163188216792e-07,
"loss": 0.2348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1142701581120491,
"step": 4030,
"valid_targets_mean": 2105.8,
"valid_targets_min": 973
},
{
"epoch": 6.466346153846154,
"grad_norm": 0.9291054329783041,
"learning_rate": 7.08282358635568e-07,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12670905888080597,
"step": 4035,
"valid_targets_mean": 2173.2,
"valid_targets_min": 1040
},
{
"epoch": 6.4743589743589745,
"grad_norm": 0.9426259395664396,
"learning_rate": 6.87356436229869e-07,
"loss": 0.2555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12212735414505005,
"step": 4040,
"valid_targets_mean": 1812.4,
"valid_targets_min": 1033
},
{
"epoch": 6.482371794871795,
"grad_norm": 0.7380513636736298,
"learning_rate": 6.667388857362977e-07,
"loss": 0.2367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09599901735782623,
"step": 4045,
"valid_targets_mean": 2941.8,
"valid_targets_min": 934
},
{
"epoch": 6.490384615384615,
"grad_norm": 0.9099419008308579,
"learning_rate": 6.464300363626797e-07,
"loss": 0.2327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11146557331085205,
"step": 4050,
"valid_targets_mean": 2807.4,
"valid_targets_min": 968
},
{
"epoch": 6.498397435897436,
"grad_norm": 0.9809559308191058,
"learning_rate": 6.264302123877053e-07,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11797185242176056,
"step": 4055,
"valid_targets_mean": 2723.9,
"valid_targets_min": 1600
},
{
"epoch": 6.506410256410256,
"grad_norm": 0.9350599141578312,
"learning_rate": 6.067397331557412e-07,
"loss": 0.2368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12935124337673187,
"step": 4060,
"valid_targets_mean": 2216.0,
"valid_targets_min": 1135
},
{
"epoch": 6.514423076923077,
"grad_norm": 1.4016198586806865,
"learning_rate": 5.873589130717405e-07,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12601718306541443,
"step": 4065,
"valid_targets_mean": 1985.8,
"valid_targets_min": 1158
},
{
"epoch": 6.522435897435898,
"grad_norm": 0.8251427320454606,
"learning_rate": 5.682880615962116e-07,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10815025866031647,
"step": 4070,
"valid_targets_mean": 2696.6,
"valid_targets_min": 1190
},
{
"epoch": 6.530448717948718,
"grad_norm": 0.8955660099878735,
"learning_rate": 5.495274832402841e-07,
"loss": 0.2244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10643479228019714,
"step": 4075,
"valid_targets_mean": 2961.2,
"valid_targets_min": 886
},
{
"epoch": 6.538461538461538,
"grad_norm": 0.9604493791278844,
"learning_rate": 5.310774775608529e-07,
"loss": 0.2425,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1176200807094574,
"step": 4080,
"valid_targets_mean": 2403.2,
"valid_targets_min": 654
},
{
"epoch": 6.546474358974359,
"grad_norm": 0.9762190869394272,
"learning_rate": 5.129383391557751e-07,
"loss": 0.253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1663392037153244,
"step": 4085,
"valid_targets_mean": 1939.5,
"valid_targets_min": 855
},
{
"epoch": 6.55448717948718,
"grad_norm": 0.842222470742701,
"learning_rate": 4.951103576591876e-07,
"loss": 0.225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10071545094251633,
"step": 4090,
"valid_targets_mean": 2852.8,
"valid_targets_min": 1331
},
{
"epoch": 6.5625,
"grad_norm": 0.9307268460212219,
"learning_rate": 4.7759381773687e-07,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11373141407966614,
"step": 4095,
"valid_targets_mean": 2556.9,
"valid_targets_min": 913
},
{
"epoch": 6.57051282051282,
"grad_norm": 0.8457918011171499,
"learning_rate": 4.6038899908170234e-07,
"loss": 0.2277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13154616951942444,
"step": 4100,
"valid_targets_mean": 2821.9,
"valid_targets_min": 1106
},
{
"epoch": 6.578525641025641,
"grad_norm": 0.8387894923769624,
"learning_rate": 4.4349617640920164e-07,
"loss": 0.2495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1035970151424408,
"step": 4105,
"valid_targets_mean": 1948.8,
"valid_targets_min": 1123
},
{
"epoch": 6.586538461538462,
"grad_norm": 0.9037859502058307,
"learning_rate": 4.2691561945312764e-07,
"loss": 0.2328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1121777892112732,
"step": 4110,
"valid_targets_mean": 2629.9,
"valid_targets_min": 1407
},
{
"epoch": 6.594551282051282,
"grad_norm": 0.8863493487648947,
"learning_rate": 4.106475929611886e-07,
"loss": 0.2289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11576659977436066,
"step": 4115,
"valid_targets_mean": 2561.9,
"valid_targets_min": 1661
},
{
"epoch": 6.602564102564102,
"grad_norm": 0.8878216680524392,
"learning_rate": 3.9469235669080007e-07,
"loss": 0.2276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10847125947475433,
"step": 4120,
"valid_targets_mean": 2641.6,
"valid_targets_min": 1118
},
{
"epoch": 6.610576923076923,
"grad_norm": 1.0358019265981901,
"learning_rate": 3.7905016540495053e-07,
"loss": 0.2547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11162734031677246,
"step": 4125,
"valid_targets_mean": 1598.9,
"valid_targets_min": 508
},
{
"epoch": 6.618589743589744,
"grad_norm": 0.7745868367967038,
"learning_rate": 3.63721268868118e-07,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0914057046175003,
"step": 4130,
"valid_targets_mean": 2922.6,
"valid_targets_min": 1394
},
{
"epoch": 6.626602564102564,
"grad_norm": 1.0567183316790034,
"learning_rate": 3.487059118422997e-07,
"loss": 0.2458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11103471368551254,
"step": 4135,
"valid_targets_mean": 1526.8,
"valid_targets_min": 417
},
{
"epoch": 6.634615384615385,
"grad_norm": 0.7607762113223796,
"learning_rate": 3.3400433408308895e-07,
"loss": 0.2299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09019508957862854,
"step": 4140,
"valid_targets_mean": 2316.9,
"valid_targets_min": 447
},
{
"epoch": 6.642628205128205,
"grad_norm": 0.8802472861580645,
"learning_rate": 3.196167703358577e-07,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1006564050912857,
"step": 4145,
"valid_targets_mean": 2205.8,
"valid_targets_min": 945
},
{
"epoch": 6.6506410256410255,
"grad_norm": 0.8730051710281508,
"learning_rate": 3.0554345033199985e-07,
"loss": 0.2292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12638235092163086,
"step": 4150,
"valid_targets_mean": 3004.1,
"valid_targets_min": 796
},
{
"epoch": 6.658653846153846,
"grad_norm": 1.1553489157125603,
"learning_rate": 2.917845987852652e-07,
"loss": 0.2415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1155930757522583,
"step": 4155,
"valid_targets_mean": 2950.5,
"valid_targets_min": 1269
},
{
"epoch": 6.666666666666667,
"grad_norm": 0.8952157916587886,
"learning_rate": 2.783404353881758e-07,
"loss": 0.2424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08050580322742462,
"step": 4160,
"valid_targets_mean": 2010.8,
"valid_targets_min": 1010
},
{
"epoch": 6.674679487179487,
"grad_norm": 0.9408776457030263,
"learning_rate": 2.652111748085151e-07,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11845621466636658,
"step": 4165,
"valid_targets_mean": 2520.0,
"valid_targets_min": 1905
},
{
"epoch": 6.6826923076923075,
"grad_norm": 1.0642164005801316,
"learning_rate": 2.523970266859044e-07,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15462008118629456,
"step": 4170,
"valid_targets_mean": 2359.5,
"valid_targets_min": 1170
},
{
"epoch": 6.690705128205128,
"grad_norm": 0.9995337282018758,
"learning_rate": 2.398981956284363e-07,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1114429384469986,
"step": 4175,
"valid_targets_mean": 1883.6,
"valid_targets_min": 1075
},
{
"epoch": 6.698717948717949,
"grad_norm": 0.8561185272458319,
"learning_rate": 2.2771488120944207e-07,
"loss": 0.2402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11397942900657654,
"step": 4180,
"valid_targets_mean": 2592.9,
"valid_targets_min": 1095
},
{
"epoch": 6.706730769230769,
"grad_norm": 0.9740156202400301,
"learning_rate": 2.1584727796427174e-07,
"loss": 0.2387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14512796700000763,
"step": 4185,
"valid_targets_mean": 2518.9,
"valid_targets_min": 973
},
{
"epoch": 6.714743589743589,
"grad_norm": 1.1588496532617867,
"learning_rate": 2.0429557538720556e-07,
"loss": 0.2329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1153675764799118,
"step": 4190,
"valid_targets_mean": 2192.1,
"valid_targets_min": 1588
},
{
"epoch": 6.722756410256411,
"grad_norm": 0.8519923964077011,
"learning_rate": 1.930599579284298e-07,
"loss": 0.2283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10996921360492706,
"step": 4195,
"valid_targets_mean": 2487.8,
"valid_targets_min": 1049
},
{
"epoch": 6.730769230769231,
"grad_norm": 1.0100576905261862,
"learning_rate": 1.8214060499107679e-07,
"loss": 0.2561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1439555585384369,
"step": 4200,
"valid_targets_mean": 2279.6,
"valid_targets_min": 1079
},
{
"epoch": 6.738782051282051,
"grad_norm": 0.8166556725836737,
"learning_rate": 1.7153769092837614e-07,
"loss": 0.2148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10187620669603348,
"step": 4205,
"valid_targets_mean": 3076.2,
"valid_targets_min": 1198
},
{
"epoch": 6.746794871794872,
"grad_norm": 0.8522985195219519,
"learning_rate": 1.6125138504086146e-07,
"loss": 0.2387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.122517429292202,
"step": 4210,
"valid_targets_mean": 2788.5,
"valid_targets_min": 1052
},
{
"epoch": 6.7548076923076925,
"grad_norm": 1.04741022514734,
"learning_rate": 1.5128185157367247e-07,
"loss": 0.2353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11223140358924866,
"step": 4215,
"valid_targets_mean": 1682.9,
"valid_targets_min": 944
},
{
"epoch": 6.762820512820513,
"grad_norm": 1.0466928727574043,
"learning_rate": 1.4162924971393044e-07,
"loss": 0.2618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1298060417175293,
"step": 4220,
"valid_targets_mean": 1969.2,
"valid_targets_min": 292
},
{
"epoch": 6.770833333333333,
"grad_norm": 0.8061561581755782,
"learning_rate": 1.322937335881891e-07,
"loss": 0.2473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16025656461715698,
"step": 4225,
"valid_targets_mean": 3525.5,
"valid_targets_min": 877
},
{
"epoch": 6.778846153846154,
"grad_norm": 0.9449521007617103,
"learning_rate": 1.2327545225999215e-07,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11590196937322617,
"step": 4230,
"valid_targets_mean": 2609.0,
"valid_targets_min": 1021
},
{
"epoch": 6.7868589743589745,
"grad_norm": 0.925371088266695,
"learning_rate": 1.145745497274664e-07,
"loss": 0.2468,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14536672830581665,
"step": 4235,
"valid_targets_mean": 2727.6,
"valid_targets_min": 1387
},
{
"epoch": 6.794871794871795,
"grad_norm": 0.7532084104831867,
"learning_rate": 1.061911649210523e-07,
"loss": 0.226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07455575466156006,
"step": 4240,
"valid_targets_mean": 2051.8,
"valid_targets_min": 371
},
{
"epoch": 6.802884615384615,
"grad_norm": 0.9954452940831777,
"learning_rate": 9.812543170126365e-08,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11818395555019379,
"step": 4245,
"valid_targets_mean": 2523.9,
"valid_targets_min": 1100
},
{
"epoch": 6.810897435897436,
"grad_norm": 0.8810844606785796,
"learning_rate": 9.03774788565559e-08,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10779982805252075,
"step": 4250,
"valid_targets_mean": 2419.9,
"valid_targets_min": 1234
},
{
"epoch": 6.818910256410256,
"grad_norm": 0.7587255090249656,
"learning_rate": 8.294743010127448e-08,
"loss": 0.2293,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09742031991481781,
"step": 4255,
"valid_targets_mean": 2819.4,
"valid_targets_min": 1493
},
{
"epoch": 6.826923076923077,
"grad_norm": 0.9186887291366199,
"learning_rate": 7.583540407367418e-08,
"loss": 0.2325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11129537224769592,
"step": 4260,
"valid_targets_mean": 2361.5,
"valid_targets_min": 1146
},
{
"epoch": 6.834935897435898,
"grad_norm": 0.8638613619075678,
"learning_rate": 6.904151433402728e-08,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10862366110086441,
"step": 4265,
"valid_targets_mean": 2177.1,
"valid_targets_min": 1521
},
{
"epoch": 6.842948717948718,
"grad_norm": 0.887431984510552,
"learning_rate": 6.256586936281172e-08,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12638813257217407,
"step": 4270,
"valid_targets_mean": 2991.6,
"valid_targets_min": 1543
},
{
"epoch": 6.850961538461538,
"grad_norm": 1.0013091054241623,
"learning_rate": 5.6408572558972475e-08,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11181466281414032,
"step": 4275,
"valid_targets_mean": 1893.5,
"valid_targets_min": 1160
},
{
"epoch": 6.858974358974359,
"grad_norm": 1.0227568011240404,
"learning_rate": 5.0569722238280605e-08,
"loss": 0.246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16308793425559998,
"step": 4280,
"valid_targets_mean": 2498.2,
"valid_targets_min": 997
},
{
"epoch": 6.86698717948718,
"grad_norm": 0.9842765844108,
"learning_rate": 4.504941163175236e-08,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12176279723644257,
"step": 4285,
"valid_targets_mean": 1907.0,
"valid_targets_min": 953
},
{
"epoch": 6.875,
"grad_norm": 1.3291503879689117,
"learning_rate": 3.984772888417032e-08,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11058434844017029,
"step": 4290,
"valid_targets_mean": 2407.4,
"valid_targets_min": 1244
},
{
"epoch": 6.88301282051282,
"grad_norm": 0.7907667503962194,
"learning_rate": 3.4964757052671216e-08,
"loss": 0.2245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07719993591308594,
"step": 4295,
"valid_targets_mean": 2425.5,
"valid_targets_min": 882
},
{
"epoch": 6.891025641025641,
"grad_norm": 0.9147924117446959,
"learning_rate": 3.0400574105415856e-08,
"loss": 0.2184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11411920189857483,
"step": 4300,
"valid_targets_mean": 2327.2,
"valid_targets_min": 1051
},
{
"epoch": 6.899038461538462,
"grad_norm": 0.8184445022532079,
"learning_rate": 2.615525292035459e-08,
"loss": 0.2269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10698746144771576,
"step": 4305,
"valid_targets_mean": 3427.0,
"valid_targets_min": 1359
},
{
"epoch": 6.907051282051282,
"grad_norm": 0.969049875717242,
"learning_rate": 2.222886128405266e-08,
"loss": 0.2434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09935212880373001,
"step": 4310,
"valid_targets_mean": 2346.5,
"valid_targets_min": 446
},
{
"epoch": 6.915064102564102,
"grad_norm": 0.8366135689501649,
"learning_rate": 1.8621461890617752e-08,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10085824131965637,
"step": 4315,
"valid_targets_mean": 2112.9,
"valid_targets_min": 1382
},
{
"epoch": 6.923076923076923,
"grad_norm": 0.9757835486083863,
"learning_rate": 1.5333112340687463e-08,
"loss": 0.243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1587846875190735,
"step": 4320,
"valid_targets_mean": 2357.0,
"valid_targets_min": 845
},
{
"epoch": 6.931089743589744,
"grad_norm": 0.7896507256157604,
"learning_rate": 1.2363865140518905e-08,
"loss": 0.2664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1322735846042633,
"step": 4325,
"valid_targets_mean": 2378.5,
"valid_targets_min": 1000
},
{
"epoch": 6.939102564102564,
"grad_norm": 0.7394443171363577,
"learning_rate": 9.713767701151621e-09,
"loss": 0.2228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10028460621833801,
"step": 4330,
"valid_targets_mean": 3140.5,
"valid_targets_min": 1022
},
{
"epoch": 6.947115384615385,
"grad_norm": 0.937378550902355,
"learning_rate": 7.382862337641516e-09,
"loss": 0.2423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1184074729681015,
"step": 4335,
"valid_targets_mean": 2002.2,
"valid_targets_min": 883
},
{
"epoch": 6.955128205128205,
"grad_norm": 0.8929545659767167,
"learning_rate": 5.371186268390283e-09,
"loss": 0.2459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0951998233795166,
"step": 4340,
"valid_targets_mean": 2122.8,
"valid_targets_min": 385
},
{
"epoch": 6.9631410256410255,
"grad_norm": 0.8450524750277165,
"learning_rate": 3.678771614550325e-09,
"loss": 0.261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1101217120885849,
"step": 4345,
"valid_targets_mean": 1946.5,
"valid_targets_min": 865
},
{
"epoch": 6.971153846153846,
"grad_norm": 0.8222550737458072,
"learning_rate": 2.3056453995162763e-09,
"loss": 0.2313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06940317898988724,
"step": 4350,
"valid_targets_mean": 1825.2,
"valid_targets_min": 803
},
{
"epoch": 6.979166666666667,
"grad_norm": 0.9510199952831588,
"learning_rate": 1.2518295484875708e-09,
"loss": 0.2619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10881343483924866,
"step": 4355,
"valid_targets_mean": 1923.4,
"valid_targets_min": 672
},
{
"epoch": 6.987179487179487,
"grad_norm": 0.9425580090389156,
"learning_rate": 5.173408881198328e-10,
"loss": 0.2432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1133669912815094,
"step": 4360,
"valid_targets_mean": 1864.9,
"valid_targets_min": 1216
},
{
"epoch": 6.9951923076923075,
"grad_norm": 0.9452987456146136,
"learning_rate": 1.0219114625398263e-10,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13046550750732422,
"step": 4365,
"valid_targets_mean": 2728.5,
"valid_targets_min": 1249
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06942301988601685,
"step": 4368,
"total_flos": 7.09204861186474e+17,
"train_loss": 0.32849771289270874,
"train_runtime": 20331.9971,
"train_samples_per_second": 3.436,
"train_steps_per_second": 0.215,
"valid_targets_mean": 1305.1,
"valid_targets_min": 490
}
],
"logging_steps": 5,
"max_steps": 4368,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 7.09204861186474e+17,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}