a1-stack_phpunit / trainer_state.json
EtashGuha's picture
Upload folder using huggingface_hub
0a0b04d verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4627,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.007564296520423601,
"grad_norm": 19.058784422912282,
"learning_rate": 3.455723542116631e-07,
"loss": 0.7153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7505241632461548,
"step": 5,
"valid_targets_mean": 3790.7,
"valid_targets_min": 239
},
{
"epoch": 0.015128593040847202,
"grad_norm": 17.486795894826894,
"learning_rate": 7.77537796976242e-07,
"loss": 0.6813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6587737798690796,
"step": 10,
"valid_targets_mean": 5055.8,
"valid_targets_min": 943
},
{
"epoch": 0.0226928895612708,
"grad_norm": 17.853758617180958,
"learning_rate": 1.209503239740821e-06,
"loss": 0.71,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7153316736221313,
"step": 15,
"valid_targets_mean": 5290.3,
"valid_targets_min": 803
},
{
"epoch": 0.030257186081694403,
"grad_norm": 13.456561875333087,
"learning_rate": 1.6414686825053995e-06,
"loss": 0.6532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6719971895217896,
"step": 20,
"valid_targets_mean": 4477.1,
"valid_targets_min": 461
},
{
"epoch": 0.037821482602118005,
"grad_norm": 8.589481200641513,
"learning_rate": 2.0734341252699786e-06,
"loss": 0.5971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6080985069274902,
"step": 25,
"valid_targets_mean": 4065.7,
"valid_targets_min": 797
},
{
"epoch": 0.0453857791225416,
"grad_norm": 4.7772774074698585,
"learning_rate": 2.505399568034557e-06,
"loss": 0.5155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4876701831817627,
"step": 30,
"valid_targets_mean": 5669.8,
"valid_targets_min": 727
},
{
"epoch": 0.0529500756429652,
"grad_norm": 2.9036893563370665,
"learning_rate": 2.9373650107991366e-06,
"loss": 0.4905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44498470425605774,
"step": 35,
"valid_targets_mean": 4442.9,
"valid_targets_min": 795
},
{
"epoch": 0.060514372163388806,
"grad_norm": 1.5763541463717798,
"learning_rate": 3.369330453563715e-06,
"loss": 0.4976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.492475301027298,
"step": 40,
"valid_targets_mean": 5954.6,
"valid_targets_min": 583
},
{
"epoch": 0.0680786686838124,
"grad_norm": 1.4394911122910266,
"learning_rate": 3.801295896328294e-06,
"loss": 0.4597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5117167234420776,
"step": 45,
"valid_targets_mean": 4686.0,
"valid_targets_min": 610
},
{
"epoch": 0.07564296520423601,
"grad_norm": 1.1660007728840187,
"learning_rate": 4.233261339092873e-06,
"loss": 0.456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4414580464363098,
"step": 50,
"valid_targets_mean": 4432.8,
"valid_targets_min": 710
},
{
"epoch": 0.0832072617246596,
"grad_norm": 1.0994270688976955,
"learning_rate": 4.665226781857452e-06,
"loss": 0.4252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5082100629806519,
"step": 55,
"valid_targets_mean": 4157.1,
"valid_targets_min": 620
},
{
"epoch": 0.0907715582450832,
"grad_norm": 0.8284788849012524,
"learning_rate": 5.09719222462203e-06,
"loss": 0.4232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44552695751190186,
"step": 60,
"valid_targets_mean": 4501.6,
"valid_targets_min": 705
},
{
"epoch": 0.09833585476550681,
"grad_norm": 0.6310211132039384,
"learning_rate": 5.52915766738661e-06,
"loss": 0.3835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3460736572742462,
"step": 65,
"valid_targets_mean": 4682.3,
"valid_targets_min": 342
},
{
"epoch": 0.1059001512859304,
"grad_norm": 0.6177628509419143,
"learning_rate": 5.961123110151188e-06,
"loss": 0.3921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38838571310043335,
"step": 70,
"valid_targets_mean": 5989.1,
"valid_targets_min": 1412
},
{
"epoch": 0.11346444780635401,
"grad_norm": 0.6780059407854138,
"learning_rate": 6.393088552915767e-06,
"loss": 0.3815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3895452618598938,
"step": 75,
"valid_targets_mean": 4225.5,
"valid_targets_min": 391
},
{
"epoch": 0.12102874432677761,
"grad_norm": 0.5643766880346435,
"learning_rate": 6.825053995680346e-06,
"loss": 0.3558,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3587391972541809,
"step": 80,
"valid_targets_mean": 5413.6,
"valid_targets_min": 559
},
{
"epoch": 0.12859304084720122,
"grad_norm": 0.9090969514772852,
"learning_rate": 7.257019438444926e-06,
"loss": 0.3704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3452695310115814,
"step": 85,
"valid_targets_mean": 4190.5,
"valid_targets_min": 561
},
{
"epoch": 0.1361573373676248,
"grad_norm": 0.5075113193939108,
"learning_rate": 7.688984881209504e-06,
"loss": 0.3446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3218182325363159,
"step": 90,
"valid_targets_mean": 5132.1,
"valid_targets_min": 821
},
{
"epoch": 0.1437216338880484,
"grad_norm": 0.4582977864357091,
"learning_rate": 8.120950323974082e-06,
"loss": 0.3514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3215479254722595,
"step": 95,
"valid_targets_mean": 6527.9,
"valid_targets_min": 629
},
{
"epoch": 0.15128593040847202,
"grad_norm": 0.48765027679444184,
"learning_rate": 8.552915766738662e-06,
"loss": 0.3573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33919212222099304,
"step": 100,
"valid_targets_mean": 5894.4,
"valid_targets_min": 1048
},
{
"epoch": 0.1588502269288956,
"grad_norm": 0.6167067050085139,
"learning_rate": 8.98488120950324e-06,
"loss": 0.347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3706921935081482,
"step": 105,
"valid_targets_mean": 4482.9,
"valid_targets_min": 571
},
{
"epoch": 0.1664145234493192,
"grad_norm": 0.5778398632077648,
"learning_rate": 9.41684665226782e-06,
"loss": 0.3286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3193400502204895,
"step": 110,
"valid_targets_mean": 5415.0,
"valid_targets_min": 1665
},
{
"epoch": 0.17397881996974282,
"grad_norm": 0.5647079800698889,
"learning_rate": 9.848812095032398e-06,
"loss": 0.3556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3541482090950012,
"step": 115,
"valid_targets_mean": 5123.8,
"valid_targets_min": 1269
},
{
"epoch": 0.1815431164901664,
"grad_norm": 0.5820680453553746,
"learning_rate": 1.0280777537796978e-05,
"loss": 0.3176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30285853147506714,
"step": 120,
"valid_targets_mean": 4204.3,
"valid_targets_min": 556
},
{
"epoch": 0.18910741301059,
"grad_norm": 0.47973201670838,
"learning_rate": 1.0712742980561557e-05,
"loss": 0.3178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3058018088340759,
"step": 125,
"valid_targets_mean": 5260.8,
"valid_targets_min": 868
},
{
"epoch": 0.19667170953101362,
"grad_norm": 0.5518953360121684,
"learning_rate": 1.1144708423326134e-05,
"loss": 0.3187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3173016905784607,
"step": 130,
"valid_targets_mean": 5620.1,
"valid_targets_min": 2169
},
{
"epoch": 0.2042360060514372,
"grad_norm": 0.5717143166242276,
"learning_rate": 1.1576673866090712e-05,
"loss": 0.3236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35504987835884094,
"step": 135,
"valid_targets_mean": 5265.2,
"valid_targets_min": 785
},
{
"epoch": 0.2118003025718608,
"grad_norm": 0.47865096065818147,
"learning_rate": 1.2008639308855293e-05,
"loss": 0.2921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2680158019065857,
"step": 140,
"valid_targets_mean": 5838.5,
"valid_targets_min": 2352
},
{
"epoch": 0.21936459909228442,
"grad_norm": 0.5085856003812484,
"learning_rate": 1.2440604751619871e-05,
"loss": 0.2999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3085848391056061,
"step": 145,
"valid_targets_mean": 4785.6,
"valid_targets_min": 653
},
{
"epoch": 0.22692889561270801,
"grad_norm": 0.5716698549308541,
"learning_rate": 1.287257019438445e-05,
"loss": 0.2984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28182756900787354,
"step": 150,
"valid_targets_mean": 4273.5,
"valid_targets_min": 825
},
{
"epoch": 0.2344931921331316,
"grad_norm": 0.5245334119291116,
"learning_rate": 1.330453563714903e-05,
"loss": 0.2842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.264009952545166,
"step": 155,
"valid_targets_mean": 4866.6,
"valid_targets_min": 467
},
{
"epoch": 0.24205748865355523,
"grad_norm": 0.4935476283105332,
"learning_rate": 1.3736501079913609e-05,
"loss": 0.2967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28478801250457764,
"step": 160,
"valid_targets_mean": 5374.4,
"valid_targets_min": 2048
},
{
"epoch": 0.24962178517397882,
"grad_norm": 0.49385239011355125,
"learning_rate": 1.4168466522678186e-05,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3246859908103943,
"step": 165,
"valid_targets_mean": 6078.2,
"valid_targets_min": 1784
},
{
"epoch": 0.25718608169440244,
"grad_norm": 0.5031354977672869,
"learning_rate": 1.4600431965442764e-05,
"loss": 0.2931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2915901839733124,
"step": 170,
"valid_targets_mean": 5410.8,
"valid_targets_min": 1914
},
{
"epoch": 0.264750378214826,
"grad_norm": 0.5743132892962913,
"learning_rate": 1.5032397408207345e-05,
"loss": 0.286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3496958315372467,
"step": 175,
"valid_targets_mean": 4596.1,
"valid_targets_min": 747
},
{
"epoch": 0.2723146747352496,
"grad_norm": 0.6417430609782164,
"learning_rate": 1.5464362850971925e-05,
"loss": 0.2873,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27849793434143066,
"step": 180,
"valid_targets_mean": 4129.8,
"valid_targets_min": 711
},
{
"epoch": 0.27987897125567324,
"grad_norm": 0.5525787543900736,
"learning_rate": 1.5896328293736503e-05,
"loss": 0.2809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27930599451065063,
"step": 185,
"valid_targets_mean": 5218.1,
"valid_targets_min": 2197
},
{
"epoch": 0.2874432677760968,
"grad_norm": 0.5887797757799174,
"learning_rate": 1.6328293736501082e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3260801434516907,
"step": 190,
"valid_targets_mean": 4696.6,
"valid_targets_min": 1128
},
{
"epoch": 0.2950075642965204,
"grad_norm": 0.5611439547047103,
"learning_rate": 1.676025917926566e-05,
"loss": 0.2916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26734042167663574,
"step": 195,
"valid_targets_mean": 5061.5,
"valid_targets_min": 594
},
{
"epoch": 0.30257186081694404,
"grad_norm": 0.8142320877951509,
"learning_rate": 1.719222462203024e-05,
"loss": 0.2739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2744123935699463,
"step": 200,
"valid_targets_mean": 4981.4,
"valid_targets_min": 2432
},
{
"epoch": 0.3101361573373676,
"grad_norm": 0.5453776678521185,
"learning_rate": 1.7624190064794818e-05,
"loss": 0.2814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2693478465080261,
"step": 205,
"valid_targets_mean": 4538.8,
"valid_targets_min": 2627
},
{
"epoch": 0.3177004538577912,
"grad_norm": 0.572823640761258,
"learning_rate": 1.8056155507559396e-05,
"loss": 0.2758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24936965107917786,
"step": 210,
"valid_targets_mean": 4717.1,
"valid_targets_min": 1796
},
{
"epoch": 0.32526475037821484,
"grad_norm": 0.48857192086223755,
"learning_rate": 1.8488120950323975e-05,
"loss": 0.2703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27971357107162476,
"step": 215,
"valid_targets_mean": 5259.7,
"valid_targets_min": 2080
},
{
"epoch": 0.3328290468986384,
"grad_norm": 0.5832326533648584,
"learning_rate": 1.8920086393088553e-05,
"loss": 0.2682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2944541871547699,
"step": 220,
"valid_targets_mean": 5435.7,
"valid_targets_min": 622
},
{
"epoch": 0.340393343419062,
"grad_norm": 0.5304901414198607,
"learning_rate": 1.9352051835853135e-05,
"loss": 0.276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2581842541694641,
"step": 225,
"valid_targets_mean": 5475.9,
"valid_targets_min": 1850
},
{
"epoch": 0.34795763993948564,
"grad_norm": 0.5584973891534915,
"learning_rate": 1.9784017278617714e-05,
"loss": 0.2647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2856540381908417,
"step": 230,
"valid_targets_mean": 5040.7,
"valid_targets_min": 837
},
{
"epoch": 0.3555219364599092,
"grad_norm": 0.7615559789848529,
"learning_rate": 2.021598272138229e-05,
"loss": 0.2762,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27540600299835205,
"step": 235,
"valid_targets_mean": 4862.9,
"valid_targets_min": 921
},
{
"epoch": 0.3630862329803328,
"grad_norm": 0.5494333839539911,
"learning_rate": 2.064794816414687e-05,
"loss": 0.2627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25492146611213684,
"step": 240,
"valid_targets_mean": 4764.6,
"valid_targets_min": 1899
},
{
"epoch": 0.37065052950075644,
"grad_norm": 0.5675208041808972,
"learning_rate": 2.107991360691145e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30120372772216797,
"step": 245,
"valid_targets_mean": 4816.8,
"valid_targets_min": 496
},
{
"epoch": 0.37821482602118,
"grad_norm": 0.5516462624650181,
"learning_rate": 2.1511879049676025e-05,
"loss": 0.2668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2463807463645935,
"step": 250,
"valid_targets_mean": 4821.3,
"valid_targets_min": 892
},
{
"epoch": 0.3857791225416036,
"grad_norm": 0.5808471847669502,
"learning_rate": 2.1943844492440607e-05,
"loss": 0.2605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25385603308677673,
"step": 255,
"valid_targets_mean": 4108.7,
"valid_targets_min": 697
},
{
"epoch": 0.39334341906202724,
"grad_norm": 1.3051521187963644,
"learning_rate": 2.2375809935205186e-05,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2327377051115036,
"step": 260,
"valid_targets_mean": 3904.6,
"valid_targets_min": 526
},
{
"epoch": 0.4009077155824508,
"grad_norm": 0.540688473321198,
"learning_rate": 2.2807775377969764e-05,
"loss": 0.2775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2616848945617676,
"step": 265,
"valid_targets_mean": 5200.8,
"valid_targets_min": 723
},
{
"epoch": 0.4084720121028744,
"grad_norm": 0.5572137635803951,
"learning_rate": 2.3239740820734343e-05,
"loss": 0.2678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2894093096256256,
"step": 270,
"valid_targets_mean": 5997.7,
"valid_targets_min": 2741
},
{
"epoch": 0.41603630862329805,
"grad_norm": 0.5219797727194595,
"learning_rate": 2.3671706263498925e-05,
"loss": 0.2585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23676098883152008,
"step": 275,
"valid_targets_mean": 5215.8,
"valid_targets_min": 372
},
{
"epoch": 0.4236006051437216,
"grad_norm": 0.7269531089041338,
"learning_rate": 2.41036717062635e-05,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29276716709136963,
"step": 280,
"valid_targets_mean": 5125.2,
"valid_targets_min": 941
},
{
"epoch": 0.43116490166414523,
"grad_norm": 0.6854032248788718,
"learning_rate": 2.453563714902808e-05,
"loss": 0.2533,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2404939830303192,
"step": 285,
"valid_targets_mean": 4140.1,
"valid_targets_min": 913
},
{
"epoch": 0.43872919818456885,
"grad_norm": 0.5427787800863983,
"learning_rate": 2.496760259179266e-05,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29159748554229736,
"step": 290,
"valid_targets_mean": 5585.8,
"valid_targets_min": 738
},
{
"epoch": 0.4462934947049924,
"grad_norm": 0.6325587088135726,
"learning_rate": 2.5399568034557236e-05,
"loss": 0.2709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24903929233551025,
"step": 295,
"valid_targets_mean": 4124.8,
"valid_targets_min": 760
},
{
"epoch": 0.45385779122541603,
"grad_norm": 0.6302528172341179,
"learning_rate": 2.5831533477321818e-05,
"loss": 0.2546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2755891680717468,
"step": 300,
"valid_targets_mean": 5041.9,
"valid_targets_min": 765
},
{
"epoch": 0.46142208774583965,
"grad_norm": 0.6101680849058813,
"learning_rate": 2.6263498920086393e-05,
"loss": 0.251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23466572165489197,
"step": 305,
"valid_targets_mean": 4039.0,
"valid_targets_min": 1489
},
{
"epoch": 0.4689863842662632,
"grad_norm": 0.5098554824207316,
"learning_rate": 2.6695464362850975e-05,
"loss": 0.2503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24894092977046967,
"step": 310,
"valid_targets_mean": 5165.2,
"valid_targets_min": 543
},
{
"epoch": 0.47655068078668683,
"grad_norm": 0.5153701765469025,
"learning_rate": 2.7127429805615553e-05,
"loss": 0.2987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24448314309120178,
"step": 315,
"valid_targets_mean": 4878.4,
"valid_targets_min": 1165
},
{
"epoch": 0.48411497730711045,
"grad_norm": 0.5150020480544099,
"learning_rate": 2.755939524838013e-05,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24626128375530243,
"step": 320,
"valid_targets_mean": 5491.0,
"valid_targets_min": 2393
},
{
"epoch": 0.491679273827534,
"grad_norm": 0.44779275422444326,
"learning_rate": 2.799136069114471e-05,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25347915291786194,
"step": 325,
"valid_targets_mean": 6012.2,
"valid_targets_min": 1728
},
{
"epoch": 0.49924357034795763,
"grad_norm": 0.5689898293216941,
"learning_rate": 2.842332613390929e-05,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2442246973514557,
"step": 330,
"valid_targets_mean": 5822.6,
"valid_targets_min": 1755
},
{
"epoch": 0.5068078668683812,
"grad_norm": 0.4828012134297725,
"learning_rate": 2.885529157667387e-05,
"loss": 0.2415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22166290879249573,
"step": 335,
"valid_targets_mean": 5591.9,
"valid_targets_min": 2595
},
{
"epoch": 0.5143721633888049,
"grad_norm": 0.5206534739708626,
"learning_rate": 2.9287257019438446e-05,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24545502662658691,
"step": 340,
"valid_targets_mean": 4507.7,
"valid_targets_min": 1277
},
{
"epoch": 0.5219364599092284,
"grad_norm": 0.5375743058233416,
"learning_rate": 2.9719222462203028e-05,
"loss": 0.2387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24855747818946838,
"step": 345,
"valid_targets_mean": 4502.4,
"valid_targets_min": 706
},
{
"epoch": 0.529500756429652,
"grad_norm": 0.47062515075329686,
"learning_rate": 3.0151187904967603e-05,
"loss": 0.239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23291119933128357,
"step": 350,
"valid_targets_mean": 5619.4,
"valid_targets_min": 729
},
{
"epoch": 0.5370650529500757,
"grad_norm": 0.5065710560218952,
"learning_rate": 3.058315334773218e-05,
"loss": 0.2257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23068980872631073,
"step": 355,
"valid_targets_mean": 5067.8,
"valid_targets_min": 800
},
{
"epoch": 0.5446293494704992,
"grad_norm": 0.6071927129549767,
"learning_rate": 3.101511879049676e-05,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2714073061943054,
"step": 360,
"valid_targets_mean": 4807.8,
"valid_targets_min": 321
},
{
"epoch": 0.5521936459909228,
"grad_norm": 0.5932902639247645,
"learning_rate": 3.144708423326134e-05,
"loss": 0.267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2581622004508972,
"step": 365,
"valid_targets_mean": 4726.7,
"valid_targets_min": 263
},
{
"epoch": 0.5597579425113465,
"grad_norm": 0.5342014246005196,
"learning_rate": 3.1879049676025925e-05,
"loss": 0.2527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28950175642967224,
"step": 370,
"valid_targets_mean": 5759.0,
"valid_targets_min": 736
},
{
"epoch": 0.56732223903177,
"grad_norm": 0.6598267814370526,
"learning_rate": 3.23110151187905e-05,
"loss": 0.2328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23706093430519104,
"step": 375,
"valid_targets_mean": 3705.8,
"valid_targets_min": 511
},
{
"epoch": 0.5748865355521936,
"grad_norm": 0.5781352859246836,
"learning_rate": 3.274298056155508e-05,
"loss": 0.2694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2128780633211136,
"step": 380,
"valid_targets_mean": 4299.5,
"valid_targets_min": 565
},
{
"epoch": 0.5824508320726173,
"grad_norm": 0.5201196925356668,
"learning_rate": 3.317494600431966e-05,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2847621440887451,
"step": 385,
"valid_targets_mean": 5042.4,
"valid_targets_min": 825
},
{
"epoch": 0.5900151285930408,
"grad_norm": 0.571209286797819,
"learning_rate": 3.360691144708423e-05,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.261477530002594,
"step": 390,
"valid_targets_mean": 4204.5,
"valid_targets_min": 831
},
{
"epoch": 0.5975794251134644,
"grad_norm": 0.5703991894869983,
"learning_rate": 3.4038876889848814e-05,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22247353196144104,
"step": 395,
"valid_targets_mean": 4025.1,
"valid_targets_min": 811
},
{
"epoch": 0.6051437216338881,
"grad_norm": 0.5694115354716299,
"learning_rate": 3.447084233261339e-05,
"loss": 0.2407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2540602684020996,
"step": 400,
"valid_targets_mean": 4897.0,
"valid_targets_min": 1926
},
{
"epoch": 0.6127080181543116,
"grad_norm": 0.543873277094909,
"learning_rate": 3.490280777537797e-05,
"loss": 0.2417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2412918210029602,
"step": 405,
"valid_targets_mean": 5347.6,
"valid_targets_min": 2336
},
{
"epoch": 0.6202723146747352,
"grad_norm": 0.5539147349076818,
"learning_rate": 3.533477321814255e-05,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27449312806129456,
"step": 410,
"valid_targets_mean": 4702.8,
"valid_targets_min": 641
},
{
"epoch": 0.6278366111951589,
"grad_norm": 0.5147878532498119,
"learning_rate": 3.5766738660907135e-05,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21562246978282928,
"step": 415,
"valid_targets_mean": 4832.5,
"valid_targets_min": 2092
},
{
"epoch": 0.6354009077155824,
"grad_norm": 0.5550659610309338,
"learning_rate": 3.619870410367171e-05,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23504087328910828,
"step": 420,
"valid_targets_mean": 4465.6,
"valid_targets_min": 643
},
{
"epoch": 0.642965204236006,
"grad_norm": 0.5881025450085932,
"learning_rate": 3.6630669546436286e-05,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2751597464084625,
"step": 425,
"valid_targets_mean": 5010.4,
"valid_targets_min": 575
},
{
"epoch": 0.6505295007564297,
"grad_norm": 0.5850477950512473,
"learning_rate": 3.706263498920087e-05,
"loss": 0.2391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2643757462501526,
"step": 430,
"valid_targets_mean": 4947.0,
"valid_targets_min": 678
},
{
"epoch": 0.6580937972768532,
"grad_norm": 0.8028527221952423,
"learning_rate": 3.749460043196544e-05,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23027735948562622,
"step": 435,
"valid_targets_mean": 4532.6,
"valid_targets_min": 632
},
{
"epoch": 0.6656580937972768,
"grad_norm": 0.5991434210232877,
"learning_rate": 3.7926565874730025e-05,
"loss": 0.233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21481779217720032,
"step": 440,
"valid_targets_mean": 4295.4,
"valid_targets_min": 1930
},
{
"epoch": 0.6732223903177005,
"grad_norm": 0.601475737977575,
"learning_rate": 3.83585313174946e-05,
"loss": 0.2458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2731437683105469,
"step": 445,
"valid_targets_mean": 4081.8,
"valid_targets_min": 789
},
{
"epoch": 0.680786686838124,
"grad_norm": 0.544970754754265,
"learning_rate": 3.879049676025918e-05,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2417784333229065,
"step": 450,
"valid_targets_mean": 4546.8,
"valid_targets_min": 687
},
{
"epoch": 0.6883509833585476,
"grad_norm": 0.5772939399178783,
"learning_rate": 3.9222462203023764e-05,
"loss": 0.2556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23565149307250977,
"step": 455,
"valid_targets_mean": 4297.6,
"valid_targets_min": 662
},
{
"epoch": 0.6959152798789713,
"grad_norm": 0.557273760966465,
"learning_rate": 3.965442764578834e-05,
"loss": 0.2411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23695287108421326,
"step": 460,
"valid_targets_mean": 5605.1,
"valid_targets_min": 478
},
{
"epoch": 0.7034795763993948,
"grad_norm": 0.552751474708773,
"learning_rate": 3.9999994307824485e-05,
"loss": 0.238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23529154062271118,
"step": 465,
"valid_targets_mean": 4646.6,
"valid_targets_min": 843
},
{
"epoch": 0.7110438729198184,
"grad_norm": 0.5778857269434653,
"learning_rate": 3.9999795082021543e-05,
"loss": 0.2698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3176231384277344,
"step": 470,
"valid_targets_mean": 5449.4,
"valid_targets_min": 538
},
{
"epoch": 0.7186081694402421,
"grad_norm": 0.5157110157373845,
"learning_rate": 3.999931125068276e-05,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2607157230377197,
"step": 475,
"valid_targets_mean": 5027.3,
"valid_targets_min": 951
},
{
"epoch": 0.7261724659606656,
"grad_norm": 0.4933102641109027,
"learning_rate": 3.9998542820693246e-05,
"loss": 0.239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20662082731723785,
"step": 480,
"valid_targets_mean": 5754.7,
"valid_targets_min": 635
},
{
"epoch": 0.7337367624810892,
"grad_norm": 0.5426556147022381,
"learning_rate": 3.9997489802988096e-05,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23219190537929535,
"step": 485,
"valid_targets_mean": 4775.2,
"valid_targets_min": 729
},
{
"epoch": 0.7413010590015129,
"grad_norm": 0.4802976906182571,
"learning_rate": 3.9996152212552195e-05,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22934921085834503,
"step": 490,
"valid_targets_mean": 5057.2,
"valid_targets_min": 639
},
{
"epoch": 0.7488653555219364,
"grad_norm": 0.6122232574312276,
"learning_rate": 3.999453006842002e-05,
"loss": 0.2389,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.244462788105011,
"step": 495,
"valid_targets_mean": 4329.6,
"valid_targets_min": 574
},
{
"epoch": 0.75642965204236,
"grad_norm": 0.5032216034650763,
"learning_rate": 3.999262339367536e-05,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25049036741256714,
"step": 500,
"valid_targets_mean": 4904.4,
"valid_targets_min": 1007
},
{
"epoch": 0.7639939485627837,
"grad_norm": 0.6238287961984283,
"learning_rate": 3.9990432215451006e-05,
"loss": 0.2482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26027706265449524,
"step": 505,
"valid_targets_mean": 3938.6,
"valid_targets_min": 639
},
{
"epoch": 0.7715582450832073,
"grad_norm": 0.5535062102674121,
"learning_rate": 3.998795656492836e-05,
"loss": 0.2352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23881468176841736,
"step": 510,
"valid_targets_mean": 4196.7,
"valid_targets_min": 744
},
{
"epoch": 0.7791225416036308,
"grad_norm": 0.4897831464999995,
"learning_rate": 3.998519647733696e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2844647169113159,
"step": 515,
"valid_targets_mean": 6344.6,
"valid_targets_min": 601
},
{
"epoch": 0.7866868381240545,
"grad_norm": 0.5746692133321736,
"learning_rate": 3.998215199195403e-05,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23050951957702637,
"step": 520,
"valid_targets_mean": 4142.7,
"valid_targets_min": 547
},
{
"epoch": 0.794251134644478,
"grad_norm": 0.49159881041487485,
"learning_rate": 3.997882315210388e-05,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2426537573337555,
"step": 525,
"valid_targets_mean": 5857.8,
"valid_targets_min": 1111
},
{
"epoch": 0.8018154311649016,
"grad_norm": 0.4965814246543715,
"learning_rate": 3.997521000515731e-05,
"loss": 0.2327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22411620616912842,
"step": 530,
"valid_targets_mean": 5881.9,
"valid_targets_min": 1661
},
{
"epoch": 0.8093797276853253,
"grad_norm": 0.5557055978474669,
"learning_rate": 3.997131260253092e-05,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25896748900413513,
"step": 535,
"valid_targets_mean": 4466.9,
"valid_targets_min": 592
},
{
"epoch": 0.8169440242057489,
"grad_norm": 0.4931361228707487,
"learning_rate": 3.9967130999686405e-05,
"loss": 0.2356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.249818816781044,
"step": 540,
"valid_targets_mean": 4829.9,
"valid_targets_min": 932
},
{
"epoch": 0.8245083207261724,
"grad_norm": 0.5733474556869196,
"learning_rate": 3.996266525612973e-05,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2596126198768616,
"step": 545,
"valid_targets_mean": 3922.8,
"valid_targets_min": 709
},
{
"epoch": 0.8320726172465961,
"grad_norm": 0.5330244819228089,
"learning_rate": 3.9957915435410334e-05,
"loss": 0.2248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2414190173149109,
"step": 550,
"valid_targets_mean": 5284.2,
"valid_targets_min": 1105
},
{
"epoch": 0.8396369137670197,
"grad_norm": 0.505181937458707,
"learning_rate": 3.995288160512015e-05,
"loss": 0.2424,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21243470907211304,
"step": 555,
"valid_targets_mean": 4745.8,
"valid_targets_min": 684
},
{
"epoch": 0.8472012102874432,
"grad_norm": 0.5379741211579597,
"learning_rate": 3.9947563836892725e-05,
"loss": 0.2237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22850680351257324,
"step": 560,
"valid_targets_mean": 4773.2,
"valid_targets_min": 678
},
{
"epoch": 0.8547655068078669,
"grad_norm": 0.47372136138382365,
"learning_rate": 3.994196220640214e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.245782271027565,
"step": 565,
"valid_targets_mean": 6413.9,
"valid_targets_min": 2439
},
{
"epoch": 0.8623298033282905,
"grad_norm": 0.5036552343967776,
"learning_rate": 3.993607679336197e-05,
"loss": 0.2394,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24518650770187378,
"step": 570,
"valid_targets_mean": 4881.8,
"valid_targets_min": 80
},
{
"epoch": 0.869894099848714,
"grad_norm": 0.4729695754905281,
"learning_rate": 3.992990768152412e-05,
"loss": 0.2385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2571276128292084,
"step": 575,
"valid_targets_mean": 5548.9,
"valid_targets_min": 899
},
{
"epoch": 0.8774583963691377,
"grad_norm": 0.4880547361382435,
"learning_rate": 3.9923454958677676e-05,
"loss": 0.2416,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2370157688856125,
"step": 580,
"valid_targets_mean": 5140.8,
"valid_targets_min": 920
},
{
"epoch": 0.8850226928895613,
"grad_norm": 0.46748870246205226,
"learning_rate": 3.991671871664759e-05,
"loss": 0.2362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22495149075984955,
"step": 585,
"valid_targets_mean": 4875.2,
"valid_targets_min": 710
},
{
"epoch": 0.8925869894099848,
"grad_norm": 0.499170334869546,
"learning_rate": 3.9909699051293455e-05,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2324574738740921,
"step": 590,
"valid_targets_mean": 4126.8,
"valid_targets_min": 672
},
{
"epoch": 0.9001512859304085,
"grad_norm": 0.5367539699554082,
"learning_rate": 3.990239606250805e-05,
"loss": 0.2258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22277456521987915,
"step": 595,
"valid_targets_mean": 4875.0,
"valid_targets_min": 723
},
{
"epoch": 0.9077155824508321,
"grad_norm": 0.46291726470280686,
"learning_rate": 3.989480985421602e-05,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21236249804496765,
"step": 600,
"valid_targets_mean": 5088.1,
"valid_targets_min": 1250
},
{
"epoch": 0.9152798789712556,
"grad_norm": 0.4944239868363532,
"learning_rate": 3.988694053437229e-05,
"loss": 0.2423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2805103063583374,
"step": 605,
"valid_targets_mean": 5184.2,
"valid_targets_min": 686
},
{
"epoch": 0.9228441754916793,
"grad_norm": 0.9200503353718761,
"learning_rate": 3.987878821496062e-05,
"loss": 0.2349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23494309186935425,
"step": 610,
"valid_targets_mean": 4795.9,
"valid_targets_min": 512
},
{
"epoch": 0.9304084720121029,
"grad_norm": 0.45541430053417153,
"learning_rate": 3.9870353011991955e-05,
"loss": 0.2367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.258321613073349,
"step": 615,
"valid_targets_mean": 5087.6,
"valid_targets_min": 708
},
{
"epoch": 0.9379727685325264,
"grad_norm": 0.8707406129846743,
"learning_rate": 3.986163504550281e-05,
"loss": 0.2422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2552441656589508,
"step": 620,
"valid_targets_mean": 3817.4,
"valid_targets_min": 710
},
{
"epoch": 0.9455370650529501,
"grad_norm": 0.453725523450877,
"learning_rate": 3.985263443955351e-05,
"loss": 0.2325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1943071186542511,
"step": 625,
"valid_targets_mean": 4514.4,
"valid_targets_min": 797
},
{
"epoch": 0.9531013615733737,
"grad_norm": 0.4650173033154279,
"learning_rate": 3.9843351322226496e-05,
"loss": 0.2311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25859200954437256,
"step": 630,
"valid_targets_mean": 6504.8,
"valid_targets_min": 776
},
{
"epoch": 0.9606656580937972,
"grad_norm": 0.5183996451091001,
"learning_rate": 3.983378582562446e-05,
"loss": 0.2404,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2556428909301758,
"step": 635,
"valid_targets_mean": 4473.8,
"valid_targets_min": 517
},
{
"epoch": 0.9682299546142209,
"grad_norm": 0.45985350131749686,
"learning_rate": 3.982393808586843e-05,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21027632057666779,
"step": 640,
"valid_targets_mean": 5296.2,
"valid_targets_min": 1148
},
{
"epoch": 0.9757942511346445,
"grad_norm": 0.552817017780005,
"learning_rate": 3.981380824309594e-05,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.233289435505867,
"step": 645,
"valid_targets_mean": 3743.4,
"valid_targets_min": 474
},
{
"epoch": 0.983358547655068,
"grad_norm": 0.43042887165024196,
"learning_rate": 3.9803396441458917e-05,
"loss": 0.2329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21018920838832855,
"step": 650,
"valid_targets_mean": 5031.2,
"valid_targets_min": 1803
},
{
"epoch": 0.9909228441754917,
"grad_norm": 0.48810810379501984,
"learning_rate": 3.979270282912169e-05,
"loss": 0.2345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22822780907154083,
"step": 655,
"valid_targets_mean": 3996.4,
"valid_targets_min": 711
},
{
"epoch": 0.9984871406959153,
"grad_norm": 0.4961721738119889,
"learning_rate": 3.9781727558258896e-05,
"loss": 0.2344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22998680174350739,
"step": 660,
"valid_targets_mean": 4072.9,
"valid_targets_min": 606
},
{
"epoch": 1.006051437216339,
"grad_norm": 0.42967061225570735,
"learning_rate": 3.977047078505327e-05,
"loss": 0.2189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19665825366973877,
"step": 665,
"valid_targets_mean": 4729.6,
"valid_targets_min": 873
},
{
"epoch": 1.0136157337367624,
"grad_norm": 0.4669397363717281,
"learning_rate": 3.975893266969346e-05,
"loss": 0.2187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.242275670170784,
"step": 670,
"valid_targets_mean": 4723.4,
"valid_targets_min": 351
},
{
"epoch": 1.021180030257186,
"grad_norm": 0.5341853659851667,
"learning_rate": 3.9747113376371704e-05,
"loss": 0.2467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24473215639591217,
"step": 675,
"valid_targets_mean": 4814.8,
"valid_targets_min": 628
},
{
"epoch": 1.0287443267776097,
"grad_norm": 0.44043846408793436,
"learning_rate": 3.9735013073281564e-05,
"loss": 0.2249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24138009548187256,
"step": 680,
"valid_targets_mean": 6298.2,
"valid_targets_min": 603
},
{
"epoch": 1.0363086232980332,
"grad_norm": 0.5003817149788394,
"learning_rate": 3.972263193261545e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.201238214969635,
"step": 685,
"valid_targets_mean": 4762.5,
"valid_targets_min": 1345
},
{
"epoch": 1.0438729198184569,
"grad_norm": 0.4523758197633264,
"learning_rate": 3.970997013056224e-05,
"loss": 0.2339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24418559670448303,
"step": 690,
"valid_targets_mean": 6598.0,
"valid_targets_min": 643
},
{
"epoch": 1.0514372163388805,
"grad_norm": 0.4562342522704356,
"learning_rate": 3.969702784730471e-05,
"loss": 0.2258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20137807726860046,
"step": 695,
"valid_targets_mean": 5147.5,
"valid_targets_min": 754
},
{
"epoch": 1.059001512859304,
"grad_norm": 0.5011541733249977,
"learning_rate": 3.9683805267017035e-05,
"loss": 0.2311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20954594016075134,
"step": 700,
"valid_targets_mean": 4591.2,
"valid_targets_min": 632
},
{
"epoch": 1.0665658093797277,
"grad_norm": 0.5176851021286845,
"learning_rate": 3.9670302577862124e-05,
"loss": 0.2202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2231058031320572,
"step": 705,
"valid_targets_mean": 4647.5,
"valid_targets_min": 680
},
{
"epoch": 1.0741301059001513,
"grad_norm": 0.48011232672163284,
"learning_rate": 3.965651997198893e-05,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22521618008613586,
"step": 710,
"valid_targets_mean": 5078.5,
"valid_targets_min": 641
},
{
"epoch": 1.0816944024205748,
"grad_norm": 0.4767421483930465,
"learning_rate": 3.964245764552978e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19617989659309387,
"step": 715,
"valid_targets_mean": 4258.9,
"valid_targets_min": 617
},
{
"epoch": 1.0892586989409985,
"grad_norm": 0.4104761710291779,
"learning_rate": 3.9628115798597505e-05,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21169023215770721,
"step": 720,
"valid_targets_mean": 6263.8,
"valid_targets_min": 1551
},
{
"epoch": 1.0968229954614221,
"grad_norm": 0.578932648769492,
"learning_rate": 3.961349463528266e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22551500797271729,
"step": 725,
"valid_targets_mean": 5194.9,
"valid_targets_min": 662
},
{
"epoch": 1.1043872919818456,
"grad_norm": 0.4523935856836432,
"learning_rate": 3.959859436365057e-05,
"loss": 0.226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21178296208381653,
"step": 730,
"valid_targets_mean": 5042.5,
"valid_targets_min": 574
},
{
"epoch": 1.1119515885022693,
"grad_norm": 0.549130917647338,
"learning_rate": 3.95834151957384e-05,
"loss": 0.2245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2177426964044571,
"step": 735,
"valid_targets_mean": 4108.4,
"valid_targets_min": 791
},
{
"epoch": 1.119515885022693,
"grad_norm": 0.480466921821431,
"learning_rate": 3.956795734755213e-05,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25843045115470886,
"step": 740,
"valid_targets_mean": 5000.5,
"valid_targets_min": 1302
},
{
"epoch": 1.1270801815431164,
"grad_norm": 0.4572027005951852,
"learning_rate": 3.955222103906346e-05,
"loss": 0.2107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19742241501808167,
"step": 745,
"valid_targets_mean": 4523.0,
"valid_targets_min": 538
},
{
"epoch": 1.13464447806354,
"grad_norm": 0.5232066650642148,
"learning_rate": 3.953620649420672e-05,
"loss": 0.2395,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2422420084476471,
"step": 750,
"valid_targets_mean": 5202.1,
"valid_targets_min": 1226
},
{
"epoch": 1.1422087745839637,
"grad_norm": 0.8229962292212416,
"learning_rate": 3.951991394087565e-05,
"loss": 0.2279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25070637464523315,
"step": 755,
"valid_targets_mean": 4194.7,
"valid_targets_min": 660
},
{
"epoch": 1.1497730711043872,
"grad_norm": 0.4391216524045533,
"learning_rate": 3.950334361092016e-05,
"loss": 0.2112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19606730341911316,
"step": 760,
"valid_targets_mean": 4927.8,
"valid_targets_min": 813
},
{
"epoch": 1.1573373676248109,
"grad_norm": 0.4725978644426478,
"learning_rate": 3.948649574014306e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2184830904006958,
"step": 765,
"valid_targets_mean": 4678.1,
"valid_targets_min": 727
},
{
"epoch": 1.1649016641452345,
"grad_norm": 0.47754919190950834,
"learning_rate": 3.946937056829666e-05,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21192710101604462,
"step": 770,
"valid_targets_mean": 4708.8,
"valid_targets_min": 746
},
{
"epoch": 1.172465960665658,
"grad_norm": 0.38443453641184966,
"learning_rate": 3.9451968339079405e-05,
"loss": 0.212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19585570693016052,
"step": 775,
"valid_targets_mean": 6528.1,
"valid_targets_min": 587
},
{
"epoch": 1.1800302571860817,
"grad_norm": 0.8213353673339491,
"learning_rate": 3.9434289300132355e-05,
"loss": 0.2099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24312201142311096,
"step": 780,
"valid_targets_mean": 4561.7,
"valid_targets_min": 578
},
{
"epoch": 1.1875945537065054,
"grad_norm": 0.5298968932603556,
"learning_rate": 3.941633370303572e-05,
"loss": 0.218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21988344192504883,
"step": 785,
"valid_targets_mean": 4631.4,
"valid_targets_min": 943
},
{
"epoch": 1.1951588502269288,
"grad_norm": 0.5091383820044767,
"learning_rate": 3.939810180330523e-05,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20156526565551758,
"step": 790,
"valid_targets_mean": 4222.6,
"valid_targets_min": 653
},
{
"epoch": 1.2027231467473525,
"grad_norm": 0.4445758252408178,
"learning_rate": 3.9379593860388515e-05,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23469144105911255,
"step": 795,
"valid_targets_mean": 5451.9,
"valid_targets_min": 2175
},
{
"epoch": 1.2102874432677762,
"grad_norm": 0.463702459884302,
"learning_rate": 3.936081013766143e-05,
"loss": 0.2098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20840583741664886,
"step": 800,
"valid_targets_mean": 4844.2,
"valid_targets_min": 914
},
{
"epoch": 1.2178517397881996,
"grad_norm": 0.4949026215273616,
"learning_rate": 3.9341750902424294e-05,
"loss": 0.215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22504504024982452,
"step": 805,
"valid_targets_mean": 4049.9,
"valid_targets_min": 729
},
{
"epoch": 1.2254160363086233,
"grad_norm": 0.45408544850056803,
"learning_rate": 3.932241642589807e-05,
"loss": 0.2197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18734216690063477,
"step": 810,
"valid_targets_mean": 5329.8,
"valid_targets_min": 674
},
{
"epoch": 1.232980332829047,
"grad_norm": 0.5377546774189591,
"learning_rate": 3.930280698322053e-05,
"loss": 0.2448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2399473488330841,
"step": 815,
"valid_targets_mean": 4738.1,
"valid_targets_min": 699
},
{
"epoch": 1.2405446293494704,
"grad_norm": 0.5558393542261922,
"learning_rate": 3.928292285344234e-05,
"loss": 0.2242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24337920546531677,
"step": 820,
"valid_targets_mean": 4106.7,
"valid_targets_min": 482
},
{
"epoch": 1.248108925869894,
"grad_norm": 0.4955456861000246,
"learning_rate": 3.926276431952306e-05,
"loss": 0.2253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22561465203762054,
"step": 825,
"valid_targets_mean": 5400.7,
"valid_targets_min": 1936
},
{
"epoch": 1.2556732223903178,
"grad_norm": 0.5418907911165872,
"learning_rate": 3.924233166832714e-05,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22385621070861816,
"step": 830,
"valid_targets_mean": 4220.5,
"valid_targets_min": 695
},
{
"epoch": 1.2632375189107412,
"grad_norm": 0.8088318043473532,
"learning_rate": 3.922162519061986e-05,
"loss": 0.2113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1984093189239502,
"step": 835,
"valid_targets_mean": 6244.4,
"valid_targets_min": 2041
},
{
"epoch": 1.2708018154311649,
"grad_norm": 0.4634253765330138,
"learning_rate": 3.920064518106313e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20426660776138306,
"step": 840,
"valid_targets_mean": 4512.1,
"valid_targets_min": 515
},
{
"epoch": 1.2783661119515886,
"grad_norm": 0.5244110379217045,
"learning_rate": 3.917939193821136e-05,
"loss": 0.209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22082944214344025,
"step": 845,
"valid_targets_mean": 4429.2,
"valid_targets_min": 717
},
{
"epoch": 1.2859304084720122,
"grad_norm": 0.43483407663968293,
"learning_rate": 3.915786576450719e-05,
"loss": 0.2124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18737539649009705,
"step": 850,
"valid_targets_mean": 5059.6,
"valid_targets_min": 2458
},
{
"epoch": 1.2934947049924357,
"grad_norm": 0.4500103073766876,
"learning_rate": 3.913606696627715e-05,
"loss": 0.2105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1978236436843872,
"step": 855,
"valid_targets_mean": 4524.5,
"valid_targets_min": 823
},
{
"epoch": 1.3010590015128594,
"grad_norm": 0.43028683215121355,
"learning_rate": 3.911399585372735e-05,
"loss": 0.2097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20554819703102112,
"step": 860,
"valid_targets_mean": 5189.1,
"valid_targets_min": 610
},
{
"epoch": 1.3086232980332828,
"grad_norm": 0.47627559033509903,
"learning_rate": 3.909165274093906e-05,
"loss": 0.2088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21493449807167053,
"step": 865,
"valid_targets_mean": 4325.8,
"valid_targets_min": 781
},
{
"epoch": 1.3161875945537065,
"grad_norm": 0.44911088564844376,
"learning_rate": 3.906903794586422e-05,
"loss": 0.2181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21005885303020477,
"step": 870,
"valid_targets_mean": 6040.7,
"valid_targets_min": 981
},
{
"epoch": 1.3237518910741302,
"grad_norm": 0.47753214474506056,
"learning_rate": 3.9046151790320905e-05,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.218666210770607,
"step": 875,
"valid_targets_mean": 4738.8,
"valid_targets_min": 725
},
{
"epoch": 1.3313161875945538,
"grad_norm": 0.43454590648723285,
"learning_rate": 3.902299459998879e-05,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18541982769966125,
"step": 880,
"valid_targets_mean": 5201.4,
"valid_targets_min": 2448
},
{
"epoch": 1.3388804841149773,
"grad_norm": 0.5156990006182292,
"learning_rate": 3.8999566704404476e-05,
"loss": 0.2249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2260858565568924,
"step": 885,
"valid_targets_mean": 4169.7,
"valid_targets_min": 662
},
{
"epoch": 1.346444780635401,
"grad_norm": 0.4731314327931749,
"learning_rate": 3.8975868436956826e-05,
"loss": 0.2134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21620869636535645,
"step": 890,
"valid_targets_mean": 4723.3,
"valid_targets_min": 696
},
{
"epoch": 1.3540090771558244,
"grad_norm": 0.5539722000570312,
"learning_rate": 3.895190013488219e-05,
"loss": 0.218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23198354244232178,
"step": 895,
"valid_targets_mean": 4731.4,
"valid_targets_min": 819
},
{
"epoch": 1.361573373676248,
"grad_norm": 0.5363884689933821,
"learning_rate": 3.892766213925965e-05,
"loss": 0.2092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21815639734268188,
"step": 900,
"valid_targets_mean": 3884.6,
"valid_targets_min": 512
},
{
"epoch": 1.3691376701966718,
"grad_norm": 0.46987778063844016,
"learning_rate": 3.890315479500611e-05,
"loss": 0.2161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2229079008102417,
"step": 905,
"valid_targets_mean": 5161.0,
"valid_targets_min": 888
},
{
"epoch": 1.3767019667170954,
"grad_norm": 0.44993849954248105,
"learning_rate": 3.887837845087144e-05,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28664612770080566,
"step": 910,
"valid_targets_mean": 6543.5,
"valid_targets_min": 714
},
{
"epoch": 1.384266263237519,
"grad_norm": 0.43051713745825515,
"learning_rate": 3.885333345943349e-05,
"loss": 0.2269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19189190864562988,
"step": 915,
"valid_targets_mean": 4741.1,
"valid_targets_min": 594
},
{
"epoch": 1.3918305597579426,
"grad_norm": 0.4805693823287516,
"learning_rate": 3.882802017709307e-05,
"loss": 0.2101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2096354365348816,
"step": 920,
"valid_targets_mean": 5091.5,
"valid_targets_min": 639
},
{
"epoch": 1.399394856278366,
"grad_norm": 0.44999557297889736,
"learning_rate": 3.880243896406889e-05,
"loss": 0.2274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22826901078224182,
"step": 925,
"valid_targets_mean": 6125.1,
"valid_targets_min": 1021
},
{
"epoch": 1.4069591527987897,
"grad_norm": 0.6717221286999777,
"learning_rate": 3.877659018439242e-05,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20602205395698547,
"step": 930,
"valid_targets_mean": 4478.8,
"valid_targets_min": 873
},
{
"epoch": 1.4145234493192134,
"grad_norm": 0.5169880935134787,
"learning_rate": 3.8750474205902715e-05,
"loss": 0.2193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23473864793777466,
"step": 935,
"valid_targets_mean": 4604.6,
"valid_targets_min": 584
},
{
"epoch": 1.422087745839637,
"grad_norm": 0.5143284382260722,
"learning_rate": 3.872409140024119e-05,
"loss": 0.2306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2324678599834442,
"step": 940,
"valid_targets_mean": 4128.6,
"valid_targets_min": 553
},
{
"epoch": 1.4296520423600605,
"grad_norm": 0.4971476793353403,
"learning_rate": 3.8697442142846314e-05,
"loss": 0.2213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23143915832042694,
"step": 945,
"valid_targets_mean": 4315.7,
"valid_targets_min": 576
},
{
"epoch": 1.4372163388804842,
"grad_norm": 0.4666851291643823,
"learning_rate": 3.867052681294828e-05,
"loss": 0.216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21455539762973785,
"step": 950,
"valid_targets_mean": 4984.6,
"valid_targets_min": 1899
},
{
"epoch": 1.4447806354009076,
"grad_norm": 0.46105558167163246,
"learning_rate": 3.8643345793563606e-05,
"loss": 0.2192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19814419746398926,
"step": 955,
"valid_targets_mean": 5288.9,
"valid_targets_min": 474
},
{
"epoch": 1.4523449319213313,
"grad_norm": 0.48073898579476537,
"learning_rate": 3.86158994714897e-05,
"loss": 0.2254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22171683609485626,
"step": 960,
"valid_targets_mean": 4704.9,
"valid_targets_min": 692
},
{
"epoch": 1.459909228441755,
"grad_norm": 0.6948950979765578,
"learning_rate": 3.858818823729931e-05,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23459002375602722,
"step": 965,
"valid_targets_mean": 4975.9,
"valid_targets_min": 644
},
{
"epoch": 1.4674735249621786,
"grad_norm": 0.46636381876975636,
"learning_rate": 3.856021248533501e-05,
"loss": 0.2138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2228977084159851,
"step": 970,
"valid_targets_mean": 5289.2,
"valid_targets_min": 761
},
{
"epoch": 1.475037821482602,
"grad_norm": 0.4797474742441079,
"learning_rate": 3.853197261370357e-05,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23371240496635437,
"step": 975,
"valid_targets_mean": 4752.7,
"valid_targets_min": 602
},
{
"epoch": 1.4826021180030258,
"grad_norm": 0.4546404058434165,
"learning_rate": 3.850346902427031e-05,
"loss": 0.226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20179343223571777,
"step": 980,
"valid_targets_mean": 4409.6,
"valid_targets_min": 1001
},
{
"epoch": 1.4901664145234492,
"grad_norm": 0.4436841609266024,
"learning_rate": 3.847470212265334e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16983595490455627,
"step": 985,
"valid_targets_mean": 4392.0,
"valid_targets_min": 478
},
{
"epoch": 1.497730711043873,
"grad_norm": 0.5042058235443482,
"learning_rate": 3.844567231821784e-05,
"loss": 0.2122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23303237557411194,
"step": 990,
"valid_targets_mean": 4484.5,
"valid_targets_min": 461
},
{
"epoch": 1.5052950075642966,
"grad_norm": 0.5004283160780041,
"learning_rate": 3.8416380024070175e-05,
"loss": 0.2096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2369617521762848,
"step": 995,
"valid_targets_mean": 5191.1,
"valid_targets_min": 565
},
{
"epoch": 1.5128593040847202,
"grad_norm": 0.4692148393457612,
"learning_rate": 3.838682565705209e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20685143768787384,
"step": 1000,
"valid_targets_mean": 4244.8,
"valid_targets_min": 1197
},
{
"epoch": 1.5204236006051437,
"grad_norm": 0.47144086137537927,
"learning_rate": 3.83570096377347e-05,
"loss": 0.2133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22664126753807068,
"step": 1005,
"valid_targets_mean": 4241.9,
"valid_targets_min": 534
},
{
"epoch": 1.5279878971255674,
"grad_norm": 0.47989912387325484,
"learning_rate": 3.8326932390412584e-05,
"loss": 0.2129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2084951400756836,
"step": 1010,
"valid_targets_mean": 5305.8,
"valid_targets_min": 1825
},
{
"epoch": 1.5355521936459908,
"grad_norm": 0.43046270561239386,
"learning_rate": 3.829659434309765e-05,
"loss": 0.2098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23686754703521729,
"step": 1015,
"valid_targets_mean": 5570.4,
"valid_targets_min": 1879
},
{
"epoch": 1.5431164901664145,
"grad_norm": 0.44060406935360946,
"learning_rate": 3.8265995927513155e-05,
"loss": 0.2165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.209512859582901,
"step": 1020,
"valid_targets_mean": 4430.0,
"valid_targets_min": 797
},
{
"epoch": 1.5506807866868382,
"grad_norm": 0.4466657762243492,
"learning_rate": 3.823513757908748e-05,
"loss": 0.2197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21596594154834747,
"step": 1025,
"valid_targets_mean": 5183.5,
"valid_targets_min": 2442
},
{
"epoch": 1.5582450832072618,
"grad_norm": 0.4485453853157434,
"learning_rate": 3.820401973694796e-05,
"loss": 0.2169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19774681329727173,
"step": 1030,
"valid_targets_mean": 4629.1,
"valid_targets_min": 1966
},
{
"epoch": 1.5658093797276853,
"grad_norm": 0.4594903967129758,
"learning_rate": 3.817264284391464e-05,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2078075408935547,
"step": 1035,
"valid_targets_mean": 4402.6,
"valid_targets_min": 702
},
{
"epoch": 1.573373676248109,
"grad_norm": 0.474824847270428,
"learning_rate": 3.8141007346493964e-05,
"loss": 0.2141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20694419741630554,
"step": 1040,
"valid_targets_mean": 3961.7,
"valid_targets_min": 615
},
{
"epoch": 1.5809379727685324,
"grad_norm": 0.49033992895453127,
"learning_rate": 3.8109113694872436e-05,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20570620894432068,
"step": 1045,
"valid_targets_mean": 5230.1,
"valid_targets_min": 917
},
{
"epoch": 1.588502269288956,
"grad_norm": 0.4305573822598727,
"learning_rate": 3.80769623429102e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1743043065071106,
"step": 1050,
"valid_targets_mean": 4900.6,
"valid_targets_min": 2108
},
{
"epoch": 1.5960665658093798,
"grad_norm": 0.4002556203162745,
"learning_rate": 3.804455374813456e-05,
"loss": 0.2135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20624500513076782,
"step": 1055,
"valid_targets_mean": 5544.1,
"valid_targets_min": 831
},
{
"epoch": 1.6036308623298035,
"grad_norm": 0.46098253527478694,
"learning_rate": 3.8011888371733536e-05,
"loss": 0.2168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21792328357696533,
"step": 1060,
"valid_targets_mean": 4735.6,
"valid_targets_min": 709
},
{
"epoch": 1.611195158850227,
"grad_norm": 0.4323494824069755,
"learning_rate": 3.797896667854924e-05,
"loss": 0.2126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21409177780151367,
"step": 1065,
"valid_targets_mean": 5365.8,
"valid_targets_min": 1040
},
{
"epoch": 1.6187594553706506,
"grad_norm": 0.48091408016876297,
"learning_rate": 3.7945789137071264e-05,
"loss": 0.2302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22255632281303406,
"step": 1070,
"valid_targets_mean": 5012.9,
"valid_targets_min": 167
},
{
"epoch": 1.626323751891074,
"grad_norm": 0.5061657168291416,
"learning_rate": 3.791235621943005e-05,
"loss": 0.2022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23962201178073883,
"step": 1075,
"valid_targets_mean": 4036.9,
"valid_targets_min": 541
},
{
"epoch": 1.6338880484114977,
"grad_norm": 0.5930611198562358,
"learning_rate": 3.7878668401390157e-05,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27482351660728455,
"step": 1080,
"valid_targets_mean": 2996.6,
"valid_targets_min": 535
},
{
"epoch": 1.6414523449319214,
"grad_norm": 0.49753058500461794,
"learning_rate": 3.784472616234345e-05,
"loss": 0.2269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21738803386688232,
"step": 1085,
"valid_targets_mean": 3911.5,
"valid_targets_min": 492
},
{
"epoch": 1.649016641452345,
"grad_norm": 0.40647299631956285,
"learning_rate": 3.7810529985302354e-05,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23166729509830475,
"step": 1090,
"valid_targets_mean": 5627.1,
"valid_targets_min": 701
},
{
"epoch": 1.6565809379727685,
"grad_norm": 0.4505033940645788,
"learning_rate": 3.77760803568929e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.185359388589859,
"step": 1095,
"valid_targets_mean": 4292.2,
"valid_targets_min": 631
},
{
"epoch": 1.6641452344931922,
"grad_norm": 0.5731571126335391,
"learning_rate": 3.774137776734788e-05,
"loss": 0.2074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23054252564907074,
"step": 1100,
"valid_targets_mean": 4484.4,
"valid_targets_min": 821
},
{
"epoch": 1.6717095310136156,
"grad_norm": 0.4784802801846398,
"learning_rate": 3.770642271049979e-05,
"loss": 0.2067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2124379724264145,
"step": 1105,
"valid_targets_mean": 4393.8,
"valid_targets_min": 775
},
{
"epoch": 1.6792738275340393,
"grad_norm": 0.5134935440685385,
"learning_rate": 3.767121568377387e-05,
"loss": 0.2341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21781983971595764,
"step": 1110,
"valid_targets_mean": 4165.0,
"valid_targets_min": 432
},
{
"epoch": 1.686838124054463,
"grad_norm": 0.47819089354766536,
"learning_rate": 3.763575718818099e-05,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2285154014825821,
"step": 1115,
"valid_targets_mean": 4118.8,
"valid_targets_min": 841
},
{
"epoch": 1.6944024205748867,
"grad_norm": 0.4468206203889348,
"learning_rate": 3.760004772831052e-05,
"loss": 0.2187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25908660888671875,
"step": 1120,
"valid_targets_mean": 4985.1,
"valid_targets_min": 627
},
{
"epoch": 1.70196671709531,
"grad_norm": 0.5621098040132918,
"learning_rate": 3.7564087812323176e-05,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21479949355125427,
"step": 1125,
"valid_targets_mean": 3941.1,
"valid_targets_min": 640
},
{
"epoch": 1.7095310136157338,
"grad_norm": 0.47379514306217524,
"learning_rate": 3.7527877951943745e-05,
"loss": 0.2142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2008206844329834,
"step": 1130,
"valid_targets_mean": 4877.2,
"valid_targets_min": 635
},
{
"epoch": 1.7170953101361572,
"grad_norm": 0.4138650914953261,
"learning_rate": 3.749141866245385e-05,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23996658623218536,
"step": 1135,
"valid_targets_mean": 5840.4,
"valid_targets_min": 3031
},
{
"epoch": 1.724659606656581,
"grad_norm": 0.45004503636425675,
"learning_rate": 3.745471046268459e-05,
"loss": 0.2063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2210957556962967,
"step": 1140,
"valid_targets_mean": 5032.8,
"valid_targets_min": 778
},
{
"epoch": 1.7322239031770046,
"grad_norm": 0.45471390290097,
"learning_rate": 3.7417753875009156e-05,
"loss": 0.1975,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19280803203582764,
"step": 1145,
"valid_targets_mean": 4949.8,
"valid_targets_min": 665
},
{
"epoch": 1.7397881996974283,
"grad_norm": 0.419924001810217,
"learning_rate": 3.738054942533541e-05,
"loss": 0.213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2240639328956604,
"step": 1150,
"valid_targets_mean": 6157.3,
"valid_targets_min": 1996
},
{
"epoch": 1.7473524962178517,
"grad_norm": 0.4040114013155955,
"learning_rate": 3.734309764309839e-05,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19116798043251038,
"step": 1155,
"valid_targets_mean": 5477.1,
"valid_targets_min": 533
},
{
"epoch": 1.7549167927382754,
"grad_norm": 0.44527208272245994,
"learning_rate": 3.7305399061252795e-05,
"loss": 0.2136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21052294969558716,
"step": 1160,
"valid_targets_mean": 5120.7,
"valid_targets_min": 2604
},
{
"epoch": 1.7624810892586988,
"grad_norm": 0.47454028755125877,
"learning_rate": 3.726745421626537e-05,
"loss": 0.208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18771414458751678,
"step": 1165,
"valid_targets_mean": 3559.8,
"valid_targets_min": 745
},
{
"epoch": 1.7700453857791225,
"grad_norm": 0.43637966175679893,
"learning_rate": 3.7229263648107285e-05,
"loss": 0.2329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21924227476119995,
"step": 1170,
"valid_targets_mean": 5584.8,
"valid_targets_min": 730
},
{
"epoch": 1.7776096822995462,
"grad_norm": 0.48512408703189136,
"learning_rate": 3.7190827900246474e-05,
"loss": 0.235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2824190557003021,
"step": 1175,
"valid_targets_mean": 4822.8,
"valid_targets_min": 324
},
{
"epoch": 1.7851739788199699,
"grad_norm": 0.4085379036791164,
"learning_rate": 3.715214751963987e-05,
"loss": 0.2121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20510166883468628,
"step": 1180,
"valid_targets_mean": 5139.8,
"valid_targets_min": 654
},
{
"epoch": 1.7927382753403933,
"grad_norm": 0.4729236016827413,
"learning_rate": 3.711322305672563e-05,
"loss": 0.2095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20955510437488556,
"step": 1185,
"valid_targets_mean": 5596.6,
"valid_targets_min": 518
},
{
"epoch": 1.800302571860817,
"grad_norm": 0.48668657427380835,
"learning_rate": 3.707405506541532e-05,
"loss": 0.2362,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.318617582321167,
"step": 1190,
"valid_targets_mean": 6068.5,
"valid_targets_min": 1636
},
{
"epoch": 1.8078668683812404,
"grad_norm": 0.4638826690530358,
"learning_rate": 3.703464410308601e-05,
"loss": 0.1973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20980286598205566,
"step": 1195,
"valid_targets_mean": 5101.1,
"valid_targets_min": 582
},
{
"epoch": 1.8154311649016641,
"grad_norm": 0.45348458053897023,
"learning_rate": 3.699499073057234e-05,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22972343862056732,
"step": 1200,
"valid_targets_mean": 5133.1,
"valid_targets_min": 580
},
{
"epoch": 1.8229954614220878,
"grad_norm": 0.46690448724128925,
"learning_rate": 3.6955095512158554e-05,
"loss": 0.2027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20475982129573822,
"step": 1205,
"valid_targets_mean": 4050.1,
"valid_targets_min": 263
},
{
"epoch": 1.8305597579425115,
"grad_norm": 0.38598946854284577,
"learning_rate": 3.691495901557048e-05,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.191079780459404,
"step": 1210,
"valid_targets_mean": 5022.6,
"valid_targets_min": 831
},
{
"epoch": 1.838124054462935,
"grad_norm": 0.4758287501019245,
"learning_rate": 3.6874581811967425e-05,
"loss": 0.2154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2127455770969391,
"step": 1215,
"valid_targets_mean": 4499.1,
"valid_targets_min": 1004
},
{
"epoch": 1.8456883509833586,
"grad_norm": 0.5274867081099741,
"learning_rate": 3.683396447593406e-05,
"loss": 0.2164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23229683935642242,
"step": 1220,
"valid_targets_mean": 3733.7,
"valid_targets_min": 620
},
{
"epoch": 1.853252647503782,
"grad_norm": 0.5325193798816835,
"learning_rate": 3.6793107585472234e-05,
"loss": 0.2171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18608064949512482,
"step": 1225,
"valid_targets_mean": 4011.7,
"valid_targets_min": 651
},
{
"epoch": 1.8608169440242057,
"grad_norm": 0.4796697965319729,
"learning_rate": 3.675201172199277e-05,
"loss": 0.202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21180656552314758,
"step": 1230,
"valid_targets_mean": 4636.1,
"valid_targets_min": 664
},
{
"epoch": 1.8683812405446294,
"grad_norm": 0.46507622330055887,
"learning_rate": 3.6710677470307174e-05,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19449734687805176,
"step": 1235,
"valid_targets_mean": 5142.5,
"valid_targets_min": 684
},
{
"epoch": 1.875945537065053,
"grad_norm": 0.4498886408384691,
"learning_rate": 3.6669105418619307e-05,
"loss": 0.214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24638114869594574,
"step": 1240,
"valid_targets_mean": 4571.3,
"valid_targets_min": 947
},
{
"epoch": 1.8835098335854765,
"grad_norm": 0.38613380520350143,
"learning_rate": 3.6627296158517035e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20049728453159332,
"step": 1245,
"valid_targets_mean": 5270.2,
"valid_targets_min": 506
},
{
"epoch": 1.8910741301059002,
"grad_norm": 0.42668472851640654,
"learning_rate": 3.658525028496382e-05,
"loss": 0.2067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20964312553405762,
"step": 1250,
"valid_targets_mean": 5350.7,
"valid_targets_min": 939
},
{
"epoch": 1.8986384266263236,
"grad_norm": 0.45077998259356017,
"learning_rate": 3.654296839629017e-05,
"loss": 0.2269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21868251264095306,
"step": 1255,
"valid_targets_mean": 4306.2,
"valid_targets_min": 648
},
{
"epoch": 1.9062027231467473,
"grad_norm": 0.4172755513143054,
"learning_rate": 3.650045109418526e-05,
"loss": 0.2105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20290303230285645,
"step": 1260,
"valid_targets_mean": 4538.8,
"valid_targets_min": 729
},
{
"epoch": 1.913767019667171,
"grad_norm": 0.39469743941144136,
"learning_rate": 3.645769898368826e-05,
"loss": 0.2291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2144225537776947,
"step": 1265,
"valid_targets_mean": 5632.7,
"valid_targets_min": 1531
},
{
"epoch": 1.9213313161875947,
"grad_norm": 0.43115820343190236,
"learning_rate": 3.641471267317976e-05,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1905321180820465,
"step": 1270,
"valid_targets_mean": 5414.7,
"valid_targets_min": 3137
},
{
"epoch": 1.9288956127080181,
"grad_norm": 0.43617197993062395,
"learning_rate": 3.637149277437313e-05,
"loss": 0.2128,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18612077832221985,
"step": 1275,
"valid_targets_mean": 4280.9,
"valid_targets_min": 913
},
{
"epoch": 1.9364599092284418,
"grad_norm": 0.4134925897382423,
"learning_rate": 3.6328039902305806e-05,
"loss": 0.2044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2115355283021927,
"step": 1280,
"valid_targets_mean": 5742.0,
"valid_targets_min": 2905
},
{
"epoch": 1.9440242057488653,
"grad_norm": 0.48642626046401954,
"learning_rate": 3.628435467533051e-05,
"loss": 0.1973,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20169591903686523,
"step": 1285,
"valid_targets_mean": 4847.1,
"valid_targets_min": 697
},
{
"epoch": 1.951588502269289,
"grad_norm": 0.45981955132140206,
"learning_rate": 3.624043771510647e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2202417254447937,
"step": 1290,
"valid_targets_mean": 4461.9,
"valid_targets_min": 768
},
{
"epoch": 1.9591527987897126,
"grad_norm": 0.5548992370748099,
"learning_rate": 3.619628964659061e-05,
"loss": 0.2069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20979902148246765,
"step": 1295,
"valid_targets_mean": 4232.5,
"valid_targets_min": 605
},
{
"epoch": 1.9667170953101363,
"grad_norm": 0.45509897761384305,
"learning_rate": 3.61519110980286e-05,
"loss": 0.221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23807252943515778,
"step": 1300,
"valid_targets_mean": 5210.3,
"valid_targets_min": 653
},
{
"epoch": 1.9742813918305597,
"grad_norm": 0.4954616432107395,
"learning_rate": 3.6107302700945925e-05,
"loss": 0.2177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19750761985778809,
"step": 1305,
"valid_targets_mean": 4131.4,
"valid_targets_min": 1256
},
{
"epoch": 1.9818456883509834,
"grad_norm": 0.4950490512679412,
"learning_rate": 3.6062465090138936e-05,
"loss": 0.2047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21456892788410187,
"step": 1310,
"valid_targets_mean": 4869.4,
"valid_targets_min": 276
},
{
"epoch": 1.9894099848714069,
"grad_norm": 0.4002985029551449,
"learning_rate": 3.6017398903665787e-05,
"loss": 0.2075,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21733352541923523,
"step": 1315,
"valid_targets_mean": 5251.1,
"valid_targets_min": 509
},
{
"epoch": 1.9969742813918305,
"grad_norm": 0.45582333361758404,
"learning_rate": 3.597210478283735e-05,
"loss": 0.2115,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18914233148097992,
"step": 1320,
"valid_targets_mean": 4262.2,
"valid_targets_min": 627
},
{
"epoch": 2.004538577912254,
"grad_norm": 0.40702543737998387,
"learning_rate": 3.5926583372208106e-05,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1540646106004715,
"step": 1325,
"valid_targets_mean": 4975.2,
"valid_targets_min": 700
},
{
"epoch": 2.012102874432678,
"grad_norm": 0.4496790435497547,
"learning_rate": 3.588083531956698e-05,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2218005359172821,
"step": 1330,
"valid_targets_mean": 5816.9,
"valid_targets_min": 904
},
{
"epoch": 2.0196671709531016,
"grad_norm": 0.46863438000971996,
"learning_rate": 3.583486127592807e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18488076329231262,
"step": 1335,
"valid_targets_mean": 5440.6,
"valid_targets_min": 3085
},
{
"epoch": 2.027231467473525,
"grad_norm": 0.5151916546138103,
"learning_rate": 3.5788661895521455e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2258104532957077,
"step": 1340,
"valid_targets_mean": 4155.2,
"valid_targets_min": 630
},
{
"epoch": 2.0347957639939485,
"grad_norm": 0.49594114456507576,
"learning_rate": 3.574223783578385e-05,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22207194566726685,
"step": 1345,
"valid_targets_mean": 4207.0,
"valid_targets_min": 315
},
{
"epoch": 2.042360060514372,
"grad_norm": 0.4943620883953129,
"learning_rate": 3.569558975734923e-05,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2514224350452423,
"step": 1350,
"valid_targets_mean": 4149.8,
"valid_targets_min": 344
},
{
"epoch": 2.049924357034796,
"grad_norm": 0.5253116434763031,
"learning_rate": 3.564871832403948e-05,
"loss": 0.2041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2232326716184616,
"step": 1355,
"valid_targets_mean": 4119.2,
"valid_targets_min": 276
},
{
"epoch": 2.0574886535552195,
"grad_norm": 0.5737491130225292,
"learning_rate": 3.560162420285489e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18539798259735107,
"step": 1360,
"valid_targets_mean": 3559.8,
"valid_targets_min": 636
},
{
"epoch": 2.065052950075643,
"grad_norm": 0.4385320487150631,
"learning_rate": 3.555430806396471e-05,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17747828364372253,
"step": 1365,
"valid_targets_mean": 5143.0,
"valid_targets_min": 786
},
{
"epoch": 2.0726172465960664,
"grad_norm": 0.4516448141785158,
"learning_rate": 3.55067705806976e-05,
"loss": 0.1861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17075631022453308,
"step": 1370,
"valid_targets_mean": 3945.9,
"valid_targets_min": 708
},
{
"epoch": 2.08018154311649,
"grad_norm": 0.4568200680232734,
"learning_rate": 3.545901242953203e-05,
"loss": 0.1793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1752496063709259,
"step": 1375,
"valid_targets_mean": 4810.1,
"valid_targets_min": 589
},
{
"epoch": 2.0877458396369137,
"grad_norm": 0.42407318340899935,
"learning_rate": 3.541103429008666e-05,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18580807745456696,
"step": 1380,
"valid_targets_mean": 4368.6,
"valid_targets_min": 1246
},
{
"epoch": 2.0953101361573374,
"grad_norm": 0.4653908136883707,
"learning_rate": 3.5362836845110716e-05,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19469863176345825,
"step": 1385,
"valid_targets_mean": 4756.0,
"valid_targets_min": 733
},
{
"epoch": 2.102874432677761,
"grad_norm": 0.5635103968025736,
"learning_rate": 3.5314420780474186e-05,
"loss": 0.2122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2790437936782837,
"step": 1390,
"valid_targets_mean": 4166.2,
"valid_targets_min": 710
},
{
"epoch": 2.1104387291981848,
"grad_norm": 0.43205481737773477,
"learning_rate": 3.5265786785158145e-05,
"loss": 0.1817,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1872987449169159,
"step": 1395,
"valid_targets_mean": 5274.1,
"valid_targets_min": 864
},
{
"epoch": 2.118003025718608,
"grad_norm": 0.4774922261941819,
"learning_rate": 3.5216935551244896e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21239280700683594,
"step": 1400,
"valid_targets_mean": 4354.2,
"valid_targets_min": 728
},
{
"epoch": 2.1255673222390317,
"grad_norm": 0.4294646533171388,
"learning_rate": 3.516786777390813e-05,
"loss": 0.205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19841662049293518,
"step": 1405,
"valid_targets_mean": 4863.3,
"valid_targets_min": 831
},
{
"epoch": 2.1331316187594553,
"grad_norm": 0.4456489658314288,
"learning_rate": 3.511858415140307e-05,
"loss": 0.1938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17594018578529358,
"step": 1410,
"valid_targets_mean": 4792.0,
"valid_targets_min": 313
},
{
"epoch": 2.140695915279879,
"grad_norm": 0.44465763211771253,
"learning_rate": 3.506908538505648e-05,
"loss": 0.1999,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18716633319854736,
"step": 1415,
"valid_targets_mean": 5343.8,
"valid_targets_min": 251
},
{
"epoch": 2.1482602118003027,
"grad_norm": 0.39752123335367506,
"learning_rate": 3.501937217925673e-05,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18770697712898254,
"step": 1420,
"valid_targets_mean": 6363.2,
"valid_targets_min": 2667
},
{
"epoch": 2.1558245083207264,
"grad_norm": 0.39155216335682075,
"learning_rate": 3.496944524144375e-05,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19712628424167633,
"step": 1425,
"valid_targets_mean": 5730.4,
"valid_targets_min": 1000
},
{
"epoch": 2.1633888048411496,
"grad_norm": 0.43195947367825904,
"learning_rate": 3.4919305282098946e-05,
"loss": 0.2072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24122843146324158,
"step": 1430,
"valid_targets_mean": 6412.1,
"valid_targets_min": 889
},
{
"epoch": 2.1709531013615733,
"grad_norm": 0.4398943111486007,
"learning_rate": 3.486895301473515e-05,
"loss": 0.2081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19659355282783508,
"step": 1435,
"valid_targets_mean": 5464.9,
"valid_targets_min": 1276
},
{
"epoch": 2.178517397881997,
"grad_norm": 0.48362329298743195,
"learning_rate": 3.4818389155886394e-05,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2112506628036499,
"step": 1440,
"valid_targets_mean": 4218.0,
"valid_targets_min": 1231
},
{
"epoch": 2.1860816944024206,
"grad_norm": 0.42445784479643406,
"learning_rate": 3.476761442509776e-05,
"loss": 0.1938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20175385475158691,
"step": 1445,
"valid_targets_mean": 5042.2,
"valid_targets_min": 650
},
{
"epoch": 2.1936459909228443,
"grad_norm": 0.46863858194637786,
"learning_rate": 3.4716629544915124e-05,
"loss": 0.1804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18960747122764587,
"step": 1450,
"valid_targets_mean": 4570.9,
"valid_targets_min": 289
},
{
"epoch": 2.201210287443268,
"grad_norm": 0.4081654878828203,
"learning_rate": 3.4665435240874883e-05,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21481245756149292,
"step": 1455,
"valid_targets_mean": 5856.9,
"valid_targets_min": 697
},
{
"epoch": 2.208774583963691,
"grad_norm": 0.4111346302978917,
"learning_rate": 3.46140322414936e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19531169533729553,
"step": 1460,
"valid_targets_mean": 5301.0,
"valid_targets_min": 2624
},
{
"epoch": 2.216338880484115,
"grad_norm": 0.4377217717133345,
"learning_rate": 3.456242127825769e-05,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20428526401519775,
"step": 1465,
"valid_targets_mean": 5484.6,
"valid_targets_min": 825
},
{
"epoch": 2.2239031770045385,
"grad_norm": 0.4506208136550606,
"learning_rate": 3.4510603085612984e-05,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23383532464504242,
"step": 1470,
"valid_targets_mean": 5352.6,
"valid_targets_min": 510
},
{
"epoch": 2.231467473524962,
"grad_norm": 0.43942764521770533,
"learning_rate": 3.445857840095425e-05,
"loss": 0.204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22128233313560486,
"step": 1475,
"valid_targets_mean": 5222.1,
"valid_targets_min": 580
},
{
"epoch": 2.239031770045386,
"grad_norm": 0.4503478854825486,
"learning_rate": 3.4406347964614725e-05,
"loss": 0.2024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21977970004081726,
"step": 1480,
"valid_targets_mean": 4908.6,
"valid_targets_min": 899
},
{
"epoch": 2.2465960665658096,
"grad_norm": 0.4413787827481323,
"learning_rate": 3.4353912519855605e-05,
"loss": 0.193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19306686520576477,
"step": 1485,
"valid_targets_mean": 4952.8,
"valid_targets_min": 458
},
{
"epoch": 2.254160363086233,
"grad_norm": 0.5587470714781764,
"learning_rate": 3.4301272812855425e-05,
"loss": 0.2124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2252560257911682,
"step": 1490,
"valid_targets_mean": 4599.5,
"valid_targets_min": 671
},
{
"epoch": 2.2617246596066565,
"grad_norm": 0.4687262608875152,
"learning_rate": 3.4248429592699455e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25899726152420044,
"step": 1495,
"valid_targets_mean": 4973.8,
"valid_targets_min": 1007
},
{
"epoch": 2.26928895612708,
"grad_norm": 0.49079428216545606,
"learning_rate": 3.419538361136906e-05,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.182472363114357,
"step": 1500,
"valid_targets_mean": 5454.8,
"valid_targets_min": 308
},
{
"epoch": 2.276853252647504,
"grad_norm": 0.49359503726236653,
"learning_rate": 3.4142135623730954e-05,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19357086718082428,
"step": 1505,
"valid_targets_mean": 3701.8,
"valid_targets_min": 606
},
{
"epoch": 2.2844175491679275,
"grad_norm": 0.4153158668013505,
"learning_rate": 3.408868638752652e-05,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17256566882133484,
"step": 1510,
"valid_targets_mean": 4801.5,
"valid_targets_min": 547
},
{
"epoch": 2.291981845688351,
"grad_norm": 0.4244264255761697,
"learning_rate": 3.4035036663360975e-05,
"loss": 0.1946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1777007281780243,
"step": 1515,
"valid_targets_mean": 4332.2,
"valid_targets_min": 633
},
{
"epoch": 2.2995461422087744,
"grad_norm": 0.45909023723152254,
"learning_rate": 3.398118721469255e-05,
"loss": 0.2138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20535892248153687,
"step": 1520,
"valid_targets_mean": 4871.4,
"valid_targets_min": 718
},
{
"epoch": 2.307110438729198,
"grad_norm": 0.4473665556214724,
"learning_rate": 3.392713880782168e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23217563331127167,
"step": 1525,
"valid_targets_mean": 5512.5,
"valid_targets_min": 1040
},
{
"epoch": 2.3146747352496218,
"grad_norm": 0.42374613530545113,
"learning_rate": 3.3872892211880024e-05,
"loss": 0.1884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1817803978919983,
"step": 1530,
"valid_targets_mean": 5129.2,
"valid_targets_min": 518
},
{
"epoch": 2.3222390317700454,
"grad_norm": 0.4276274337247246,
"learning_rate": 3.381844819881956e-05,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18477100133895874,
"step": 1535,
"valid_targets_mean": 4986.2,
"valid_targets_min": 3046
},
{
"epoch": 2.329803328290469,
"grad_norm": 0.47276929234987713,
"learning_rate": 3.376380754340161e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18416282534599304,
"step": 1540,
"valid_targets_mean": 5228.8,
"valid_targets_min": 768
},
{
"epoch": 2.3373676248108928,
"grad_norm": 0.4196095119449812,
"learning_rate": 3.370897102318579e-05,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20898360013961792,
"step": 1545,
"valid_targets_mean": 4759.8,
"valid_targets_min": 492
},
{
"epoch": 2.344931921331316,
"grad_norm": 0.4748812000021928,
"learning_rate": 3.365393941851895e-05,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19465558230876923,
"step": 1550,
"valid_targets_mean": 5065.6,
"valid_targets_min": 593
},
{
"epoch": 2.3524962178517397,
"grad_norm": 0.45592369911420205,
"learning_rate": 3.3598713512524095e-05,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20027290284633636,
"step": 1555,
"valid_targets_mean": 4513.0,
"valid_targets_min": 813
},
{
"epoch": 2.3600605143721634,
"grad_norm": 0.47210399853307966,
"learning_rate": 3.3543294091089196e-05,
"loss": 0.1866,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1730816662311554,
"step": 1560,
"valid_targets_mean": 4316.6,
"valid_targets_min": 1518
},
{
"epoch": 2.367624810892587,
"grad_norm": 0.41410239848604946,
"learning_rate": 3.348768194285604e-05,
"loss": 0.2187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18337824940681458,
"step": 1565,
"valid_targets_mean": 5466.7,
"valid_targets_min": 757
},
{
"epoch": 2.3751891074130107,
"grad_norm": 0.45973957172447916,
"learning_rate": 3.343187785920899e-05,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1856488138437271,
"step": 1570,
"valid_targets_mean": 4216.2,
"valid_targets_min": 307
},
{
"epoch": 2.3827534039334344,
"grad_norm": 0.4378622827189698,
"learning_rate": 3.337588263426376e-05,
"loss": 0.2074,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19100350141525269,
"step": 1575,
"valid_targets_mean": 5184.4,
"valid_targets_min": 619
},
{
"epoch": 2.3903177004538576,
"grad_norm": 0.4386524001539198,
"learning_rate": 3.331969706485604e-05,
"loss": 0.201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17415636777877808,
"step": 1580,
"valid_targets_mean": 4543.0,
"valid_targets_min": 370
},
{
"epoch": 2.3978819969742813,
"grad_norm": 0.43023639119991364,
"learning_rate": 3.3263321950530244e-05,
"loss": 0.2013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20897901058197021,
"step": 1585,
"valid_targets_mean": 4961.1,
"valid_targets_min": 662
},
{
"epoch": 2.405446293494705,
"grad_norm": 0.42713339383685595,
"learning_rate": 3.320675809352807e-05,
"loss": 0.2124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19284377992153168,
"step": 1590,
"valid_targets_mean": 5614.0,
"valid_targets_min": 688
},
{
"epoch": 2.4130105900151286,
"grad_norm": 0.5523601616423389,
"learning_rate": 3.31500062987771e-05,
"loss": 0.1983,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19253116846084595,
"step": 1595,
"valid_targets_mean": 4295.9,
"valid_targets_min": 557
},
{
"epoch": 2.4205748865355523,
"grad_norm": 0.5607373427621611,
"learning_rate": 3.309306737387936e-05,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1754857301712036,
"step": 1600,
"valid_targets_mean": 4523.5,
"valid_targets_min": 780
},
{
"epoch": 2.428139183055976,
"grad_norm": 0.4720039398009578,
"learning_rate": 3.303594212909981e-05,
"loss": 0.2005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2118072211742401,
"step": 1605,
"valid_targets_mean": 4806.7,
"valid_targets_min": 1473
},
{
"epoch": 2.435703479576399,
"grad_norm": 0.42277502230438585,
"learning_rate": 3.297863137735483e-05,
"loss": 0.1915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18252259492874146,
"step": 1610,
"valid_targets_mean": 4898.9,
"valid_targets_min": 1972
},
{
"epoch": 2.443267776096823,
"grad_norm": 0.399237439365295,
"learning_rate": 3.292113593420064e-05,
"loss": 0.2006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21672359108924866,
"step": 1615,
"valid_targets_mean": 5876.3,
"valid_targets_min": 583
},
{
"epoch": 2.4508320726172466,
"grad_norm": 0.4486669185061525,
"learning_rate": 3.2863456617821686e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19526150822639465,
"step": 1620,
"valid_targets_mean": 4571.8,
"valid_targets_min": 563
},
{
"epoch": 2.4583963691376702,
"grad_norm": 0.44285518845846517,
"learning_rate": 3.280559424901902e-05,
"loss": 0.2139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1940869390964508,
"step": 1625,
"valid_targets_mean": 4653.3,
"valid_targets_min": 932
},
{
"epoch": 2.465960665658094,
"grad_norm": 0.43307975933325155,
"learning_rate": 3.274754965119859e-05,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19831156730651855,
"step": 1630,
"valid_targets_mean": 6298.4,
"valid_targets_min": 831
},
{
"epoch": 2.4735249621785176,
"grad_norm": 0.44815134988666483,
"learning_rate": 3.268932365035957e-05,
"loss": 0.1905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17851749062538147,
"step": 1635,
"valid_targets_mean": 4155.0,
"valid_targets_min": 873
},
{
"epoch": 2.481089258698941,
"grad_norm": 0.4758137431057834,
"learning_rate": 3.2630917075082545e-05,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21051645278930664,
"step": 1640,
"valid_targets_mean": 4256.6,
"valid_targets_min": 543
},
{
"epoch": 2.4886535552193645,
"grad_norm": 0.4856266870931895,
"learning_rate": 3.257233075651776e-05,
"loss": 0.1887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2091045379638672,
"step": 1645,
"valid_targets_mean": 3996.8,
"valid_targets_min": 772
},
{
"epoch": 2.496217851739788,
"grad_norm": 0.4596232547209677,
"learning_rate": 3.251356552837331e-05,
"loss": 0.1943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20302638411521912,
"step": 1650,
"valid_targets_mean": 4664.9,
"valid_targets_min": 559
},
{
"epoch": 2.503782148260212,
"grad_norm": 0.445645358686214,
"learning_rate": 3.24546222269032e-05,
"loss": 0.2,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20104148983955383,
"step": 1655,
"valid_targets_mean": 4935.3,
"valid_targets_min": 648
},
{
"epoch": 2.5113464447806355,
"grad_norm": 0.4163593861795244,
"learning_rate": 3.239550169089554e-05,
"loss": 0.2021,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20811429619789124,
"step": 1660,
"valid_targets_mean": 4935.7,
"valid_targets_min": 846
},
{
"epoch": 2.5189107413010587,
"grad_norm": 0.4506628867755876,
"learning_rate": 3.233620476166052e-05,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19512595236301422,
"step": 1665,
"valid_targets_mean": 4339.9,
"valid_targets_min": 841
},
{
"epoch": 2.5264750378214824,
"grad_norm": 0.4613561611964294,
"learning_rate": 3.227673228301852e-05,
"loss": 0.2023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2082904875278473,
"step": 1670,
"valid_targets_mean": 5157.9,
"valid_targets_min": 239
},
{
"epoch": 2.534039334341906,
"grad_norm": 0.4300736454991396,
"learning_rate": 3.221708510128803e-05,
"loss": 0.2126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22433291375637054,
"step": 1675,
"valid_targets_mean": 5423.8,
"valid_targets_min": 874
},
{
"epoch": 2.5416036308623298,
"grad_norm": 0.4490922816670387,
"learning_rate": 3.215726406527366e-05,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2263888120651245,
"step": 1680,
"valid_targets_mean": 5079.9,
"valid_targets_min": 716
},
{
"epoch": 2.5491679273827534,
"grad_norm": 0.4252724518754956,
"learning_rate": 3.209727002625403e-05,
"loss": 0.1827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18171165883541107,
"step": 1685,
"valid_targets_mean": 5157.6,
"valid_targets_min": 736
},
{
"epoch": 2.556732223903177,
"grad_norm": 0.5227593631370397,
"learning_rate": 3.203710383796968e-05,
"loss": 0.2036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22884613275527954,
"step": 1690,
"valid_targets_mean": 3696.8,
"valid_targets_min": 583
},
{
"epoch": 2.564296520423601,
"grad_norm": 0.40394341246737125,
"learning_rate": 3.197676635661088e-05,
"loss": 0.1891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16832637786865234,
"step": 1695,
"valid_targets_mean": 4719.4,
"valid_targets_min": 883
},
{
"epoch": 2.5718608169440245,
"grad_norm": 0.4100683829903881,
"learning_rate": 3.191625844080549e-05,
"loss": 0.1954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17842620611190796,
"step": 1700,
"valid_targets_mean": 4411.6,
"valid_targets_min": 765
},
{
"epoch": 2.5794251134644477,
"grad_norm": 0.4485180434538262,
"learning_rate": 3.185558095160673e-05,
"loss": 0.2009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21995443105697632,
"step": 1705,
"valid_targets_mean": 5099.1,
"valid_targets_min": 679
},
{
"epoch": 2.5869894099848714,
"grad_norm": 0.38074545321551795,
"learning_rate": 3.1794734752480904e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16947045922279358,
"step": 1710,
"valid_targets_mean": 5466.0,
"valid_targets_min": 1958
},
{
"epoch": 2.594553706505295,
"grad_norm": 0.3895212805166888,
"learning_rate": 3.173372070929516e-05,
"loss": 0.1887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17781910300254822,
"step": 1715,
"valid_targets_mean": 5277.6,
"valid_targets_min": 361
},
{
"epoch": 2.6021180030257187,
"grad_norm": 0.41926890792799176,
"learning_rate": 3.1672539690305085e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18371908366680145,
"step": 1720,
"valid_targets_mean": 4538.6,
"valid_targets_min": 653
},
{
"epoch": 2.609682299546142,
"grad_norm": 0.41803066739386174,
"learning_rate": 3.161119256614245e-05,
"loss": 0.202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19282883405685425,
"step": 1725,
"valid_targets_mean": 4689.3,
"valid_targets_min": 332
},
{
"epoch": 2.6172465960665656,
"grad_norm": 0.4163373440445869,
"learning_rate": 3.1549680209802755e-05,
"loss": 0.1998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21184735000133514,
"step": 1730,
"valid_targets_mean": 5217.1,
"valid_targets_min": 625
},
{
"epoch": 2.6248108925869893,
"grad_norm": 0.43278351740246923,
"learning_rate": 3.148800349663284e-05,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17267610132694244,
"step": 1735,
"valid_targets_mean": 5302.0,
"valid_targets_min": 961
},
{
"epoch": 2.632375189107413,
"grad_norm": 0.4301909115075832,
"learning_rate": 3.142616330431838e-05,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21546387672424316,
"step": 1740,
"valid_targets_mean": 5153.0,
"valid_targets_min": 677
},
{
"epoch": 2.6399394856278366,
"grad_norm": 0.43182873571569885,
"learning_rate": 3.136416051287145e-05,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2066439390182495,
"step": 1745,
"valid_targets_mean": 5306.9,
"valid_targets_min": 786
},
{
"epoch": 2.6475037821482603,
"grad_norm": 0.4085125515579365,
"learning_rate": 3.130199600461797e-05,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1787445843219757,
"step": 1750,
"valid_targets_mean": 5295.1,
"valid_targets_min": 619
},
{
"epoch": 2.655068078668684,
"grad_norm": 0.42252400798877315,
"learning_rate": 3.1239670664185175e-05,
"loss": 0.2034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2020232379436493,
"step": 1755,
"valid_targets_mean": 5475.5,
"valid_targets_min": 514
},
{
"epoch": 2.6626323751891077,
"grad_norm": 0.896652188415317,
"learning_rate": 3.1177185378488984e-05,
"loss": 0.1853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18937832117080688,
"step": 1760,
"valid_targets_mean": 3316.6,
"valid_targets_min": 635
},
{
"epoch": 2.670196671709531,
"grad_norm": 0.4448738975213965,
"learning_rate": 3.111454103672143e-05,
"loss": 0.1974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19633612036705017,
"step": 1765,
"valid_targets_mean": 4133.8,
"valid_targets_min": 712
},
{
"epoch": 2.6777609682299546,
"grad_norm": 0.4466168476220182,
"learning_rate": 3.105173853033796e-05,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20809951424598694,
"step": 1770,
"valid_targets_mean": 4109.6,
"valid_targets_min": 667
},
{
"epoch": 2.6853252647503782,
"grad_norm": 0.4951441062549152,
"learning_rate": 3.098877875304478e-05,
"loss": 0.2108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18588414788246155,
"step": 1775,
"valid_targets_mean": 5792.4,
"valid_targets_min": 716
},
{
"epoch": 2.692889561270802,
"grad_norm": 0.3783523235737496,
"learning_rate": 3.092566260078614e-05,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17155107855796814,
"step": 1780,
"valid_targets_mean": 5417.6,
"valid_targets_min": 687
},
{
"epoch": 2.700453857791225,
"grad_norm": 0.41078514757696655,
"learning_rate": 3.086239097173155e-05,
"loss": 0.1919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2063501477241516,
"step": 1785,
"valid_targets_mean": 5055.7,
"valid_targets_min": 892
},
{
"epoch": 2.708018154311649,
"grad_norm": 0.43887043899986533,
"learning_rate": 3.079896476626303e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21934330463409424,
"step": 1790,
"valid_targets_mean": 5341.4,
"valid_targets_min": 891
},
{
"epoch": 2.7155824508320725,
"grad_norm": 0.4255605078324983,
"learning_rate": 3.073538488696229e-05,
"loss": 0.2069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18903899192810059,
"step": 1795,
"valid_targets_mean": 5615.9,
"valid_targets_min": 592
},
{
"epoch": 2.723146747352496,
"grad_norm": 0.589823722023372,
"learning_rate": 3.0671652238597873e-05,
"loss": 0.1924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1876818835735321,
"step": 1800,
"valid_targets_mean": 5229.2,
"valid_targets_min": 1796
},
{
"epoch": 2.73071104387292,
"grad_norm": 0.48691578647433853,
"learning_rate": 3.060776772811231e-05,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2318037450313568,
"step": 1805,
"valid_targets_mean": 4098.2,
"valid_targets_min": 830
},
{
"epoch": 2.7382753403933435,
"grad_norm": 0.660918859398447,
"learning_rate": 3.0543732264609174e-05,
"loss": 0.1963,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2070668637752533,
"step": 1810,
"valid_targets_mean": 5188.2,
"valid_targets_min": 1829
},
{
"epoch": 2.745839636913767,
"grad_norm": 0.42428761873536697,
"learning_rate": 3.0479546759340176e-05,
"loss": 0.1968,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17107611894607544,
"step": 1815,
"valid_targets_mean": 4367.8,
"valid_targets_min": 324
},
{
"epoch": 2.753403933434191,
"grad_norm": 0.4370704783114705,
"learning_rate": 3.0415212125692184e-05,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19081702828407288,
"step": 1820,
"valid_targets_mean": 4557.9,
"valid_targets_min": 723
},
{
"epoch": 2.760968229954614,
"grad_norm": 0.46349591557486075,
"learning_rate": 3.0350729279174212e-05,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19641894102096558,
"step": 1825,
"valid_targets_mean": 5278.9,
"valid_targets_min": 2337
},
{
"epoch": 2.768532526475038,
"grad_norm": 0.524642612915043,
"learning_rate": 3.0286099137404426e-05,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19328051805496216,
"step": 1830,
"valid_targets_mean": 5464.6,
"valid_targets_min": 663
},
{
"epoch": 2.7760968229954615,
"grad_norm": 0.43508313940321147,
"learning_rate": 3.0221322620097047e-05,
"loss": 0.1989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19558432698249817,
"step": 1835,
"valid_targets_mean": 4772.1,
"valid_targets_min": 2237
},
{
"epoch": 2.783661119515885,
"grad_norm": 0.4041659272772562,
"learning_rate": 3.01564006490493e-05,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20566602051258087,
"step": 1840,
"valid_targets_mean": 6452.6,
"valid_targets_min": 2725
},
{
"epoch": 2.7912254160363084,
"grad_norm": 0.4030427238187041,
"learning_rate": 3.0091334148128265e-05,
"loss": 0.1965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17462749779224396,
"step": 1845,
"valid_targets_mean": 5316.8,
"valid_targets_min": 600
},
{
"epoch": 2.798789712556732,
"grad_norm": 0.4961824149557135,
"learning_rate": 3.002612404325774e-05,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2178715467453003,
"step": 1850,
"valid_targets_mean": 3882.9,
"valid_targets_min": 540
},
{
"epoch": 2.8063540090771557,
"grad_norm": 0.42175695435983496,
"learning_rate": 2.9960771262405085e-05,
"loss": 0.1943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1930299699306488,
"step": 1855,
"valid_targets_mean": 5572.1,
"valid_targets_min": 2244
},
{
"epoch": 2.8139183055975794,
"grad_norm": 0.40908551740974003,
"learning_rate": 2.9895276735567988e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17899967730045319,
"step": 1860,
"valid_targets_mean": 5095.8,
"valid_targets_min": 1007
},
{
"epoch": 2.821482602118003,
"grad_norm": 0.4248876340373272,
"learning_rate": 2.982964139476124e-05,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1757224202156067,
"step": 1865,
"valid_targets_mean": 4697.9,
"valid_targets_min": 1035
},
{
"epoch": 2.8290468986384267,
"grad_norm": 0.42593735085657447,
"learning_rate": 2.9763866174003473e-05,
"loss": 0.2023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23707634210586548,
"step": 1870,
"valid_targets_mean": 6115.4,
"valid_targets_min": 1386
},
{
"epoch": 2.8366111951588504,
"grad_norm": 0.45026114969687053,
"learning_rate": 2.9697952009303886e-05,
"loss": 0.1969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.187404602766037,
"step": 1875,
"valid_targets_mean": 4572.1,
"valid_targets_min": 823
},
{
"epoch": 2.844175491679274,
"grad_norm": 0.42649362408455643,
"learning_rate": 2.9631899838648887e-05,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18948125839233398,
"step": 1880,
"valid_targets_mean": 4665.5,
"valid_targets_min": 911
},
{
"epoch": 2.8517397881996973,
"grad_norm": 0.3720008592357275,
"learning_rate": 2.9565710601988783e-05,
"loss": 0.1893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16390863060951233,
"step": 1885,
"valid_targets_mean": 5894.8,
"valid_targets_min": 638
},
{
"epoch": 2.859304084720121,
"grad_norm": 0.43144241147993634,
"learning_rate": 2.9499385241224395e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20528359711170197,
"step": 1890,
"valid_targets_mean": 5719.8,
"valid_targets_min": 1110
},
{
"epoch": 2.8668683812405447,
"grad_norm": 0.4390908805212251,
"learning_rate": 2.943292470019361e-05,
"loss": 0.1943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17955082654953003,
"step": 1895,
"valid_targets_mean": 4001.1,
"valid_targets_min": 688
},
{
"epoch": 2.8744326777609683,
"grad_norm": 0.38596306723643325,
"learning_rate": 2.936632992465803e-05,
"loss": 0.1877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18508818745613098,
"step": 1900,
"valid_targets_mean": 5744.8,
"valid_targets_min": 4281
},
{
"epoch": 2.8819969742813916,
"grad_norm": 0.4795728053309178,
"learning_rate": 2.9299601862289453e-05,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18243417143821716,
"step": 1905,
"valid_targets_mean": 3936.1,
"valid_targets_min": 856
},
{
"epoch": 2.8895612708018152,
"grad_norm": 0.4594467335481041,
"learning_rate": 2.92327414626564e-05,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18039527535438538,
"step": 1910,
"valid_targets_mean": 4143.9,
"valid_targets_min": 634
},
{
"epoch": 2.897125567322239,
"grad_norm": 0.39267385150227535,
"learning_rate": 2.9165749677210615e-05,
"loss": 0.1915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1811700463294983,
"step": 1915,
"valid_targets_mean": 5184.6,
"valid_targets_min": 968
},
{
"epoch": 2.9046898638426626,
"grad_norm": 0.4868122959844636,
"learning_rate": 2.9098627459273516e-05,
"loss": 0.2008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20172417163848877,
"step": 1920,
"valid_targets_mean": 4043.6,
"valid_targets_min": 553
},
{
"epoch": 2.9122541603630863,
"grad_norm": 0.46754401466860396,
"learning_rate": 2.9031375764022627e-05,
"loss": 0.2122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18514400720596313,
"step": 1925,
"valid_targets_mean": 4837.5,
"valid_targets_min": 333
},
{
"epoch": 2.91981845688351,
"grad_norm": 0.4056142272807577,
"learning_rate": 2.8963995548477996e-05,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17639204859733582,
"step": 1930,
"valid_targets_mean": 4832.6,
"valid_targets_min": 635
},
{
"epoch": 2.9273827534039336,
"grad_norm": 0.621399576217883,
"learning_rate": 2.8896487771488564e-05,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21237429976463318,
"step": 1935,
"valid_targets_mean": 3703.5,
"valid_targets_min": 711
},
{
"epoch": 2.9349470499243573,
"grad_norm": 0.42986488062021244,
"learning_rate": 2.882885339371852e-05,
"loss": 0.2017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20180043578147888,
"step": 1940,
"valid_targets_mean": 5049.2,
"valid_targets_min": 775
},
{
"epoch": 2.9425113464447805,
"grad_norm": 0.4259342195024064,
"learning_rate": 2.8761093377633657e-05,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1935410350561142,
"step": 1945,
"valid_targets_mean": 5046.2,
"valid_targets_min": 969
},
{
"epoch": 2.950075642965204,
"grad_norm": 0.4108347413723792,
"learning_rate": 2.8693208687487617e-05,
"loss": 0.1989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1827128529548645,
"step": 1950,
"valid_targets_mean": 5555.4,
"valid_targets_min": 1354
},
{
"epoch": 2.957639939485628,
"grad_norm": 0.4045575068570252,
"learning_rate": 2.8625200289308242e-05,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19365639984607697,
"step": 1955,
"valid_targets_mean": 5364.6,
"valid_targets_min": 1894
},
{
"epoch": 2.9652042360060515,
"grad_norm": 0.4645036427391149,
"learning_rate": 2.855706915088378e-05,
"loss": 0.1976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20481233298778534,
"step": 1960,
"valid_targets_mean": 4193.6,
"valid_targets_min": 842
},
{
"epoch": 2.9727685325264748,
"grad_norm": 0.45940755177813786,
"learning_rate": 2.8488816241749123e-05,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1904478818178177,
"step": 1965,
"valid_targets_mean": 3872.9,
"valid_targets_min": 793
},
{
"epoch": 2.9803328290468984,
"grad_norm": 0.4316864521638559,
"learning_rate": 2.8420442533171995e-05,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18184807896614075,
"step": 1970,
"valid_targets_mean": 4514.9,
"valid_targets_min": 680
},
{
"epoch": 2.987897125567322,
"grad_norm": 0.41611560629943883,
"learning_rate": 2.8351948998139187e-05,
"loss": 0.1939,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19364595413208008,
"step": 1975,
"valid_targets_mean": 4439.6,
"valid_targets_min": 834
},
{
"epoch": 2.995461422087746,
"grad_norm": 0.37967027522286967,
"learning_rate": 2.8283336611342634e-05,
"loss": 0.1888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18696758151054382,
"step": 1980,
"valid_targets_mean": 5346.8,
"valid_targets_min": 697
},
{
"epoch": 3.0030257186081695,
"grad_norm": 0.42663777104066586,
"learning_rate": 2.8214606349165587e-05,
"loss": 0.184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1831974983215332,
"step": 1985,
"valid_targets_mean": 5566.9,
"valid_targets_min": 2660
},
{
"epoch": 3.010590015128593,
"grad_norm": 0.4650435000504031,
"learning_rate": 2.8145759189668748e-05,
"loss": 0.1838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17917796969413757,
"step": 1990,
"valid_targets_mean": 4684.1,
"valid_targets_min": 908
},
{
"epoch": 3.018154311649017,
"grad_norm": 0.4426288047149243,
"learning_rate": 2.8076796112576273e-05,
"loss": 0.1816,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2020592838525772,
"step": 1995,
"valid_targets_mean": 4922.2,
"valid_targets_min": 606
},
{
"epoch": 3.02571860816944,
"grad_norm": 0.43542206084007723,
"learning_rate": 2.8007718099261886e-05,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18459182977676392,
"step": 2000,
"valid_targets_mean": 5220.1,
"valid_targets_min": 432
},
{
"epoch": 3.0332829046898637,
"grad_norm": 0.5115612104025097,
"learning_rate": 2.7938526132734923e-05,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17348910868167877,
"step": 2005,
"valid_targets_mean": 4200.2,
"valid_targets_min": 633
},
{
"epoch": 3.0408472012102874,
"grad_norm": 0.4885826302307685,
"learning_rate": 2.7869221197626307e-05,
"loss": 0.1852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1716952621936798,
"step": 2010,
"valid_targets_mean": 4950.1,
"valid_targets_min": 2131
},
{
"epoch": 3.048411497730711,
"grad_norm": 0.41076102496913264,
"learning_rate": 2.7799804280174547e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20202207565307617,
"step": 2015,
"valid_targets_mean": 5878.2,
"valid_targets_min": 803
},
{
"epoch": 3.0559757942511347,
"grad_norm": 0.5180887749992029,
"learning_rate": 2.773027636821171e-05,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1683463305234909,
"step": 2020,
"valid_targets_mean": 4372.1,
"valid_targets_min": 770
},
{
"epoch": 3.0635400907715584,
"grad_norm": 0.4322804601397516,
"learning_rate": 2.7660638451149377e-05,
"loss": 0.1813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1704043745994568,
"step": 2025,
"valid_targets_mean": 5918.9,
"valid_targets_min": 746
},
{
"epoch": 3.0711043872919817,
"grad_norm": 0.47686737853887257,
"learning_rate": 2.7590891519964523e-05,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16545140743255615,
"step": 2030,
"valid_targets_mean": 4430.4,
"valid_targets_min": 793
},
{
"epoch": 3.0786686838124053,
"grad_norm": 0.49402131162912494,
"learning_rate": 2.7521036567185467e-05,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1749613881111145,
"step": 2035,
"valid_targets_mean": 4374.2,
"valid_targets_min": 865
},
{
"epoch": 3.086232980332829,
"grad_norm": 0.4881940238049801,
"learning_rate": 2.74510745868777e-05,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18618690967559814,
"step": 2040,
"valid_targets_mean": 4110.2,
"valid_targets_min": 980
},
{
"epoch": 3.0937972768532527,
"grad_norm": 0.46079816423016295,
"learning_rate": 2.7381006574629764e-05,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17987105250358582,
"step": 2045,
"valid_targets_mean": 4255.6,
"valid_targets_min": 925
},
{
"epoch": 3.1013615733736764,
"grad_norm": 0.43563452348577103,
"learning_rate": 2.7310833527539092e-05,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1708250641822815,
"step": 2050,
"valid_targets_mean": 4816.2,
"valid_targets_min": 674
},
{
"epoch": 3.1089258698941,
"grad_norm": 0.45727170609137696,
"learning_rate": 2.7240556444197794e-05,
"loss": 0.192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2242300808429718,
"step": 2055,
"valid_targets_mean": 5413.7,
"valid_targets_min": 868
},
{
"epoch": 3.1164901664145233,
"grad_norm": 0.4239934474026591,
"learning_rate": 2.7170176324678466e-05,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18958163261413574,
"step": 2060,
"valid_targets_mean": 4843.6,
"valid_targets_min": 828
},
{
"epoch": 3.124054462934947,
"grad_norm": 0.41161803317312445,
"learning_rate": 2.7099694170519954e-05,
"loss": 0.1847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17357945442199707,
"step": 2065,
"valid_targets_mean": 5419.1,
"valid_targets_min": 2847
},
{
"epoch": 3.1316187594553706,
"grad_norm": 0.46439839012149947,
"learning_rate": 2.702911098471309e-05,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18104906380176544,
"step": 2070,
"valid_targets_mean": 4799.9,
"valid_targets_min": 405
},
{
"epoch": 3.1391830559757943,
"grad_norm": 0.4750168385041568,
"learning_rate": 2.6958427771686442e-05,
"loss": 0.188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22222860157489777,
"step": 2075,
"valid_targets_mean": 4794.3,
"valid_targets_min": 785
},
{
"epoch": 3.146747352496218,
"grad_norm": 0.45925547907351283,
"learning_rate": 2.6887645537292e-05,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18778520822525024,
"step": 2080,
"valid_targets_mean": 4274.8,
"valid_targets_min": 992
},
{
"epoch": 3.1543116490166416,
"grad_norm": 0.46409549568295294,
"learning_rate": 2.681676528879087e-05,
"loss": 0.1884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16386860609054565,
"step": 2085,
"valid_targets_mean": 4708.4,
"valid_targets_min": 894
},
{
"epoch": 3.161875945537065,
"grad_norm": 0.40226973478172007,
"learning_rate": 2.674578803483894e-05,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16758553683757782,
"step": 2090,
"valid_targets_mean": 4964.8,
"valid_targets_min": 2351
},
{
"epoch": 3.1694402420574885,
"grad_norm": 0.4606500236707901,
"learning_rate": 2.6674714785472543e-05,
"loss": 0.1844,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17645390331745148,
"step": 2095,
"valid_targets_mean": 4287.9,
"valid_targets_min": 730
},
{
"epoch": 3.177004538577912,
"grad_norm": 0.4595539891435698,
"learning_rate": 2.660354655209403e-05,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1777542382478714,
"step": 2100,
"valid_targets_mean": 4656.0,
"valid_targets_min": 1155
},
{
"epoch": 3.184568835098336,
"grad_norm": 0.5052944223699203,
"learning_rate": 2.653228434745746e-05,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19221368432044983,
"step": 2105,
"valid_targets_mean": 4579.3,
"valid_targets_min": 849
},
{
"epoch": 3.1921331316187596,
"grad_norm": 0.4365900032242633,
"learning_rate": 2.6460929185654106e-05,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16588276624679565,
"step": 2110,
"valid_targets_mean": 4732.4,
"valid_targets_min": 1479
},
{
"epoch": 3.1996974281391832,
"grad_norm": 0.38714216198205725,
"learning_rate": 2.6389482082098078e-05,
"loss": 0.1869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2058732509613037,
"step": 2115,
"valid_targets_mean": 6171.4,
"valid_targets_min": 1037
},
{
"epoch": 3.2072617246596065,
"grad_norm": 0.4664429065916817,
"learning_rate": 2.6317944053511853e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17922240495681763,
"step": 2120,
"valid_targets_mean": 4987.2,
"valid_targets_min": 922
},
{
"epoch": 3.21482602118003,
"grad_norm": 0.45793374742151755,
"learning_rate": 2.6246316117911804e-05,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18207323551177979,
"step": 2125,
"valid_targets_mean": 4121.9,
"valid_targets_min": 1004
},
{
"epoch": 3.222390317700454,
"grad_norm": 0.41559127939266016,
"learning_rate": 2.6174599294593738e-05,
"loss": 0.1664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15605135262012482,
"step": 2130,
"valid_targets_mean": 5834.4,
"valid_targets_min": 3253
},
{
"epoch": 3.2299546142208775,
"grad_norm": 0.4164323582327294,
"learning_rate": 2.6102794604118345e-05,
"loss": 0.1693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14102093875408173,
"step": 2135,
"valid_targets_mean": 4710.9,
"valid_targets_min": 372
},
{
"epoch": 3.237518910741301,
"grad_norm": 0.5017731025945408,
"learning_rate": 2.6030903068296724e-05,
"loss": 0.1804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2099505364894867,
"step": 2140,
"valid_targets_mean": 3947.9,
"valid_targets_min": 470
},
{
"epoch": 3.245083207261725,
"grad_norm": 0.47115821805759717,
"learning_rate": 2.5958925710175803e-05,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1678295135498047,
"step": 2145,
"valid_targets_mean": 4823.2,
"valid_targets_min": 970
},
{
"epoch": 3.252647503782148,
"grad_norm": 0.45159081763090103,
"learning_rate": 2.5886863554023807e-05,
"loss": 0.1891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15815192461013794,
"step": 2150,
"valid_targets_mean": 5319.1,
"valid_targets_min": 671
},
{
"epoch": 3.2602118003025717,
"grad_norm": 0.42568279295852773,
"learning_rate": 2.581471762531568e-05,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1752796769142151,
"step": 2155,
"valid_targets_mean": 5423.6,
"valid_targets_min": 1749
},
{
"epoch": 3.2677760968229954,
"grad_norm": 0.42884597917657213,
"learning_rate": 2.574248895071846e-05,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1902637481689453,
"step": 2160,
"valid_targets_mean": 5324.8,
"valid_targets_min": 2412
},
{
"epoch": 3.275340393343419,
"grad_norm": 0.40297700891719374,
"learning_rate": 2.5670178558076724e-05,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2010069340467453,
"step": 2165,
"valid_targets_mean": 5642.1,
"valid_targets_min": 582
},
{
"epoch": 3.2829046898638428,
"grad_norm": 0.39785109407004443,
"learning_rate": 2.5597787476397918e-05,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19962245225906372,
"step": 2170,
"valid_targets_mean": 6636.6,
"valid_targets_min": 637
},
{
"epoch": 3.2904689863842664,
"grad_norm": 0.4203008064142974,
"learning_rate": 2.5525316735837713e-05,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17891038954257965,
"step": 2175,
"valid_targets_mean": 4486.1,
"valid_targets_min": 664
},
{
"epoch": 3.29803328290469,
"grad_norm": 0.4649648211079789,
"learning_rate": 2.545276736768538e-05,
"loss": 0.1749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17492157220840454,
"step": 2180,
"valid_targets_mean": 4677.6,
"valid_targets_min": 635
},
{
"epoch": 3.3055975794251133,
"grad_norm": 0.483126836509343,
"learning_rate": 2.5380140404349094e-05,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2014307975769043,
"step": 2185,
"valid_targets_mean": 4459.1,
"valid_targets_min": 543
},
{
"epoch": 3.313161875945537,
"grad_norm": 0.4936867068007607,
"learning_rate": 2.5307436879341226e-05,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1675454080104828,
"step": 2190,
"valid_targets_mean": 3605.6,
"valid_targets_min": 473
},
{
"epoch": 3.3207261724659607,
"grad_norm": 0.41968907431035,
"learning_rate": 2.523465782726366e-05,
"loss": 0.1859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16863587498664856,
"step": 2195,
"valid_targets_mean": 4795.8,
"valid_targets_min": 919
},
{
"epoch": 3.3282904689863844,
"grad_norm": 0.4582209550444048,
"learning_rate": 2.5161804283793078e-05,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18313094973564148,
"step": 2200,
"valid_targets_mean": 4105.4,
"valid_targets_min": 486
},
{
"epoch": 3.335854765506808,
"grad_norm": 0.5132053187633295,
"learning_rate": 2.508887728566617e-05,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1868969351053238,
"step": 2205,
"valid_targets_mean": 4217.6,
"valid_targets_min": 648
},
{
"epoch": 3.3434190620272313,
"grad_norm": 0.4521820461040364,
"learning_rate": 2.5015877870664956e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1981300413608551,
"step": 2210,
"valid_targets_mean": 4518.8,
"valid_targets_min": 753
},
{
"epoch": 3.350983358547655,
"grad_norm": 0.46305852598208186,
"learning_rate": 2.494280707760195e-05,
"loss": 0.1996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23940429091453552,
"step": 2215,
"valid_targets_mean": 4959.1,
"valid_targets_min": 364
},
{
"epoch": 3.3585476550680786,
"grad_norm": 0.4555340985592675,
"learning_rate": 2.4869665946305416e-05,
"loss": 0.1745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17548419535160065,
"step": 2220,
"valid_targets_mean": 4283.8,
"valid_targets_min": 881
},
{
"epoch": 3.3661119515885023,
"grad_norm": 0.42662145474665314,
"learning_rate": 2.479645551760457e-05,
"loss": 0.176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17197197675704956,
"step": 2225,
"valid_targets_mean": 5630.0,
"valid_targets_min": 1287
},
{
"epoch": 3.373676248108926,
"grad_norm": 0.47357132814368386,
"learning_rate": 2.4723176833314746e-05,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22617679834365845,
"step": 2230,
"valid_targets_mean": 4526.4,
"valid_targets_min": 344
},
{
"epoch": 3.3812405446293496,
"grad_norm": 0.48402693776368155,
"learning_rate": 2.4649830936222587e-05,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20617449283599854,
"step": 2235,
"valid_targets_mean": 4520.4,
"valid_targets_min": 625
},
{
"epoch": 3.3888048411497733,
"grad_norm": 0.4224957696383896,
"learning_rate": 2.457641887007121e-05,
"loss": 0.1848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1821061074733734,
"step": 2240,
"valid_targets_mean": 5160.4,
"valid_targets_min": 502
},
{
"epoch": 3.3963691376701965,
"grad_norm": 0.7483855310876051,
"learning_rate": 2.4502941679545332e-05,
"loss": 0.1781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19686508178710938,
"step": 2245,
"valid_targets_mean": 4059.4,
"valid_targets_min": 565
},
{
"epoch": 3.40393343419062,
"grad_norm": 0.36065371648657907,
"learning_rate": 2.442940041025643e-05,
"loss": 0.163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16048836708068848,
"step": 2250,
"valid_targets_mean": 6123.6,
"valid_targets_min": 2298
},
{
"epoch": 3.411497730711044,
"grad_norm": 0.4624913171269963,
"learning_rate": 2.4355796108727847e-05,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20563645660877228,
"step": 2255,
"valid_targets_mean": 5261.8,
"valid_targets_min": 923
},
{
"epoch": 3.4190620272314676,
"grad_norm": 0.4389355151757325,
"learning_rate": 2.4282129822379896e-05,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18385478854179382,
"step": 2260,
"valid_targets_mean": 4616.0,
"valid_targets_min": 831
},
{
"epoch": 3.4266263237518912,
"grad_norm": 0.430635795414073,
"learning_rate": 2.4208402599514957e-05,
"loss": 0.178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17968051135540009,
"step": 2265,
"valid_targets_mean": 4419.5,
"valid_targets_min": 796
},
{
"epoch": 3.4341906202723145,
"grad_norm": 0.43408866333909196,
"learning_rate": 2.4134615489302577e-05,
"loss": 0.1823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17835617065429688,
"step": 2270,
"valid_targets_mean": 4954.6,
"valid_targets_min": 662
},
{
"epoch": 3.441754916792738,
"grad_norm": 0.38546381741261365,
"learning_rate": 2.4060769541764516e-05,
"loss": 0.1854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1849050521850586,
"step": 2275,
"valid_targets_mean": 5661.0,
"valid_targets_min": 924
},
{
"epoch": 3.449319213313162,
"grad_norm": 0.36932351801842705,
"learning_rate": 2.39868658077598e-05,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1613771617412567,
"step": 2280,
"valid_targets_mean": 5770.8,
"valid_targets_min": 3163
},
{
"epoch": 3.4568835098335855,
"grad_norm": 0.41601773727093444,
"learning_rate": 2.3912905338969815e-05,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19377577304840088,
"step": 2285,
"valid_targets_mean": 5156.2,
"valid_targets_min": 1963
},
{
"epoch": 3.464447806354009,
"grad_norm": 0.42662998952413006,
"learning_rate": 2.383888918788328e-05,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17014576494693756,
"step": 2290,
"valid_targets_mean": 4985.0,
"valid_targets_min": 1421
},
{
"epoch": 3.472012102874433,
"grad_norm": 0.4400712878742386,
"learning_rate": 2.37648184077813e-05,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17249350249767303,
"step": 2295,
"valid_targets_mean": 4962.9,
"valid_targets_min": 534
},
{
"epoch": 3.4795763993948565,
"grad_norm": 0.41166735172705915,
"learning_rate": 2.3690694052722384e-05,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17984776198863983,
"step": 2300,
"valid_targets_mean": 4898.3,
"valid_targets_min": 882
},
{
"epoch": 3.4871406959152798,
"grad_norm": 0.8846258046228039,
"learning_rate": 2.361651717752742e-05,
"loss": 0.1852,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19693221151828766,
"step": 2305,
"valid_targets_mean": 4449.8,
"valid_targets_min": 579
},
{
"epoch": 3.4947049924357034,
"grad_norm": 0.46403787630805754,
"learning_rate": 2.35422888377647e-05,
"loss": 0.1832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18936261534690857,
"step": 2310,
"valid_targets_mean": 4979.9,
"valid_targets_min": 678
},
{
"epoch": 3.502269288956127,
"grad_norm": 0.46099375157582895,
"learning_rate": 2.3468010089734854e-05,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23048534989356995,
"step": 2315,
"valid_targets_mean": 4629.5,
"valid_targets_min": 837
},
{
"epoch": 3.5098335854765508,
"grad_norm": 0.6381971347550925,
"learning_rate": 2.3393681990455877e-05,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16190201044082642,
"step": 2320,
"valid_targets_mean": 3028.9,
"valid_targets_min": 289
},
{
"epoch": 3.517397881996974,
"grad_norm": 0.42880307161777065,
"learning_rate": 2.331930559764801e-05,
"loss": 0.1755,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16737881302833557,
"step": 2325,
"valid_targets_mean": 4284.9,
"valid_targets_min": 642
},
{
"epoch": 3.5249621785173977,
"grad_norm": 0.4561996764949505,
"learning_rate": 2.3244881969718768e-05,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20272359251976013,
"step": 2330,
"valid_targets_mean": 4521.2,
"valid_targets_min": 543
},
{
"epoch": 3.5325264750378214,
"grad_norm": 0.4728536704189786,
"learning_rate": 2.317041216574782e-05,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19389662146568298,
"step": 2335,
"valid_targets_mean": 4810.5,
"valid_targets_min": 651
},
{
"epoch": 3.540090771558245,
"grad_norm": 0.40806576729419003,
"learning_rate": 2.309589724547195e-05,
"loss": 0.1757,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1756885051727295,
"step": 2340,
"valid_targets_mean": 5160.0,
"valid_targets_min": 860
},
{
"epoch": 3.5476550680786687,
"grad_norm": 0.4620549711410424,
"learning_rate": 2.3021338269269968e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1837664544582367,
"step": 2345,
"valid_targets_mean": 3869.1,
"valid_targets_min": 458
},
{
"epoch": 3.5552193645990924,
"grad_norm": 0.4565329021286906,
"learning_rate": 2.2946736298147605e-05,
"loss": 0.1847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20962950587272644,
"step": 2350,
"valid_targets_mean": 4646.9,
"valid_targets_min": 694
},
{
"epoch": 3.562783661119516,
"grad_norm": 0.467940605445892,
"learning_rate": 2.287209239372244e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17753881216049194,
"step": 2355,
"valid_targets_mean": 4308.3,
"valid_targets_min": 695
},
{
"epoch": 3.5703479576399397,
"grad_norm": 0.48279623085929807,
"learning_rate": 2.2797407618208784e-05,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19052711129188538,
"step": 2360,
"valid_targets_mean": 3844.9,
"valid_targets_min": 658
},
{
"epoch": 3.577912254160363,
"grad_norm": 0.4593538362268239,
"learning_rate": 2.2722683034402543e-05,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1733306348323822,
"step": 2365,
"valid_targets_mean": 4635.1,
"valid_targets_min": 614
},
{
"epoch": 3.5854765506807866,
"grad_norm": 0.4544985432412134,
"learning_rate": 2.264791970566613e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18841543793678284,
"step": 2370,
"valid_targets_mean": 4705.8,
"valid_targets_min": 879
},
{
"epoch": 3.5930408472012103,
"grad_norm": 0.45753745132477175,
"learning_rate": 2.2573118695913303e-05,
"loss": 0.1773,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19560250639915466,
"step": 2375,
"valid_targets_mean": 4873.1,
"valid_targets_min": 660
},
{
"epoch": 3.600605143721634,
"grad_norm": 0.443248808335626,
"learning_rate": 2.2498281069594045e-05,
"loss": 0.1818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20620426535606384,
"step": 2380,
"valid_targets_mean": 5684.8,
"valid_targets_min": 502
},
{
"epoch": 3.608169440242057,
"grad_norm": 0.4440169248740688,
"learning_rate": 2.2423407891679405e-05,
"loss": 0.1894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17821472883224487,
"step": 2385,
"valid_targets_mean": 4816.6,
"valid_targets_min": 881
},
{
"epoch": 3.615733736762481,
"grad_norm": 0.3915151274706588,
"learning_rate": 2.2348500227646347e-05,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17493531107902527,
"step": 2390,
"valid_targets_mean": 5246.4,
"valid_targets_min": 789
},
{
"epoch": 3.6232980332829046,
"grad_norm": 0.43570753821263747,
"learning_rate": 2.2273559143462574e-05,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1876915693283081,
"step": 2395,
"valid_targets_mean": 4848.5,
"valid_targets_min": 721
},
{
"epoch": 3.6308623298033282,
"grad_norm": 0.43800373462337433,
"learning_rate": 2.21985857055714e-05,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16755543649196625,
"step": 2400,
"valid_targets_mean": 4680.5,
"valid_targets_min": 540
},
{
"epoch": 3.638426626323752,
"grad_norm": 0.38868595481400137,
"learning_rate": 2.212358098087652e-05,
"loss": 0.2099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1818462312221527,
"step": 2405,
"valid_targets_mean": 5988.6,
"valid_targets_min": 2237
},
{
"epoch": 3.6459909228441756,
"grad_norm": 0.38746154157768226,
"learning_rate": 2.2048546036726867e-05,
"loss": 0.1812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18854598701000214,
"step": 2410,
"valid_targets_mean": 5940.6,
"valid_targets_min": 650
},
{
"epoch": 3.6535552193645993,
"grad_norm": 0.4176036178181955,
"learning_rate": 2.1973481940901403e-05,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15259526669979095,
"step": 2415,
"valid_targets_mean": 4415.6,
"valid_targets_min": 470
},
{
"epoch": 3.661119515885023,
"grad_norm": 0.41410661612753646,
"learning_rate": 2.1898389761593933e-05,
"loss": 0.1782,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17064417898654938,
"step": 2420,
"valid_targets_mean": 5270.3,
"valid_targets_min": 2559
},
{
"epoch": 3.668683812405446,
"grad_norm": 0.48834300834228367,
"learning_rate": 2.1823270567397908e-05,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18752998113632202,
"step": 2425,
"valid_targets_mean": 4708.6,
"valid_targets_min": 681
},
{
"epoch": 3.67624810892587,
"grad_norm": 0.4696483622125557,
"learning_rate": 2.1748125427291203e-05,
"loss": 0.1689,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16924205422401428,
"step": 2430,
"valid_targets_mean": 4393.2,
"valid_targets_min": 345
},
{
"epoch": 3.6838124054462935,
"grad_norm": 0.4987791009849064,
"learning_rate": 2.1672955410620916e-05,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16017551720142365,
"step": 2435,
"valid_targets_mean": 4371.1,
"valid_targets_min": 535
},
{
"epoch": 3.691376701966717,
"grad_norm": 0.4325171641316711,
"learning_rate": 2.1597761587088146e-05,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17629767954349518,
"step": 2440,
"valid_targets_mean": 4894.4,
"valid_targets_min": 883
},
{
"epoch": 3.6989409984871404,
"grad_norm": 0.4736685289222699,
"learning_rate": 2.1522545026732793e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14739350974559784,
"step": 2445,
"valid_targets_mean": 4710.0,
"valid_targets_min": 848
},
{
"epoch": 3.706505295007564,
"grad_norm": 0.4512152628668887,
"learning_rate": 2.1447306799918285e-05,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16980385780334473,
"step": 2450,
"valid_targets_mean": 5042.8,
"valid_targets_min": 789
},
{
"epoch": 3.7140695915279878,
"grad_norm": 0.4576435044941357,
"learning_rate": 2.137204797731638e-05,
"loss": 0.1767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1822136491537094,
"step": 2455,
"valid_targets_mean": 5460.8,
"valid_targets_min": 697
},
{
"epoch": 3.7216338880484114,
"grad_norm": 0.4631213031026051,
"learning_rate": 2.1296769629891946e-05,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19493688642978668,
"step": 2460,
"valid_targets_mean": 4408.8,
"valid_targets_min": 779
},
{
"epoch": 3.729198184568835,
"grad_norm": 0.37665036712818883,
"learning_rate": 2.1221472828887672e-05,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16041424870491028,
"step": 2465,
"valid_targets_mean": 5879.9,
"valid_targets_min": 1259
},
{
"epoch": 3.736762481089259,
"grad_norm": 0.4179212731663629,
"learning_rate": 2.1146158645808845e-05,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18884560465812683,
"step": 2470,
"valid_targets_mean": 5352.8,
"valid_targets_min": 2763
},
{
"epoch": 3.7443267776096825,
"grad_norm": 0.41500424559921534,
"learning_rate": 2.107082815240813e-05,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15109623968601227,
"step": 2475,
"valid_targets_mean": 5304.8,
"valid_targets_min": 1296
},
{
"epoch": 3.751891074130106,
"grad_norm": 0.48903761793465,
"learning_rate": 2.099548242067028e-05,
"loss": 0.1848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1728041172027588,
"step": 2480,
"valid_targets_mean": 3551.8,
"valid_targets_min": 732
},
{
"epoch": 3.7594553706505294,
"grad_norm": 0.3925523813669197,
"learning_rate": 2.0920122522796894e-05,
"loss": 0.181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1809263825416565,
"step": 2485,
"valid_targets_mean": 5726.9,
"valid_targets_min": 1075
},
{
"epoch": 3.767019667170953,
"grad_norm": 0.3811307614768285,
"learning_rate": 2.0844749531191164e-05,
"loss": 0.184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17140492796897888,
"step": 2490,
"valid_targets_mean": 5197.9,
"valid_targets_min": 706
},
{
"epoch": 3.7745839636913767,
"grad_norm": 0.4723320494664942,
"learning_rate": 2.076936451844263e-05,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20417089760303497,
"step": 2495,
"valid_targets_mean": 5198.6,
"valid_targets_min": 808
},
{
"epoch": 3.7821482602118004,
"grad_norm": 0.4735562331191886,
"learning_rate": 2.0693968557311858e-05,
"loss": 0.1901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1843431442975998,
"step": 2500,
"valid_targets_mean": 4259.9,
"valid_targets_min": 586
},
{
"epoch": 3.789712556732224,
"grad_norm": 0.46605787164924223,
"learning_rate": 2.061856272071525e-05,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1783793866634369,
"step": 2505,
"valid_targets_mean": 4357.8,
"valid_targets_min": 709
},
{
"epoch": 3.7972768532526473,
"grad_norm": 0.4258832263694262,
"learning_rate": 2.0543148081709726e-05,
"loss": 0.1914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18057414889335632,
"step": 2510,
"valid_targets_mean": 5267.4,
"valid_targets_min": 797
},
{
"epoch": 3.804841149773071,
"grad_norm": 0.4403025638542816,
"learning_rate": 2.0467725713477463e-05,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22269657254219055,
"step": 2515,
"valid_targets_mean": 5570.6,
"valid_targets_min": 956
},
{
"epoch": 3.8124054462934946,
"grad_norm": 0.42145758561605795,
"learning_rate": 2.0392296689310646e-05,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1556507647037506,
"step": 2520,
"valid_targets_mean": 4532.9,
"valid_targets_min": 844
},
{
"epoch": 3.8199697428139183,
"grad_norm": 0.45716031065040713,
"learning_rate": 2.0316862082596153e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17538976669311523,
"step": 2525,
"valid_targets_mean": 5158.4,
"valid_targets_min": 922
},
{
"epoch": 3.827534039334342,
"grad_norm": 0.47592674209274544,
"learning_rate": 2.024142296680032e-05,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19242042303085327,
"step": 2530,
"valid_targets_mean": 4368.2,
"valid_targets_min": 559
},
{
"epoch": 3.8350983358547657,
"grad_norm": 0.4216297325551423,
"learning_rate": 2.0165980415453643e-05,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18463507294654846,
"step": 2535,
"valid_targets_mean": 4899.9,
"valid_targets_min": 951
},
{
"epoch": 3.8426626323751893,
"grad_norm": 0.408114244972223,
"learning_rate": 2.0090535502135516e-05,
"loss": 0.1833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18673035502433777,
"step": 2540,
"valid_targets_mean": 4995.6,
"valid_targets_min": 499
},
{
"epoch": 3.8502269288956126,
"grad_norm": 0.4559095603030895,
"learning_rate": 2.0015089300458928e-05,
"loss": 0.1754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18540602922439575,
"step": 2545,
"valid_targets_mean": 4267.0,
"valid_targets_min": 482
},
{
"epoch": 3.8577912254160363,
"grad_norm": 0.43246068560103573,
"learning_rate": 1.9939642884055215e-05,
"loss": 0.1781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1851813793182373,
"step": 2550,
"valid_targets_mean": 5570.6,
"valid_targets_min": 1990
},
{
"epoch": 3.86535552193646,
"grad_norm": 0.40837587717862334,
"learning_rate": 1.9864197326558784e-05,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17242997884750366,
"step": 2555,
"valid_targets_mean": 4821.5,
"valid_targets_min": 1103
},
{
"epoch": 3.8729198184568836,
"grad_norm": 0.526014027378549,
"learning_rate": 1.9788753701591767e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17967309057712555,
"step": 2560,
"valid_targets_mean": 4044.2,
"valid_targets_min": 538
},
{
"epoch": 3.8804841149773073,
"grad_norm": 0.43157336608044927,
"learning_rate": 1.9713313082748867e-05,
"loss": 0.19,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18985623121261597,
"step": 2565,
"valid_targets_mean": 4637.7,
"valid_targets_min": 456
},
{
"epoch": 3.8880484114977305,
"grad_norm": 0.4159194231850038,
"learning_rate": 1.963787654358194e-05,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18229806423187256,
"step": 2570,
"valid_targets_mean": 5123.1,
"valid_targets_min": 702
},
{
"epoch": 3.895612708018154,
"grad_norm": 0.45085006380846965,
"learning_rate": 1.9562445157584826e-05,
"loss": 0.1699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19042447209358215,
"step": 2575,
"valid_targets_mean": 4716.1,
"valid_targets_min": 717
},
{
"epoch": 3.903177004538578,
"grad_norm": 0.43137412386375706,
"learning_rate": 1.9487019998178042e-05,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18286067247390747,
"step": 2580,
"valid_targets_mean": 4466.0,
"valid_targets_min": 940
},
{
"epoch": 3.9107413010590015,
"grad_norm": 0.4965792101957091,
"learning_rate": 1.9411602138693457e-05,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18717160820960999,
"step": 2585,
"valid_targets_mean": 6286.9,
"valid_targets_min": 1458
},
{
"epoch": 3.918305597579425,
"grad_norm": 0.6490298129257558,
"learning_rate": 1.9336192652359088e-05,
"loss": 0.1779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16575998067855835,
"step": 2590,
"valid_targets_mean": 5423.4,
"valid_targets_min": 802
},
{
"epoch": 3.925869894099849,
"grad_norm": 0.4383331497273429,
"learning_rate": 1.9260792612283816e-05,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16938605904579163,
"step": 2595,
"valid_targets_mean": 4913.7,
"valid_targets_min": 1531
},
{
"epoch": 3.9334341906202726,
"grad_norm": 0.49828779485449154,
"learning_rate": 1.9185403091442044e-05,
"loss": 0.1799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18119296431541443,
"step": 2600,
"valid_targets_mean": 3814.1,
"valid_targets_min": 468
},
{
"epoch": 3.940998487140696,
"grad_norm": 0.49147145967933253,
"learning_rate": 1.9110025162658522e-05,
"loss": 0.1825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17999988794326782,
"step": 2605,
"valid_targets_mean": 4321.2,
"valid_targets_min": 537
},
{
"epoch": 3.9485627836611195,
"grad_norm": 0.4221075762512994,
"learning_rate": 1.903465989859305e-05,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1725933998823166,
"step": 2610,
"valid_targets_mean": 4869.0,
"valid_targets_min": 929
},
{
"epoch": 3.956127080181543,
"grad_norm": 0.4345597802764291,
"learning_rate": 1.8959308371725157e-05,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1820940226316452,
"step": 2615,
"valid_targets_mean": 4674.4,
"valid_targets_min": 611
},
{
"epoch": 3.963691376701967,
"grad_norm": 0.4692245197589479,
"learning_rate": 1.8883971654338927e-05,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18120905756950378,
"step": 2620,
"valid_targets_mean": 4830.3,
"valid_targets_min": 714
},
{
"epoch": 3.9712556732223905,
"grad_norm": 0.3967835982808758,
"learning_rate": 1.8808650818507695e-05,
"loss": 0.186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17867086827754974,
"step": 2625,
"valid_targets_mean": 5038.8,
"valid_targets_min": 2633
},
{
"epoch": 3.9788199697428137,
"grad_norm": 0.44838758067100143,
"learning_rate": 1.8733346936078768e-05,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16222552955150604,
"step": 2630,
"valid_targets_mean": 5533.2,
"valid_targets_min": 824
},
{
"epoch": 3.9863842662632374,
"grad_norm": 0.48431745535271226,
"learning_rate": 1.8658061078658224e-05,
"loss": 0.1855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1916062831878662,
"step": 2635,
"valid_targets_mean": 4110.4,
"valid_targets_min": 627
},
{
"epoch": 3.993948562783661,
"grad_norm": 0.47680301163534866,
"learning_rate": 1.8582794317595628e-05,
"loss": 0.1743,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1811482459306717,
"step": 2640,
"valid_targets_mean": 4020.2,
"valid_targets_min": 663
},
{
"epoch": 4.001512859304085,
"grad_norm": 0.46463818534745904,
"learning_rate": 1.8507547723968795e-05,
"loss": 0.1803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16638009250164032,
"step": 2645,
"valid_targets_mean": 3962.8,
"valid_targets_min": 522
},
{
"epoch": 4.009077155824508,
"grad_norm": 0.41554851090079853,
"learning_rate": 1.8432322368568562e-05,
"loss": 0.1643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16338765621185303,
"step": 2650,
"valid_targets_mean": 4404.9,
"valid_targets_min": 843
},
{
"epoch": 4.016641452344932,
"grad_norm": 0.5770464302701627,
"learning_rate": 1.835711932188351e-05,
"loss": 0.1812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18008169531822205,
"step": 2655,
"valid_targets_mean": 3572.7,
"valid_targets_min": 642
},
{
"epoch": 4.024205748865356,
"grad_norm": 0.4525771024595579,
"learning_rate": 1.8281939654084783e-05,
"loss": 0.1692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17555324733257294,
"step": 2660,
"valid_targets_mean": 5826.1,
"valid_targets_min": 321
},
{
"epoch": 4.031770045385779,
"grad_norm": 0.3758422902364508,
"learning_rate": 1.820678443501083e-05,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13354334235191345,
"step": 2665,
"valid_targets_mean": 5234.1,
"valid_targets_min": 941
},
{
"epoch": 4.039334341906203,
"grad_norm": 0.48385102695876686,
"learning_rate": 1.8131654734152165e-05,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16652946174144745,
"step": 2670,
"valid_targets_mean": 4157.3,
"valid_targets_min": 726
},
{
"epoch": 4.046898638426626,
"grad_norm": 0.41464631491138004,
"learning_rate": 1.805655162063619e-05,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17274890840053558,
"step": 2675,
"valid_targets_mean": 5395.8,
"valid_targets_min": 924
},
{
"epoch": 4.05446293494705,
"grad_norm": 0.3576877331596476,
"learning_rate": 1.798147616321195e-05,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14228424429893494,
"step": 2680,
"valid_targets_mean": 6599.6,
"valid_targets_min": 3450
},
{
"epoch": 4.062027231467473,
"grad_norm": 0.42216558468027454,
"learning_rate": 1.7906429430234927e-05,
"loss": 0.1742,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1685303896665573,
"step": 2685,
"valid_targets_mean": 5240.1,
"valid_targets_min": 849
},
{
"epoch": 4.069591527987897,
"grad_norm": 0.43009627202726336,
"learning_rate": 1.783141248965184e-05,
"loss": 0.1638,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13526831567287445,
"step": 2690,
"valid_targets_mean": 5489.6,
"valid_targets_min": 1941
},
{
"epoch": 4.077155824508321,
"grad_norm": 0.44577441502625953,
"learning_rate": 1.775642640898547e-05,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14539185166358948,
"step": 2695,
"valid_targets_mean": 4562.2,
"valid_targets_min": 514
},
{
"epoch": 4.084720121028744,
"grad_norm": 0.4644816906536246,
"learning_rate": 1.7681472255319417e-05,
"loss": 0.1692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16671213507652283,
"step": 2700,
"valid_targets_mean": 4358.8,
"valid_targets_min": 768
},
{
"epoch": 4.092284417549168,
"grad_norm": 0.4876809684009793,
"learning_rate": 1.7606551095282978e-05,
"loss": 0.1753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1734774261713028,
"step": 2705,
"valid_targets_mean": 3740.9,
"valid_targets_min": 423
},
{
"epoch": 4.099848714069592,
"grad_norm": 0.38721781374833864,
"learning_rate": 1.753166399503591e-05,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15614727139472961,
"step": 2710,
"valid_targets_mean": 5812.4,
"valid_targets_min": 1874
},
{
"epoch": 4.107413010590015,
"grad_norm": 0.4989057932943494,
"learning_rate": 1.74568120202533e-05,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21545648574829102,
"step": 2715,
"valid_targets_mean": 4326.6,
"valid_targets_min": 913
},
{
"epoch": 4.114977307110439,
"grad_norm": 0.5034602177391847,
"learning_rate": 1.7381996236110386e-05,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17472974956035614,
"step": 2720,
"valid_targets_mean": 3635.9,
"valid_targets_min": 586
},
{
"epoch": 4.122541603630863,
"grad_norm": 0.9829745879005233,
"learning_rate": 1.730721770726739e-05,
"loss": 0.1674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1908668577671051,
"step": 2725,
"valid_targets_mean": 4817.6,
"valid_targets_min": 944
},
{
"epoch": 4.130105900151286,
"grad_norm": 0.526475392969517,
"learning_rate": 1.7232477497854377e-05,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16699153184890747,
"step": 2730,
"valid_targets_mean": 3689.2,
"valid_targets_min": 956
},
{
"epoch": 4.13767019667171,
"grad_norm": 0.5000977100526197,
"learning_rate": 1.7157776671456114e-05,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1865454614162445,
"step": 2735,
"valid_targets_mean": 3762.7,
"valid_targets_min": 391
},
{
"epoch": 4.145234493192133,
"grad_norm": 0.4234081246667148,
"learning_rate": 1.7083116291096926e-05,
"loss": 0.1682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1912594586610794,
"step": 2740,
"valid_targets_mean": 5724.4,
"valid_targets_min": 1161
},
{
"epoch": 4.1527987897125564,
"grad_norm": 0.41678834278096616,
"learning_rate": 1.7008497419225578e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16795726120471954,
"step": 2745,
"valid_targets_mean": 5573.5,
"valid_targets_min": 496
},
{
"epoch": 4.16036308623298,
"grad_norm": 0.4621994786376751,
"learning_rate": 1.6933921117700156e-05,
"loss": 0.1691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18064820766448975,
"step": 2750,
"valid_targets_mean": 4568.9,
"valid_targets_min": 773
},
{
"epoch": 4.167927382753404,
"grad_norm": 0.4826289668834577,
"learning_rate": 1.6859388447772936e-05,
"loss": 0.1819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17181620001792908,
"step": 2755,
"valid_targets_mean": 4864.2,
"valid_targets_min": 932
},
{
"epoch": 4.1754916792738275,
"grad_norm": 0.6397951450093655,
"learning_rate": 1.6784900470075312e-05,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1756332814693451,
"step": 2760,
"valid_targets_mean": 3957.1,
"valid_targets_min": 767
},
{
"epoch": 4.183055975794251,
"grad_norm": 0.44994217785156254,
"learning_rate": 1.6710458244602695e-05,
"loss": 0.1703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15611310303211212,
"step": 2765,
"valid_targets_mean": 4696.2,
"valid_targets_min": 736
},
{
"epoch": 4.190620272314675,
"grad_norm": 0.4237563016526201,
"learning_rate": 1.66360628306994e-05,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1666485220193863,
"step": 2770,
"valid_targets_mean": 5272.4,
"valid_targets_min": 753
},
{
"epoch": 4.1981845688350985,
"grad_norm": 0.5395432298525558,
"learning_rate": 1.656171528704361e-05,
"loss": 0.1824,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17594173550605774,
"step": 2775,
"valid_targets_mean": 3776.5,
"valid_targets_min": 620
},
{
"epoch": 4.205748865355522,
"grad_norm": 0.5832213537978989,
"learning_rate": 1.648741667163229e-05,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17744117975234985,
"step": 2780,
"valid_targets_mean": 3303.4,
"valid_targets_min": 583
},
{
"epoch": 4.213313161875946,
"grad_norm": 0.5256449374178925,
"learning_rate": 1.641316804176613e-05,
"loss": 0.1647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16040672361850739,
"step": 2785,
"valid_targets_mean": 3447.4,
"valid_targets_min": 519
},
{
"epoch": 4.2208774583963695,
"grad_norm": 0.5028188639011574,
"learning_rate": 1.6338970454034527e-05,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17807036638259888,
"step": 2790,
"valid_targets_mean": 4636.7,
"valid_targets_min": 787
},
{
"epoch": 4.228441754916792,
"grad_norm": 0.4997025752135004,
"learning_rate": 1.626482496430049e-05,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1678473949432373,
"step": 2795,
"valid_targets_mean": 4014.8,
"valid_targets_min": 442
},
{
"epoch": 4.236006051437216,
"grad_norm": 0.45565425172448304,
"learning_rate": 1.6190732627685686e-05,
"loss": 0.1848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16583865880966187,
"step": 2800,
"valid_targets_mean": 4589.2,
"valid_targets_min": 405
},
{
"epoch": 4.24357034795764,
"grad_norm": 0.4025133264233328,
"learning_rate": 1.611669449855537e-05,
"loss": 0.1678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16866248846054077,
"step": 2805,
"valid_targets_mean": 5671.2,
"valid_targets_min": 711
},
{
"epoch": 4.251134644478063,
"grad_norm": 0.48967416716184,
"learning_rate": 1.6042711630503406e-05,
"loss": 0.1886,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16977915167808533,
"step": 2810,
"valid_targets_mean": 4551.2,
"valid_targets_min": 514
},
{
"epoch": 4.258698940998487,
"grad_norm": 0.44902519039938005,
"learning_rate": 1.5968785076337273e-05,
"loss": 0.1732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1602228879928589,
"step": 2815,
"valid_targets_mean": 4892.4,
"valid_targets_min": 526
},
{
"epoch": 4.266263237518911,
"grad_norm": 0.5206132784127442,
"learning_rate": 1.5894915888063085e-05,
"loss": 0.1695,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19216004014015198,
"step": 2820,
"valid_targets_mean": 3800.8,
"valid_targets_min": 552
},
{
"epoch": 4.273827534039334,
"grad_norm": 0.4447385592944839,
"learning_rate": 1.5821105116870594e-05,
"loss": 0.1714,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15732452273368835,
"step": 2825,
"valid_targets_mean": 4333.0,
"valid_targets_min": 694
},
{
"epoch": 4.281391830559758,
"grad_norm": 0.4279569711895869,
"learning_rate": 1.5747353813118276e-05,
"loss": 0.1674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1582874357700348,
"step": 2830,
"valid_targets_mean": 4712.3,
"valid_targets_min": 614
},
{
"epoch": 4.288956127080182,
"grad_norm": 0.5213550677478702,
"learning_rate": 1.567366302631835e-05,
"loss": 0.161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16362854838371277,
"step": 2835,
"valid_targets_mean": 4576.0,
"valid_targets_min": 776
},
{
"epoch": 4.296520423600605,
"grad_norm": 0.47091022792617493,
"learning_rate": 1.560003380512185e-05,
"loss": 0.1667,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.168619304895401,
"step": 2840,
"valid_targets_mean": 4807.8,
"valid_targets_min": 547
},
{
"epoch": 4.304084720121029,
"grad_norm": 0.47159810197254937,
"learning_rate": 1.5526467197303715e-05,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.182538241147995,
"step": 2845,
"valid_targets_mean": 4528.5,
"valid_targets_min": 780
},
{
"epoch": 4.311649016641453,
"grad_norm": 0.47889319712753947,
"learning_rate": 1.5452964249747848e-05,
"loss": 0.1761,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14952681958675385,
"step": 2850,
"valid_targets_mean": 4010.2,
"valid_targets_min": 730
},
{
"epoch": 4.319213313161876,
"grad_norm": 0.4256664007842176,
"learning_rate": 1.537952600843227e-05,
"loss": 0.1511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14827358722686768,
"step": 2855,
"valid_targets_mean": 4466.1,
"valid_targets_min": 716
},
{
"epoch": 4.326777609682299,
"grad_norm": 0.40977956425276274,
"learning_rate": 1.5306153518414197e-05,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15310370922088623,
"step": 2860,
"valid_targets_mean": 5170.0,
"valid_targets_min": 332
},
{
"epoch": 4.334341906202723,
"grad_norm": 0.462683167593508,
"learning_rate": 1.523284782381514e-05,
"loss": 0.1454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14999224245548248,
"step": 2865,
"valid_targets_mean": 5006.0,
"valid_targets_min": 239
},
{
"epoch": 4.3419062027231465,
"grad_norm": 0.45878776063067306,
"learning_rate": 1.5159609967806135e-05,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.185188889503479,
"step": 2870,
"valid_targets_mean": 4822.1,
"valid_targets_min": 1063
},
{
"epoch": 4.34947049924357,
"grad_norm": 0.41643746040516816,
"learning_rate": 1.5086440992592826e-05,
"loss": 0.176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15771910548210144,
"step": 2875,
"valid_targets_mean": 5071.6,
"valid_targets_min": 614
},
{
"epoch": 4.357034795763994,
"grad_norm": 0.4803323187058902,
"learning_rate": 1.5013341939400628e-05,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18151001632213593,
"step": 2880,
"valid_targets_mean": 4068.4,
"valid_targets_min": 506
},
{
"epoch": 4.364599092284418,
"grad_norm": 0.49357279196784626,
"learning_rate": 1.4940313848459975e-05,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16743910312652588,
"step": 2885,
"valid_targets_mean": 4971.4,
"valid_targets_min": 899
},
{
"epoch": 4.372163388804841,
"grad_norm": 0.47252098051012686,
"learning_rate": 1.4867357758991474e-05,
"loss": 0.1707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18773172795772552,
"step": 2890,
"valid_targets_mean": 5009.6,
"valid_targets_min": 506
},
{
"epoch": 4.379727685325265,
"grad_norm": 0.4343325194878802,
"learning_rate": 1.4794474709191082e-05,
"loss": 0.1634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1580682247877121,
"step": 2895,
"valid_targets_mean": 5471.8,
"valid_targets_min": 474
},
{
"epoch": 4.387291981845689,
"grad_norm": 0.6607347840108052,
"learning_rate": 1.4721665736215416e-05,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17931993305683136,
"step": 2900,
"valid_targets_mean": 5108.2,
"valid_targets_min": 905
},
{
"epoch": 4.394856278366112,
"grad_norm": 0.4590615908212395,
"learning_rate": 1.4648931876166931e-05,
"loss": 0.1764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1773712933063507,
"step": 2905,
"valid_targets_mean": 4593.6,
"valid_targets_min": 717
},
{
"epoch": 4.402420574886536,
"grad_norm": 0.45820730146428945,
"learning_rate": 1.4576274164079183e-05,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1603582799434662,
"step": 2910,
"valid_targets_mean": 4533.9,
"valid_targets_min": 524
},
{
"epoch": 4.409984871406959,
"grad_norm": 0.5249917435247164,
"learning_rate": 1.4503693633902128e-05,
"loss": 0.1682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20168936252593994,
"step": 2915,
"valid_targets_mean": 4979.8,
"valid_targets_min": 2321
},
{
"epoch": 4.417549167927382,
"grad_norm": 0.4815350204188176,
"learning_rate": 1.4431191318487372e-05,
"loss": 0.1661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16469869017601013,
"step": 2920,
"valid_targets_mean": 4120.6,
"valid_targets_min": 652
},
{
"epoch": 4.425113464447806,
"grad_norm": 0.4797606831091243,
"learning_rate": 1.4358768249573514e-05,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17197684943675995,
"step": 2925,
"valid_targets_mean": 4215.9,
"valid_targets_min": 660
},
{
"epoch": 4.43267776096823,
"grad_norm": 0.43573686034480597,
"learning_rate": 1.4286425457771427e-05,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17867511510849,
"step": 2930,
"valid_targets_mean": 5221.4,
"valid_targets_min": 2249
},
{
"epoch": 4.440242057488653,
"grad_norm": 0.41672734352822066,
"learning_rate": 1.4214163972549604e-05,
"loss": 0.1517,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13659437000751495,
"step": 2935,
"valid_targets_mean": 5257.1,
"valid_targets_min": 2090
},
{
"epoch": 4.447806354009077,
"grad_norm": 0.48856441504073617,
"learning_rate": 1.4141984822219521e-05,
"loss": 0.1657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15636491775512695,
"step": 2940,
"valid_targets_mean": 4395.1,
"valid_targets_min": 600
},
{
"epoch": 4.455370650529501,
"grad_norm": 0.4772725352943584,
"learning_rate": 1.4069889033920998e-05,
"loss": 0.1797,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20085512101650238,
"step": 2945,
"valid_targets_mean": 4495.1,
"valid_targets_min": 607
},
{
"epoch": 4.462934947049924,
"grad_norm": 0.42051910317593916,
"learning_rate": 1.3997877633607557e-05,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16399016976356506,
"step": 2950,
"valid_targets_mean": 5878.0,
"valid_targets_min": 869
},
{
"epoch": 4.470499243570348,
"grad_norm": 0.42806628012013004,
"learning_rate": 1.3925951646031864e-05,
"loss": 0.1823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17599345743656158,
"step": 2955,
"valid_targets_mean": 5046.3,
"valid_targets_min": 900
},
{
"epoch": 4.478063540090772,
"grad_norm": 0.3960989399268624,
"learning_rate": 1.3854112094731116e-05,
"loss": 0.1643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16925032436847687,
"step": 2960,
"valid_targets_mean": 6420.0,
"valid_targets_min": 1942
},
{
"epoch": 4.4856278366111955,
"grad_norm": 0.46152209852293663,
"learning_rate": 1.3782360002012485e-05,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14222872257232666,
"step": 2965,
"valid_targets_mean": 4932.2,
"valid_targets_min": 2050
},
{
"epoch": 4.493192133131619,
"grad_norm": 0.4611561798527351,
"learning_rate": 1.3710696388938574e-05,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17129528522491455,
"step": 2970,
"valid_targets_mean": 4561.2,
"valid_targets_min": 493
},
{
"epoch": 4.500756429652043,
"grad_norm": 0.5236948649019548,
"learning_rate": 1.3639122275312886e-05,
"loss": 0.1605,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1523115336894989,
"step": 2975,
"valid_targets_mean": 4292.9,
"valid_targets_min": 732
},
{
"epoch": 4.508320726172466,
"grad_norm": 0.49450938589759885,
"learning_rate": 1.3567638679665296e-05,
"loss": 0.173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17702379822731018,
"step": 2980,
"valid_targets_mean": 4186.6,
"valid_targets_min": 575
},
{
"epoch": 4.515885022692889,
"grad_norm": 0.43334140448201086,
"learning_rate": 1.3496246619237585e-05,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17083197832107544,
"step": 2985,
"valid_targets_mean": 5292.4,
"valid_targets_min": 1003
},
{
"epoch": 4.523449319213313,
"grad_norm": 0.472497861189218,
"learning_rate": 1.3424947109968944e-05,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16844433546066284,
"step": 2990,
"valid_targets_mean": 4980.1,
"valid_targets_min": 738
},
{
"epoch": 4.531013615733737,
"grad_norm": 0.49098116229371497,
"learning_rate": 1.3353741166481515e-05,
"loss": 0.168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15978705883026123,
"step": 2995,
"valid_targets_mean": 4352.1,
"valid_targets_min": 1871
},
{
"epoch": 4.53857791225416,
"grad_norm": 0.4383059631684414,
"learning_rate": 1.3282629802065974e-05,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16577211022377014,
"step": 3000,
"valid_targets_mean": 5097.1,
"valid_targets_min": 970
},
{
"epoch": 4.546142208774584,
"grad_norm": 0.45601726097153666,
"learning_rate": 1.3211614028667077e-05,
"loss": 0.1843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2073879837989807,
"step": 3005,
"valid_targets_mean": 4979.4,
"valid_targets_min": 723
},
{
"epoch": 4.553706505295008,
"grad_norm": 0.4059819676532039,
"learning_rate": 1.3140694856869297e-05,
"loss": 0.1584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14776208996772766,
"step": 3010,
"valid_targets_mean": 5175.5,
"valid_targets_min": 1354
},
{
"epoch": 4.561270801815431,
"grad_norm": 0.50274521759109,
"learning_rate": 1.306987329588242e-05,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16442856192588806,
"step": 3015,
"valid_targets_mean": 4776.6,
"valid_targets_min": 913
},
{
"epoch": 4.568835098335855,
"grad_norm": 0.4264689299807262,
"learning_rate": 1.2999150353527182e-05,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16325069963932037,
"step": 3020,
"valid_targets_mean": 4675.2,
"valid_targets_min": 167
},
{
"epoch": 4.576399394856279,
"grad_norm": 0.4440378341428616,
"learning_rate": 1.2928527036220944e-05,
"loss": 0.1645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1781526505947113,
"step": 3025,
"valid_targets_mean": 4669.3,
"valid_targets_min": 881
},
{
"epoch": 4.583963691376702,
"grad_norm": 0.44802586160013663,
"learning_rate": 1.285800434896336e-05,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1558399349451065,
"step": 3030,
"valid_targets_mean": 5058.0,
"valid_targets_min": 579
},
{
"epoch": 4.591527987897125,
"grad_norm": 0.4382924500174268,
"learning_rate": 1.2787583295322063e-05,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12798433005809784,
"step": 3035,
"valid_targets_mean": 4102.2,
"valid_targets_min": 372
},
{
"epoch": 4.599092284417549,
"grad_norm": 0.495690878784159,
"learning_rate": 1.2717264877418409e-05,
"loss": 0.1663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16291014850139618,
"step": 3040,
"valid_targets_mean": 4889.7,
"valid_targets_min": 1085
},
{
"epoch": 4.6066565809379725,
"grad_norm": 0.4139498162424246,
"learning_rate": 1.2647050095913211e-05,
"loss": 0.1665,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1578187495470047,
"step": 3045,
"valid_targets_mean": 5494.0,
"valid_targets_min": 1253
},
{
"epoch": 4.614220877458396,
"grad_norm": 0.47999890638951775,
"learning_rate": 1.2576939949992468e-05,
"loss": 0.1628,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1848933845758438,
"step": 3050,
"valid_targets_mean": 4716.2,
"valid_targets_min": 760
},
{
"epoch": 4.62178517397882,
"grad_norm": 0.5019757162184942,
"learning_rate": 1.2506935437353192e-05,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19041526317596436,
"step": 3055,
"valid_targets_mean": 4226.5,
"valid_targets_min": 551
},
{
"epoch": 4.6293494704992435,
"grad_norm": 0.5289337309331459,
"learning_rate": 1.2437037554189186e-05,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17573757469654083,
"step": 3060,
"valid_targets_mean": 4741.9,
"valid_targets_min": 876
},
{
"epoch": 4.636913767019667,
"grad_norm": 0.40854843689777737,
"learning_rate": 1.2367247295176855e-05,
"loss": 0.1658,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17039918899536133,
"step": 3065,
"valid_targets_mean": 5760.3,
"valid_targets_min": 1998
},
{
"epoch": 4.644478063540091,
"grad_norm": 0.4314054991151234,
"learning_rate": 1.2297565653461087e-05,
"loss": 0.1593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15315118432044983,
"step": 3070,
"valid_targets_mean": 5566.9,
"valid_targets_min": 2093
},
{
"epoch": 4.6520423600605145,
"grad_norm": 0.525526201288757,
"learning_rate": 1.2227993620641083e-05,
"loss": 0.1751,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17355704307556152,
"step": 3075,
"valid_targets_mean": 3794.9,
"valid_targets_min": 676
},
{
"epoch": 4.659606656580938,
"grad_norm": 0.4676478453236289,
"learning_rate": 1.2158532186756275e-05,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1458236575126648,
"step": 3080,
"valid_targets_mean": 4220.9,
"valid_targets_min": 803
},
{
"epoch": 4.667170953101362,
"grad_norm": 0.4387137897170397,
"learning_rate": 1.2089182340272227e-05,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16402631998062134,
"step": 3085,
"valid_targets_mean": 5154.2,
"valid_targets_min": 1986
},
{
"epoch": 4.6747352496217855,
"grad_norm": 0.5151503192275158,
"learning_rate": 1.201994506806655e-05,
"loss": 0.1644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15883511304855347,
"step": 3090,
"valid_targets_mean": 5183.6,
"valid_targets_min": 614
},
{
"epoch": 4.682299546142209,
"grad_norm": 0.4919027448221628,
"learning_rate": 1.1950821355414894e-05,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2019597738981247,
"step": 3095,
"valid_targets_mean": 4693.2,
"valid_targets_min": 795
},
{
"epoch": 4.689863842662632,
"grad_norm": 0.411381231559992,
"learning_rate": 1.1881812185976902e-05,
"loss": 0.1602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15423153340816498,
"step": 3100,
"valid_targets_mean": 5120.1,
"valid_targets_min": 974
},
{
"epoch": 4.697428139183056,
"grad_norm": 0.433674376108163,
"learning_rate": 1.1812918541782215e-05,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17236676812171936,
"step": 3105,
"valid_targets_mean": 5125.4,
"valid_targets_min": 456
},
{
"epoch": 4.704992435703479,
"grad_norm": 0.5330642664335918,
"learning_rate": 1.1744141403216503e-05,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2719995379447937,
"step": 3110,
"valid_targets_mean": 5730.6,
"valid_targets_min": 894
},
{
"epoch": 4.712556732223903,
"grad_norm": 0.589306427456538,
"learning_rate": 1.1675481749007518e-05,
"loss": 0.1775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.211774080991745,
"step": 3115,
"valid_targets_mean": 3777.1,
"valid_targets_min": 258
},
{
"epoch": 4.720121028744327,
"grad_norm": 0.43617038752664566,
"learning_rate": 1.1606940556211147e-05,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1602756232023239,
"step": 3120,
"valid_targets_mean": 5495.8,
"valid_targets_min": 1985
},
{
"epoch": 4.72768532526475,
"grad_norm": 0.43013622893573156,
"learning_rate": 1.1538518800197538e-05,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16299334168434143,
"step": 3125,
"valid_targets_mean": 4878.0,
"valid_targets_min": 664
},
{
"epoch": 4.735249621785174,
"grad_norm": 0.4243645747448522,
"learning_rate": 1.1470217454637193e-05,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15592533349990845,
"step": 3130,
"valid_targets_mean": 4838.5,
"valid_targets_min": 830
},
{
"epoch": 4.742813918305598,
"grad_norm": 0.42684650496375437,
"learning_rate": 1.1402037491487112e-05,
"loss": 0.1725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17367637157440186,
"step": 3135,
"valid_targets_mean": 5900.9,
"valid_targets_min": 898
},
{
"epoch": 4.750378214826021,
"grad_norm": 0.4361124117092106,
"learning_rate": 1.1333979880976992e-05,
"loss": 0.1637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17264147102832794,
"step": 3140,
"valid_targets_mean": 4803.4,
"valid_targets_min": 918
},
{
"epoch": 4.757942511346445,
"grad_norm": 0.45343151422164607,
"learning_rate": 1.1266045591595391e-05,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18170015513896942,
"step": 3145,
"valid_targets_mean": 4986.0,
"valid_targets_min": 1012
},
{
"epoch": 4.765506807866869,
"grad_norm": 0.5071698615673526,
"learning_rate": 1.1198235590075951e-05,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17840242385864258,
"step": 3150,
"valid_targets_mean": 4062.6,
"valid_targets_min": 706
},
{
"epoch": 4.7730711043872915,
"grad_norm": 0.4581144263893417,
"learning_rate": 1.1130550841383662e-05,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15911459922790527,
"step": 3155,
"valid_targets_mean": 4572.2,
"valid_targets_min": 525
},
{
"epoch": 4.780635400907715,
"grad_norm": 0.42922503083348856,
"learning_rate": 1.1062992308701089e-05,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1482914686203003,
"step": 3160,
"valid_targets_mean": 4370.2,
"valid_targets_min": 871
},
{
"epoch": 4.788199697428139,
"grad_norm": 0.4259676210192377,
"learning_rate": 1.0995560953414701e-05,
"loss": 0.1719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15134750306606293,
"step": 3165,
"valid_targets_mean": 5120.9,
"valid_targets_min": 903
},
{
"epoch": 4.795763993948563,
"grad_norm": 0.4931505035733333,
"learning_rate": 1.0928257735101186e-05,
"loss": 0.1612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14641442894935608,
"step": 3170,
"valid_targets_mean": 3489.4,
"valid_targets_min": 498
},
{
"epoch": 4.803328290468986,
"grad_norm": 0.4657115402405436,
"learning_rate": 1.0861083611513781e-05,
"loss": 0.169,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1858498901128769,
"step": 3175,
"valid_targets_mean": 4672.9,
"valid_targets_min": 653
},
{
"epoch": 4.81089258698941,
"grad_norm": 0.4963708205352106,
"learning_rate": 1.0794039538568653e-05,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1865379959344864,
"step": 3180,
"valid_targets_mean": 4229.4,
"valid_targets_min": 515
},
{
"epoch": 4.818456883509834,
"grad_norm": 0.5019745644106931,
"learning_rate": 1.0727126470331299e-05,
"loss": 0.1686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17774225771427155,
"step": 3185,
"valid_targets_mean": 4163.1,
"valid_targets_min": 509
},
{
"epoch": 4.826021180030257,
"grad_norm": 0.41638071512531366,
"learning_rate": 1.0660345359002941e-05,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1485077440738678,
"step": 3190,
"valid_targets_mean": 4660.1,
"valid_targets_min": 736
},
{
"epoch": 4.833585476550681,
"grad_norm": 0.44572452901778975,
"learning_rate": 1.0593697154907027e-05,
"loss": 0.1719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16914719343185425,
"step": 3195,
"valid_targets_mean": 5350.4,
"valid_targets_min": 744
},
{
"epoch": 4.841149773071105,
"grad_norm": 0.6533490446460197,
"learning_rate": 1.0527182806475662e-05,
"loss": 0.1708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1586613953113556,
"step": 3200,
"valid_targets_mean": 4271.1,
"valid_targets_min": 597
},
{
"epoch": 4.848714069591528,
"grad_norm": 0.45373202080563063,
"learning_rate": 1.0460803260236134e-05,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1581738293170929,
"step": 3205,
"valid_targets_mean": 5267.1,
"valid_targets_min": 649
},
{
"epoch": 4.856278366111952,
"grad_norm": 0.4179137546333998,
"learning_rate": 1.0394559460797446e-05,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17204821109771729,
"step": 3210,
"valid_targets_mean": 5295.6,
"valid_targets_min": 543
},
{
"epoch": 4.863842662632376,
"grad_norm": 0.4122805539335566,
"learning_rate": 1.0328452350836842e-05,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18401654064655304,
"step": 3215,
"valid_targets_mean": 5601.4,
"valid_targets_min": 742
},
{
"epoch": 4.871406959152798,
"grad_norm": 0.40302438542126645,
"learning_rate": 1.0262482871086443e-05,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1483723670244217,
"step": 3220,
"valid_targets_mean": 6198.2,
"valid_targets_min": 848
},
{
"epoch": 4.878971255673222,
"grad_norm": 0.45468069712107095,
"learning_rate": 1.019665196031982e-05,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17304138839244843,
"step": 3225,
"valid_targets_mean": 4215.2,
"valid_targets_min": 871
},
{
"epoch": 4.886535552193646,
"grad_norm": 0.44734310925531656,
"learning_rate": 1.013096055533866e-05,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16383050382137299,
"step": 3230,
"valid_targets_mean": 4358.6,
"valid_targets_min": 750
},
{
"epoch": 4.8940998487140694,
"grad_norm": 0.4425864585330284,
"learning_rate": 1.006540959095941e-05,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17266994714736938,
"step": 3235,
"valid_targets_mean": 4547.7,
"valid_targets_min": 537
},
{
"epoch": 4.901664145234493,
"grad_norm": 0.42155951333967423,
"learning_rate": 1.0000000000000006e-05,
"loss": 0.1682,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1378743052482605,
"step": 3240,
"valid_targets_mean": 4115.5,
"valid_targets_min": 263
},
{
"epoch": 4.909228441754917,
"grad_norm": 0.4299630738249049,
"learning_rate": 9.93473271326655e-06,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1550338864326477,
"step": 3245,
"valid_targets_mean": 4854.7,
"valid_targets_min": 2796
},
{
"epoch": 4.9167927382753405,
"grad_norm": 0.44329248279038397,
"learning_rate": 9.869608659540129e-06,
"loss": 0.1702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17476975917816162,
"step": 3250,
"valid_targets_mean": 5090.2,
"valid_targets_min": 1022
},
{
"epoch": 4.924357034795764,
"grad_norm": 0.428271116473207,
"learning_rate": 9.804628765563542e-06,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15965984761714935,
"step": 3255,
"valid_targets_mean": 4787.6,
"valid_targets_min": 804
},
{
"epoch": 4.931921331316188,
"grad_norm": 0.45332178784102023,
"learning_rate": 9.739793956028143e-06,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14514422416687012,
"step": 3260,
"valid_targets_mean": 5900.1,
"valid_targets_min": 435
},
{
"epoch": 4.9394856278366115,
"grad_norm": 0.4444157485949258,
"learning_rate": 9.675105153560668e-06,
"loss": 0.1662,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1440054178237915,
"step": 3265,
"valid_targets_mean": 4733.8,
"valid_targets_min": 584
},
{
"epoch": 4.947049924357035,
"grad_norm": 0.4348481496365988,
"learning_rate": 9.610563278710128e-06,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.180255725979805,
"step": 3270,
"valid_targets_mean": 5171.2,
"valid_targets_min": 762
},
{
"epoch": 4.954614220877458,
"grad_norm": 0.45864775112962614,
"learning_rate": 9.546169249934654e-06,
"loss": 0.1738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17231298983097076,
"step": 3275,
"valid_targets_mean": 4814.8,
"valid_targets_min": 333
},
{
"epoch": 4.962178517397882,
"grad_norm": 0.5156923688354568,
"learning_rate": 9.481923983588508e-06,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18253746628761292,
"step": 3280,
"valid_targets_mean": 3727.0,
"valid_targets_min": 447
},
{
"epoch": 4.969742813918305,
"grad_norm": 0.4101590443569368,
"learning_rate": 9.417828393908955e-06,
"loss": 0.1617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12951171398162842,
"step": 3285,
"valid_targets_mean": 4951.4,
"valid_targets_min": 416
},
{
"epoch": 4.977307110438729,
"grad_norm": 0.42241612118878036,
"learning_rate": 9.353883393003347e-06,
"loss": 0.1646,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17528489232063293,
"step": 3290,
"valid_targets_mean": 5294.8,
"valid_targets_min": 578
},
{
"epoch": 4.984871406959153,
"grad_norm": 0.3957796359048021,
"learning_rate": 9.290089890836068e-06,
"loss": 0.1674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16144408285617828,
"step": 3295,
"valid_targets_mean": 5681.1,
"valid_targets_min": 947
},
{
"epoch": 4.992435703479576,
"grad_norm": 0.4371247368929281,
"learning_rate": 9.226448795215598e-06,
"loss": 0.1636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1603410542011261,
"step": 3300,
"valid_targets_mean": 4666.8,
"valid_targets_min": 718
},
{
"epoch": 5.0,
"grad_norm": 0.44364123498321484,
"learning_rate": 9.162961011781632e-06,
"loss": 0.1666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18622517585754395,
"step": 3305,
"valid_targets_mean": 4746.6,
"valid_targets_min": 1724
},
{
"epoch": 5.007564296520424,
"grad_norm": 0.48356773402835035,
"learning_rate": 9.099627443992163e-06,
"loss": 0.1504,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1390305906534195,
"step": 3310,
"valid_targets_mean": 4232.3,
"valid_targets_min": 636
},
{
"epoch": 5.015128593040847,
"grad_norm": 0.40848481053739466,
"learning_rate": 9.036448993110603e-06,
"loss": 0.1555,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1643286496400833,
"step": 3315,
"valid_targets_mean": 5712.9,
"valid_targets_min": 1201
},
{
"epoch": 5.022692889561271,
"grad_norm": 0.4515946515252321,
"learning_rate": 8.97342655819303e-06,
"loss": 0.152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15688204765319824,
"step": 3320,
"valid_targets_mean": 4522.5,
"valid_targets_min": 737
},
{
"epoch": 5.030257186081695,
"grad_norm": 0.4329236745402465,
"learning_rate": 8.910561036075325e-06,
"loss": 0.1482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.152809739112854,
"step": 3325,
"valid_targets_mean": 4936.4,
"valid_targets_min": 263
},
{
"epoch": 5.037821482602118,
"grad_norm": 0.4478790148739838,
"learning_rate": 8.847853321360423e-06,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13745734095573425,
"step": 3330,
"valid_targets_mean": 4847.0,
"valid_targets_min": 2085
},
{
"epoch": 5.045385779122542,
"grad_norm": 0.46929256146302734,
"learning_rate": 8.785304306405605e-06,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14126646518707275,
"step": 3335,
"valid_targets_mean": 4518.4,
"valid_targets_min": 919
},
{
"epoch": 5.052950075642965,
"grad_norm": 0.45325256164746236,
"learning_rate": 8.722914881309801e-06,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1484193503856659,
"step": 3340,
"valid_targets_mean": 4938.5,
"valid_targets_min": 541
},
{
"epoch": 5.0605143721633885,
"grad_norm": 0.488278580977796,
"learning_rate": 8.660685933900869e-06,
"loss": 0.1765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16470378637313843,
"step": 3345,
"valid_targets_mean": 4565.0,
"valid_targets_min": 850
},
{
"epoch": 5.068078668683812,
"grad_norm": 0.5386047975887774,
"learning_rate": 8.59861834972306e-06,
"loss": 0.1724,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17436347901821136,
"step": 3350,
"valid_targets_mean": 3495.9,
"valid_targets_min": 457
},
{
"epoch": 5.075642965204236,
"grad_norm": 0.505045707433957,
"learning_rate": 8.536713012024305e-06,
"loss": 0.1564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1657446324825287,
"step": 3355,
"valid_targets_mean": 4460.2,
"valid_targets_min": 639
},
{
"epoch": 5.0832072617246595,
"grad_norm": 0.4834428008879641,
"learning_rate": 8.474970801743724e-06,
"loss": 0.1621,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14867718517780304,
"step": 3360,
"valid_targets_mean": 5020.8,
"valid_targets_min": 726
},
{
"epoch": 5.090771558245083,
"grad_norm": 0.601215561668829,
"learning_rate": 8.413392597499075e-06,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14667610824108124,
"step": 3365,
"valid_targets_mean": 3490.2,
"valid_targets_min": 442
},
{
"epoch": 5.098335854765507,
"grad_norm": 0.4279890944625253,
"learning_rate": 8.351979275574207e-06,
"loss": 0.1623,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1501058042049408,
"step": 3370,
"valid_targets_mean": 5297.9,
"valid_targets_min": 873
},
{
"epoch": 5.1059001512859306,
"grad_norm": 0.44340326773424427,
"learning_rate": 8.290731709906643e-06,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16302546858787537,
"step": 3375,
"valid_targets_mean": 4976.1,
"valid_targets_min": 1877
},
{
"epoch": 5.113464447806354,
"grad_norm": 0.5128759287926937,
"learning_rate": 8.229650772075153e-06,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15705181658267975,
"step": 3380,
"valid_targets_mean": 3650.5,
"valid_targets_min": 506
},
{
"epoch": 5.121028744326778,
"grad_norm": 0.4688934592390907,
"learning_rate": 8.168737331287269e-06,
"loss": 0.1529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15802708268165588,
"step": 3385,
"valid_targets_mean": 4826.7,
"valid_targets_min": 841
},
{
"epoch": 5.128593040847202,
"grad_norm": 0.5338964793918589,
"learning_rate": 8.107992254367003e-06,
"loss": 0.1653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17902442812919617,
"step": 3390,
"valid_targets_mean": 3932.9,
"valid_targets_min": 650
},
{
"epoch": 5.136157337367624,
"grad_norm": 0.4961972344616427,
"learning_rate": 8.047416405742479e-06,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15935659408569336,
"step": 3395,
"valid_targets_mean": 4673.6,
"valid_targets_min": 672
},
{
"epoch": 5.143721633888048,
"grad_norm": 0.41951146240242676,
"learning_rate": 7.987010647433606e-06,
"loss": 0.1609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18392476439476013,
"step": 3400,
"valid_targets_mean": 6500.2,
"valid_targets_min": 665
},
{
"epoch": 5.151285930408472,
"grad_norm": 0.5308721732777357,
"learning_rate": 7.926775839039851e-06,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1562509834766388,
"step": 3405,
"valid_targets_mean": 3936.5,
"valid_targets_min": 593
},
{
"epoch": 5.158850226928895,
"grad_norm": 0.4254042910385951,
"learning_rate": 7.866712837728016e-06,
"loss": 0.1583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1462964117527008,
"step": 3410,
"valid_targets_mean": 5346.2,
"valid_targets_min": 944
},
{
"epoch": 5.166414523449319,
"grad_norm": 0.5552776613133977,
"learning_rate": 7.80682249821997e-06,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11865056306123734,
"step": 3415,
"valid_targets_mean": 4060.9,
"valid_targets_min": 660
},
{
"epoch": 5.173978819969743,
"grad_norm": 0.5104198651404502,
"learning_rate": 7.747105672780561e-06,
"loss": 0.1733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15125545859336853,
"step": 3420,
"valid_targets_mean": 4615.4,
"valid_targets_min": 628
},
{
"epoch": 5.181543116490166,
"grad_norm": 0.472114678915561,
"learning_rate": 7.68756321120546e-06,
"loss": 0.1639,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16353891789913177,
"step": 3425,
"valid_targets_mean": 4357.2,
"valid_targets_min": 723
},
{
"epoch": 5.18910741301059,
"grad_norm": 0.7788327189272692,
"learning_rate": 7.628195960809039e-06,
"loss": 0.1564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1500215232372284,
"step": 3430,
"valid_targets_mean": 4284.7,
"valid_targets_min": 754
},
{
"epoch": 5.196671709531014,
"grad_norm": 0.43343966922095256,
"learning_rate": 7.569004766412369e-06,
"loss": 0.1565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14865446090698242,
"step": 3435,
"valid_targets_mean": 4969.2,
"valid_targets_min": 586
},
{
"epoch": 5.204236006051437,
"grad_norm": 0.47577740785963674,
"learning_rate": 7.509990470331159e-06,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1581379622220993,
"step": 3440,
"valid_targets_mean": 4133.3,
"valid_targets_min": 712
},
{
"epoch": 5.211800302571861,
"grad_norm": 0.3926350192189327,
"learning_rate": 7.451153912363784e-06,
"loss": 0.155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13046491146087646,
"step": 3445,
"valid_targets_mean": 6214.4,
"valid_targets_min": 2307
},
{
"epoch": 5.219364599092285,
"grad_norm": 0.4176746702190328,
"learning_rate": 7.392495929779333e-06,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1757950782775879,
"step": 3450,
"valid_targets_mean": 5443.2,
"valid_targets_min": 546
},
{
"epoch": 5.2269288956127085,
"grad_norm": 0.4515587545805908,
"learning_rate": 7.334017357305674e-06,
"loss": 0.1591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16047310829162598,
"step": 3455,
"valid_targets_mean": 4970.7,
"valid_targets_min": 550
},
{
"epoch": 5.234493192133131,
"grad_norm": 0.45597339531041936,
"learning_rate": 7.2757190271176115e-06,
"loss": 0.1458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14856447279453278,
"step": 3460,
"valid_targets_mean": 4530.4,
"valid_targets_min": 710
},
{
"epoch": 5.242057488653555,
"grad_norm": 0.5008734692788059,
"learning_rate": 7.217601768825023e-06,
"loss": 0.1531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14690902829170227,
"step": 3465,
"valid_targets_mean": 5124.4,
"valid_targets_min": 583
},
{
"epoch": 5.249621785173979,
"grad_norm": 0.4989691903624996,
"learning_rate": 7.15966640946105e-06,
"loss": 0.1539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14532163739204407,
"step": 3470,
"valid_targets_mean": 4449.6,
"valid_targets_min": 695
},
{
"epoch": 5.257186081694402,
"grad_norm": 0.4129795536595691,
"learning_rate": 7.101913773470346e-06,
"loss": 0.1582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14961427450180054,
"step": 3475,
"valid_targets_mean": 5730.8,
"valid_targets_min": 3290
},
{
"epoch": 5.264750378214826,
"grad_norm": 0.4834264222381325,
"learning_rate": 7.044344682697326e-06,
"loss": 0.1587,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14742320775985718,
"step": 3480,
"valid_targets_mean": 4838.9,
"valid_targets_min": 515
},
{
"epoch": 5.27231467473525,
"grad_norm": 0.5026805612919963,
"learning_rate": 6.986959956374473e-06,
"loss": 0.1668,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17401841282844543,
"step": 3485,
"valid_targets_mean": 4044.6,
"valid_targets_min": 781
},
{
"epoch": 5.279878971255673,
"grad_norm": 0.4735788451733253,
"learning_rate": 6.929760411110698e-06,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1525282859802246,
"step": 3490,
"valid_targets_mean": 4527.6,
"valid_targets_min": 812
},
{
"epoch": 5.287443267776097,
"grad_norm": 0.4391485486379499,
"learning_rate": 6.872746860879702e-06,
"loss": 0.1562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1371186375617981,
"step": 3495,
"valid_targets_mean": 4986.9,
"valid_targets_min": 80
},
{
"epoch": 5.295007564296521,
"grad_norm": 0.4167604767357861,
"learning_rate": 6.815920117008399e-06,
"loss": 0.1617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15365831553936005,
"step": 3500,
"valid_targets_mean": 5418.2,
"valid_targets_min": 617
},
{
"epoch": 5.302571860816944,
"grad_norm": 0.42828839637040433,
"learning_rate": 6.759280988165373e-06,
"loss": 0.1527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13771694898605347,
"step": 3505,
"valid_targets_mean": 5017.8,
"valid_targets_min": 1328
},
{
"epoch": 5.310136157337368,
"grad_norm": 0.4506403163352829,
"learning_rate": 6.702830280349353e-06,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15530502796173096,
"step": 3510,
"valid_targets_mean": 4390.8,
"valid_targets_min": 1004
},
{
"epoch": 5.317700453857791,
"grad_norm": 0.4340685132852124,
"learning_rate": 6.6465687968777725e-06,
"loss": 0.1495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.146540105342865,
"step": 3515,
"valid_targets_mean": 4825.2,
"valid_targets_min": 642
},
{
"epoch": 5.3252647503782145,
"grad_norm": 0.46671624987800375,
"learning_rate": 6.590497338375317e-06,
"loss": 0.1556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1502562165260315,
"step": 3520,
"valid_targets_mean": 4549.4,
"valid_targets_min": 540
},
{
"epoch": 5.332829046898638,
"grad_norm": 0.5101933773328257,
"learning_rate": 6.534616702762537e-06,
"loss": 0.1594,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17042289674282074,
"step": 3525,
"valid_targets_mean": 4879.7,
"valid_targets_min": 795
},
{
"epoch": 5.340393343419062,
"grad_norm": 0.5293012627631964,
"learning_rate": 6.478927685244494e-06,
"loss": 0.1669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18156251311302185,
"step": 3530,
"valid_targets_mean": 3960.2,
"valid_targets_min": 719
},
{
"epoch": 5.3479576399394855,
"grad_norm": 0.47166025682277357,
"learning_rate": 6.423431078299443e-06,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17513303458690643,
"step": 3535,
"valid_targets_mean": 4714.2,
"valid_targets_min": 692
},
{
"epoch": 5.355521936459909,
"grad_norm": 0.4337643659228156,
"learning_rate": 6.3681276716675435e-06,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18963715434074402,
"step": 3540,
"valid_targets_mean": 5398.2,
"valid_targets_min": 740
},
{
"epoch": 5.363086232980333,
"grad_norm": 0.44696298609992435,
"learning_rate": 6.3130182523396484e-06,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17503423988819122,
"step": 3545,
"valid_targets_mean": 4828.9,
"valid_targets_min": 2715
},
{
"epoch": 5.3706505295007565,
"grad_norm": 0.44174975125123683,
"learning_rate": 6.258103604546087e-06,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1407729834318161,
"step": 3550,
"valid_targets_mean": 4479.8,
"valid_targets_min": 2428
},
{
"epoch": 5.37821482602118,
"grad_norm": 0.44916605681525745,
"learning_rate": 6.2033845097454985e-06,
"loss": 0.1593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14504870772361755,
"step": 3555,
"valid_targets_mean": 4913.3,
"valid_targets_min": 940
},
{
"epoch": 5.385779122541604,
"grad_norm": 0.4400921867214306,
"learning_rate": 6.14886174661373e-06,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15662983059883118,
"step": 3560,
"valid_targets_mean": 4724.1,
"valid_targets_min": 620
},
{
"epoch": 5.3933434190620275,
"grad_norm": 0.47087556709614853,
"learning_rate": 6.0945360910327476e-06,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1466415971517563,
"step": 3565,
"valid_targets_mean": 4426.4,
"valid_targets_min": 1086
},
{
"epoch": 5.400907715582451,
"grad_norm": 0.5433230621680141,
"learning_rate": 6.040408316079575e-06,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13208290934562683,
"step": 3570,
"valid_targets_mean": 2785.8,
"valid_targets_min": 167
},
{
"epoch": 5.408472012102875,
"grad_norm": 0.46344685976956507,
"learning_rate": 5.986479192015337e-06,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2303861677646637,
"step": 3575,
"valid_targets_mean": 5746.5,
"valid_targets_min": 932
},
{
"epoch": 5.416036308623298,
"grad_norm": 0.4310949358505575,
"learning_rate": 5.932749486274239e-06,
"loss": 0.1604,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14768637716770172,
"step": 3580,
"valid_targets_mean": 5434.6,
"valid_targets_min": 666
},
{
"epoch": 5.423600605143721,
"grad_norm": 0.4677000573971819,
"learning_rate": 5.8792199634527205e-06,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16156046092510223,
"step": 3585,
"valid_targets_mean": 5433.3,
"valid_targets_min": 756
},
{
"epoch": 5.431164901664145,
"grad_norm": 0.49393458847349964,
"learning_rate": 5.82589138529851e-06,
"loss": 0.1693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1611177623271942,
"step": 3590,
"valid_targets_mean": 4461.6,
"valid_targets_min": 595
},
{
"epoch": 5.438729198184569,
"grad_norm": 0.5687948770753518,
"learning_rate": 5.7727645106998e-06,
"loss": 0.1508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15704114735126495,
"step": 3595,
"valid_targets_mean": 4090.4,
"valid_targets_min": 286
},
{
"epoch": 5.446293494704992,
"grad_norm": 0.5444741623582646,
"learning_rate": 5.719840095674476e-06,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1610284447669983,
"step": 3600,
"valid_targets_mean": 3557.4,
"valid_targets_min": 560
},
{
"epoch": 5.453857791225416,
"grad_norm": 0.43128286547039024,
"learning_rate": 5.667118893359331e-06,
"loss": 0.1541,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1486874222755432,
"step": 3605,
"valid_targets_mean": 4866.7,
"valid_targets_min": 1302
},
{
"epoch": 5.46142208774584,
"grad_norm": 0.4595711511111565,
"learning_rate": 5.614601653999338e-06,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16856805980205536,
"step": 3610,
"valid_targets_mean": 4922.6,
"valid_targets_min": 557
},
{
"epoch": 5.468986384266263,
"grad_norm": 0.46656320107157945,
"learning_rate": 5.5622891249370234e-06,
"loss": 0.1828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20066699385643005,
"step": 3615,
"valid_targets_mean": 5136.1,
"valid_targets_min": 688
},
{
"epoch": 5.476550680786687,
"grad_norm": 0.4411187508138855,
"learning_rate": 5.5101820506017865e-06,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1552569568157196,
"step": 3620,
"valid_targets_mean": 5095.8,
"valid_targets_min": 635
},
{
"epoch": 5.484114977307111,
"grad_norm": 0.4862124542907482,
"learning_rate": 5.458281172499298e-06,
"loss": 0.1614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1585727334022522,
"step": 3625,
"valid_targets_mean": 3937.2,
"valid_targets_min": 496
},
{
"epoch": 5.491679273827534,
"grad_norm": 0.4292729342401527,
"learning_rate": 5.406587229200997e-06,
"loss": 0.1556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12494321167469025,
"step": 3630,
"valid_targets_mean": 4550.4,
"valid_targets_min": 1536
},
{
"epoch": 5.499243570347957,
"grad_norm": 0.4047902663925935,
"learning_rate": 5.355100956333546e-06,
"loss": 0.154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14619508385658264,
"step": 3635,
"valid_targets_mean": 5542.1,
"valid_targets_min": 570
},
{
"epoch": 5.506807866868381,
"grad_norm": 0.5096706493017572,
"learning_rate": 5.303823086568347e-06,
"loss": 0.1548,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15569140017032623,
"step": 3640,
"valid_targets_mean": 3900.1,
"valid_targets_min": 856
},
{
"epoch": 5.5143721633888045,
"grad_norm": 0.4255353489871283,
"learning_rate": 5.252754349611182e-06,
"loss": 0.1552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14665234088897705,
"step": 3645,
"valid_targets_mean": 5351.4,
"valid_targets_min": 1002
},
{
"epoch": 5.521936459909228,
"grad_norm": 0.452780407445397,
"learning_rate": 5.201895472191743e-06,
"loss": 0.155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1493845283985138,
"step": 3650,
"valid_targets_mean": 5155.4,
"valid_targets_min": 1700
},
{
"epoch": 5.529500756429652,
"grad_norm": 0.43780341220663965,
"learning_rate": 5.151247178053349e-06,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15060928463935852,
"step": 3655,
"valid_targets_mean": 5135.1,
"valid_targets_min": 1275
},
{
"epoch": 5.537065052950076,
"grad_norm": 0.5052751593749545,
"learning_rate": 5.100810187942639e-06,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1450476050376892,
"step": 3660,
"valid_targets_mean": 5569.8,
"valid_targets_min": 2214
},
{
"epoch": 5.544629349470499,
"grad_norm": 0.47706320379830186,
"learning_rate": 5.050585219599289e-06,
"loss": 0.1549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1428034007549286,
"step": 3665,
"valid_targets_mean": 4428.3,
"valid_targets_min": 345
},
{
"epoch": 5.552193645990923,
"grad_norm": 0.4868390792247118,
"learning_rate": 5.0005729877458155e-06,
"loss": 0.1514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1447855830192566,
"step": 3670,
"valid_targets_mean": 4278.9,
"valid_targets_min": 579
},
{
"epoch": 5.559757942511347,
"grad_norm": 0.4567698222657148,
"learning_rate": 4.950774204077433e-06,
"loss": 0.1493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.161106675863266,
"step": 3675,
"valid_targets_mean": 4954.6,
"valid_targets_min": 579
},
{
"epoch": 5.56732223903177,
"grad_norm": 0.42355294049312686,
"learning_rate": 4.901189577251864e-06,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1554052084684372,
"step": 3680,
"valid_targets_mean": 5065.8,
"valid_targets_min": 1009
},
{
"epoch": 5.574886535552194,
"grad_norm": 0.4156925770441878,
"learning_rate": 4.851819812879303e-06,
"loss": 0.1529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1524563580751419,
"step": 3685,
"valid_targets_mean": 5432.8,
"valid_targets_min": 1562
},
{
"epoch": 5.582450832072618,
"grad_norm": 0.4746990695302771,
"learning_rate": 4.80266561351237e-06,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16682183742523193,
"step": 3690,
"valid_targets_mean": 4135.4,
"valid_targets_min": 736
},
{
"epoch": 5.590015128593041,
"grad_norm": 0.5340419322270344,
"learning_rate": 4.753727678636082e-06,
"loss": 0.1483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16570830345153809,
"step": 3695,
"valid_targets_mean": 4032.8,
"valid_targets_min": 802
},
{
"epoch": 5.597579425113464,
"grad_norm": 0.46287738612206497,
"learning_rate": 4.7050067046579324e-06,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15962907671928406,
"step": 3700,
"valid_targets_mean": 4799.6,
"valid_targets_min": 855
},
{
"epoch": 5.605143721633888,
"grad_norm": 0.4388012169199975,
"learning_rate": 4.656503384897988e-06,
"loss": 0.1549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13840925693511963,
"step": 3705,
"valid_targets_mean": 4313.9,
"valid_targets_min": 733
},
{
"epoch": 5.612708018154311,
"grad_norm": 0.478903080739202,
"learning_rate": 4.6082184095789686e-06,
"loss": 0.1491,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15945684909820557,
"step": 3710,
"valid_targets_mean": 4372.9,
"valid_targets_min": 892
},
{
"epoch": 5.620272314674735,
"grad_norm": 0.43574711337202326,
"learning_rate": 4.56015246581649e-06,
"loss": 0.163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18066449463367462,
"step": 3715,
"valid_targets_mean": 5704.6,
"valid_targets_min": 716
},
{
"epoch": 5.627836611195159,
"grad_norm": 0.4685680736943704,
"learning_rate": 4.512306237609232e-06,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15282121300697327,
"step": 3720,
"valid_targets_mean": 5270.2,
"valid_targets_min": 569
},
{
"epoch": 5.635400907715582,
"grad_norm": 0.4897093192549938,
"learning_rate": 4.464680405829249e-06,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14707836508750916,
"step": 3725,
"valid_targets_mean": 4000.9,
"valid_targets_min": 473
},
{
"epoch": 5.642965204236006,
"grad_norm": 0.4848515119309501,
"learning_rate": 4.4172756482122535e-06,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1577150821685791,
"step": 3730,
"valid_targets_mean": 4438.2,
"valid_targets_min": 1148
},
{
"epoch": 5.65052950075643,
"grad_norm": 0.47760265587876977,
"learning_rate": 4.370092639347978e-06,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17945009469985962,
"step": 3735,
"valid_targets_mean": 4574.9,
"valid_targets_min": 504
},
{
"epoch": 5.6580937972768535,
"grad_norm": 0.4826246472719842,
"learning_rate": 4.3231320506705775e-06,
"loss": 0.1645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16503837704658508,
"step": 3740,
"valid_targets_mean": 4244.0,
"valid_targets_min": 762
},
{
"epoch": 5.665658093797277,
"grad_norm": 0.4948486143484778,
"learning_rate": 4.2763945504490835e-06,
"loss": 0.1536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1612137407064438,
"step": 3745,
"valid_targets_mean": 3841.2,
"valid_targets_min": 898
},
{
"epoch": 5.673222390317701,
"grad_norm": 0.5418667804393014,
"learning_rate": 4.229880803777859e-06,
"loss": 0.1564,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1569966971874237,
"step": 3750,
"valid_targets_mean": 5043.6,
"valid_targets_min": 789
},
{
"epoch": 5.680786686838124,
"grad_norm": 0.44525023164036787,
"learning_rate": 4.183591472567186e-06,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15684780478477478,
"step": 3755,
"valid_targets_mean": 5266.2,
"valid_targets_min": 2689
},
{
"epoch": 5.688350983358547,
"grad_norm": 0.42073209891417795,
"learning_rate": 4.137527215533805e-06,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16824714839458466,
"step": 3760,
"valid_targets_mean": 6439.3,
"valid_targets_min": 607
},
{
"epoch": 5.695915279878971,
"grad_norm": 0.4862094128743182,
"learning_rate": 4.091688688191564e-06,
"loss": 0.1615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15628470480442047,
"step": 3765,
"valid_targets_mean": 4402.2,
"valid_targets_min": 800
},
{
"epoch": 5.703479576399395,
"grad_norm": 0.537061705110618,
"learning_rate": 4.046076542842077e-06,
"loss": 0.1606,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1753963828086853,
"step": 3770,
"valid_targets_mean": 3481.6,
"valid_targets_min": 730
},
{
"epoch": 5.711043872919818,
"grad_norm": 0.49689760167531866,
"learning_rate": 4.000691428565453e-06,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18343189358711243,
"step": 3775,
"valid_targets_mean": 4551.9,
"valid_targets_min": 732
},
{
"epoch": 5.718608169440242,
"grad_norm": 0.48330032612845897,
"learning_rate": 3.9555339912110355e-06,
"loss": 0.1654,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1796744465827942,
"step": 3780,
"valid_targets_mean": 4892.2,
"valid_targets_min": 760
},
{
"epoch": 5.726172465960666,
"grad_norm": 0.5276122434209084,
"learning_rate": 3.910604873388248e-06,
"loss": 0.1669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17993156611919403,
"step": 3785,
"valid_targets_mean": 3504.7,
"valid_targets_min": 574
},
{
"epoch": 5.733736762481089,
"grad_norm": 0.4887711580738052,
"learning_rate": 3.8659047144574245e-06,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1559087038040161,
"step": 3790,
"valid_targets_mean": 4371.9,
"valid_targets_min": 638
},
{
"epoch": 5.741301059001513,
"grad_norm": 1.3298249041601897,
"learning_rate": 3.821434150520715e-06,
"loss": 0.1588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17897151410579681,
"step": 3795,
"valid_targets_mean": 4587.8,
"valid_targets_min": 756
},
{
"epoch": 5.748865355521937,
"grad_norm": 0.43958731365820686,
"learning_rate": 3.777193814413045e-06,
"loss": 0.1632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17036233842372894,
"step": 3800,
"valid_targets_mean": 5104.9,
"valid_targets_min": 486
},
{
"epoch": 5.75642965204236,
"grad_norm": 0.4549903255374407,
"learning_rate": 3.7331843356930806e-06,
"loss": 0.1715,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1566658914089203,
"step": 3805,
"valid_targets_mean": 4717.1,
"valid_targets_min": 818
},
{
"epoch": 5.763993948562784,
"grad_norm": 0.4541303493990637,
"learning_rate": 3.6894063406343094e-06,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15038271248340607,
"step": 3810,
"valid_targets_mean": 4360.2,
"valid_targets_min": 1600
},
{
"epoch": 5.771558245083208,
"grad_norm": 0.4563736572350106,
"learning_rate": 3.645860452216099e-06,
"loss": 0.1704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1912127137184143,
"step": 3815,
"valid_targets_mean": 5395.8,
"valid_targets_min": 828
},
{
"epoch": 5.7791225416036305,
"grad_norm": 0.4551743372988032,
"learning_rate": 3.6025472901148463e-06,
"loss": 0.1652,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14934727549552917,
"step": 3820,
"valid_targets_mean": 4297.6,
"valid_targets_min": 723
},
{
"epoch": 5.786686838124054,
"grad_norm": 0.5419707059621975,
"learning_rate": 3.5594674706951505e-06,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17843681573867798,
"step": 3825,
"valid_targets_mean": 3665.1,
"valid_targets_min": 869
},
{
"epoch": 5.794251134644478,
"grad_norm": 0.41228701610809887,
"learning_rate": 3.5166216070010538e-06,
"loss": 0.1501,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16986562311649323,
"step": 3830,
"valid_targets_mean": 5923.2,
"valid_targets_min": 727
},
{
"epoch": 5.8018154311649015,
"grad_norm": 0.5633480031927796,
"learning_rate": 3.474010308747291e-06,
"loss": 0.1598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1795251965522766,
"step": 3835,
"valid_targets_mean": 3345.4,
"valid_targets_min": 488
},
{
"epoch": 5.809379727685325,
"grad_norm": 0.4548488396337465,
"learning_rate": 3.431634182310648e-06,
"loss": 0.1522,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15337982773780823,
"step": 3840,
"valid_targets_mean": 5548.0,
"valid_targets_min": 603
},
{
"epoch": 5.816944024205749,
"grad_norm": 0.5594216753768365,
"learning_rate": 3.3894938307213152e-06,
"loss": 0.163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16239002346992493,
"step": 3845,
"valid_targets_mean": 3887.2,
"valid_targets_min": 625
},
{
"epoch": 5.8245083207261725,
"grad_norm": 0.48899700932766244,
"learning_rate": 3.3475898536543027e-06,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14301034808158875,
"step": 3850,
"valid_targets_mean": 3694.9,
"valid_targets_min": 783
},
{
"epoch": 5.832072617246596,
"grad_norm": 0.5375659757559488,
"learning_rate": 3.305922847420917e-06,
"loss": 0.1585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1484188735485077,
"step": 3855,
"valid_targets_mean": 4786.7,
"valid_targets_min": 980
},
{
"epoch": 5.83963691376702,
"grad_norm": 0.4496456556488915,
"learning_rate": 3.2644934049602563e-06,
"loss": 0.1681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.143708735704422,
"step": 3860,
"valid_targets_mean": 4360.6,
"valid_targets_min": 451
},
{
"epoch": 5.8472012102874436,
"grad_norm": 0.5024320220862686,
"learning_rate": 3.2233021158307977e-06,
"loss": 0.1688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16948488354682922,
"step": 3865,
"valid_targets_mean": 3960.7,
"valid_targets_min": 653
},
{
"epoch": 5.854765506807867,
"grad_norm": 0.4794661098479003,
"learning_rate": 3.1823495662019945e-06,
"loss": 0.1642,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18447071313858032,
"step": 3870,
"valid_targets_mean": 4347.0,
"valid_targets_min": 869
},
{
"epoch": 5.86232980332829,
"grad_norm": 0.5335315955728364,
"learning_rate": 3.1416363388459327e-06,
"loss": 0.1514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16665160655975342,
"step": 3875,
"valid_targets_mean": 3852.0,
"valid_targets_min": 442
},
{
"epoch": 5.869894099848714,
"grad_norm": 0.4521764880267215,
"learning_rate": 3.101163013129045e-06,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1629321575164795,
"step": 3880,
"valid_targets_mean": 5032.3,
"valid_targets_min": 1726
},
{
"epoch": 5.877458396369137,
"grad_norm": 0.44215316112526387,
"learning_rate": 3.0609301650038636e-06,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16144798696041107,
"step": 3885,
"valid_targets_mean": 4983.0,
"valid_targets_min": 1035
},
{
"epoch": 5.885022692889561,
"grad_norm": 0.45192189450308085,
"learning_rate": 3.02093836700081e-06,
"loss": 0.1569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1504105031490326,
"step": 3890,
"valid_targets_mean": 4960.3,
"valid_targets_min": 660
},
{
"epoch": 5.892586989409985,
"grad_norm": 0.48426768810953463,
"learning_rate": 2.9811881882200743e-06,
"loss": 0.1651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13621945679187775,
"step": 3895,
"valid_targets_mean": 5686.2,
"valid_targets_min": 975
},
{
"epoch": 5.900151285930408,
"grad_norm": 0.42046160161979335,
"learning_rate": 2.9416801943234998e-06,
"loss": 0.1592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1531427800655365,
"step": 3900,
"valid_targets_mean": 4956.7,
"valid_targets_min": 623
},
{
"epoch": 5.907715582450832,
"grad_norm": 0.39285175944912043,
"learning_rate": 2.9024149475265373e-06,
"loss": 0.1549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13850067555904388,
"step": 3905,
"valid_targets_mean": 5538.1,
"valid_targets_min": 562
},
{
"epoch": 5.915279878971256,
"grad_norm": 0.4675547807289267,
"learning_rate": 2.863393006590238e-06,
"loss": 0.1613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1579177975654602,
"step": 3910,
"valid_targets_mean": 4398.9,
"valid_targets_min": 695
},
{
"epoch": 5.922844175491679,
"grad_norm": 0.5044920538844487,
"learning_rate": 2.8246149268133204e-06,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13913246989250183,
"step": 3915,
"valid_targets_mean": 4010.9,
"valid_targets_min": 992
},
{
"epoch": 5.930408472012103,
"grad_norm": 0.4734152534913723,
"learning_rate": 2.786081260024236e-06,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16348206996917725,
"step": 3920,
"valid_targets_mean": 4878.4,
"valid_targets_min": 765
},
{
"epoch": 5.937972768532527,
"grad_norm": 0.4212958889997933,
"learning_rate": 2.747792554573352e-06,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16852790117263794,
"step": 3925,
"valid_targets_mean": 5669.1,
"valid_targets_min": 907
},
{
"epoch": 5.94553706505295,
"grad_norm": 0.45812842620540806,
"learning_rate": 2.7097493553251307e-06,
"loss": 0.176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20022347569465637,
"step": 3930,
"valid_targets_mean": 5328.2,
"valid_targets_min": 585
},
{
"epoch": 5.953101361573374,
"grad_norm": 0.6055937435419297,
"learning_rate": 2.6719522036503654e-06,
"loss": 0.1597,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15267616510391235,
"step": 3935,
"valid_targets_mean": 4613.9,
"valid_targets_min": 512
},
{
"epoch": 5.960665658093797,
"grad_norm": 0.4411679407281343,
"learning_rate": 2.634401637418511e-06,
"loss": 0.156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13407060503959656,
"step": 3940,
"valid_targets_mean": 5239.2,
"valid_targets_min": 773
},
{
"epoch": 5.968229954614221,
"grad_norm": 0.4846638993954495,
"learning_rate": 2.5970981909899817e-06,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1752455234527588,
"step": 3945,
"valid_targets_mean": 4496.4,
"valid_targets_min": 848
},
{
"epoch": 5.975794251134644,
"grad_norm": 0.5259996428825984,
"learning_rate": 2.5600423952085884e-06,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1702825427055359,
"step": 3950,
"valid_targets_mean": 4433.2,
"valid_targets_min": 694
},
{
"epoch": 5.983358547655068,
"grad_norm": 0.45060137388491545,
"learning_rate": 2.5232347773939704e-06,
"loss": 0.1453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15999829769134521,
"step": 3955,
"valid_targets_mean": 4916.9,
"valid_targets_min": 932
},
{
"epoch": 5.990922844175492,
"grad_norm": 0.49433677369908263,
"learning_rate": 2.4866758613340734e-06,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17644256353378296,
"step": 3960,
"valid_targets_mean": 3945.7,
"valid_targets_min": 611
},
{
"epoch": 5.998487140695915,
"grad_norm": 0.4731628539536409,
"learning_rate": 2.4503661672777244e-06,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15683284401893616,
"step": 3965,
"valid_targets_mean": 4375.0,
"valid_targets_min": 345
},
{
"epoch": 6.006051437216339,
"grad_norm": 0.7191490640882733,
"learning_rate": 2.4143062119272263e-06,
"loss": 0.1776,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2411782443523407,
"step": 3970,
"valid_targets_mean": 5717.2,
"valid_targets_min": 577
},
{
"epoch": 6.013615733736763,
"grad_norm": 0.45234451996666436,
"learning_rate": 2.3784965084309697e-06,
"loss": 0.1492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.135951966047287,
"step": 3975,
"valid_targets_mean": 4790.9,
"valid_targets_min": 524
},
{
"epoch": 6.021180030257186,
"grad_norm": 0.4357043407051513,
"learning_rate": 2.3429375663761734e-06,
"loss": 0.1551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14513269066810608,
"step": 3980,
"valid_targets_mean": 4690.6,
"valid_targets_min": 307
},
{
"epoch": 6.02874432677761,
"grad_norm": 0.4842329006340026,
"learning_rate": 2.307629891781611e-06,
"loss": 0.1568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1446702480316162,
"step": 3985,
"valid_targets_mean": 4378.6,
"valid_targets_min": 702
},
{
"epoch": 6.036308623298034,
"grad_norm": 0.5364048099568542,
"learning_rate": 2.2725739870904075e-06,
"loss": 0.1527,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1525079607963562,
"step": 3990,
"valid_targets_mean": 4930.4,
"valid_targets_min": 795
},
{
"epoch": 6.043872919818457,
"grad_norm": 0.43526201026202,
"learning_rate": 2.2377703511629023e-06,
"loss": 0.1595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1793811321258545,
"step": 3995,
"valid_targets_mean": 5215.1,
"valid_targets_min": 739
},
{
"epoch": 6.05143721633888,
"grad_norm": 0.5106416304534394,
"learning_rate": 2.2032194792695517e-06,
"loss": 0.1519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1592015027999878,
"step": 4000,
"valid_targets_mean": 4197.9,
"valid_targets_min": 650
},
{
"epoch": 6.059001512859304,
"grad_norm": 0.4414429719089798,
"learning_rate": 2.1689218630838528e-06,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17658647894859314,
"step": 4005,
"valid_targets_mean": 5331.7,
"valid_targets_min": 1472
},
{
"epoch": 6.0665658093797274,
"grad_norm": 0.54354392739444,
"learning_rate": 2.1348779906753856e-06,
"loss": 0.1684,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14778614044189453,
"step": 4010,
"valid_targets_mean": 5743.7,
"valid_targets_min": 765
},
{
"epoch": 6.074130105900151,
"grad_norm": 0.43018503151003995,
"learning_rate": 2.101088346502833e-06,
"loss": 0.1433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13991913199424744,
"step": 4015,
"valid_targets_mean": 5941.0,
"valid_targets_min": 1067
},
{
"epoch": 6.081694402420575,
"grad_norm": 0.5551337425133364,
"learning_rate": 2.067553411407117e-06,
"loss": 0.157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15724679827690125,
"step": 4020,
"valid_targets_mean": 3873.4,
"valid_targets_min": 525
},
{
"epoch": 6.0892586989409985,
"grad_norm": 0.44853100000660745,
"learning_rate": 2.0342736626045356e-06,
"loss": 0.1542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14757779240608215,
"step": 4025,
"valid_targets_mean": 4953.8,
"valid_targets_min": 723
},
{
"epoch": 6.096822995461422,
"grad_norm": 0.45503441348935464,
"learning_rate": 2.0012495736799753e-06,
"loss": 0.1481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1418561339378357,
"step": 4030,
"valid_targets_mean": 5156.3,
"valid_targets_min": 932
},
{
"epoch": 6.104387291981846,
"grad_norm": 0.40513522356616916,
"learning_rate": 1.9684816145801776e-06,
"loss": 0.1456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13881005346775055,
"step": 4035,
"valid_targets_mean": 5304.2,
"valid_targets_min": 2569
},
{
"epoch": 6.1119515885022695,
"grad_norm": 0.4269784848098862,
"learning_rate": 1.9359702516070553e-06,
"loss": 0.158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1601366251707077,
"step": 4040,
"valid_targets_mean": 5462.7,
"valid_targets_min": 573
},
{
"epoch": 6.119515885022693,
"grad_norm": 0.5519519701322759,
"learning_rate": 1.9037159474110333e-06,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1714671403169632,
"step": 4045,
"valid_targets_mean": 3356.6,
"valid_targets_min": 778
},
{
"epoch": 6.127080181543117,
"grad_norm": 0.4351482020097601,
"learning_rate": 1.8717191609844931e-06,
"loss": 0.1624,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16394942998886108,
"step": 4050,
"valid_targets_mean": 5265.4,
"valid_targets_min": 766
},
{
"epoch": 6.1346444780635405,
"grad_norm": 0.40124586897572423,
"learning_rate": 1.8399803476552303e-06,
"loss": 0.1518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12816530466079712,
"step": 4055,
"valid_targets_mean": 4822.0,
"valid_targets_min": 1189
},
{
"epoch": 6.142208774583963,
"grad_norm": 0.384206751077286,
"learning_rate": 1.8084999590799678e-06,
"loss": 0.1439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15090115368366241,
"step": 4060,
"valid_targets_mean": 6546.3,
"valid_targets_min": 2772
},
{
"epoch": 6.149773071104387,
"grad_norm": 1.2611731543758526,
"learning_rate": 1.7772784432379398e-06,
"loss": 0.1406,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1444360464811325,
"step": 4065,
"valid_targets_mean": 4284.9,
"valid_targets_min": 562
},
{
"epoch": 6.157337367624811,
"grad_norm": 0.414208754194147,
"learning_rate": 1.7463162444245174e-06,
"loss": 0.1557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15277935564517975,
"step": 4070,
"valid_targets_mean": 5458.4,
"valid_targets_min": 1847
},
{
"epoch": 6.164901664145234,
"grad_norm": 0.5352430006908002,
"learning_rate": 1.7156138032448621e-06,
"loss": 0.1557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17013967037200928,
"step": 4075,
"valid_targets_mean": 4358.4,
"valid_targets_min": 627
},
{
"epoch": 6.172465960665658,
"grad_norm": 0.4390587640921899,
"learning_rate": 1.6851715566076942e-06,
"loss": 0.148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1464182734489441,
"step": 4080,
"valid_targets_mean": 5010.7,
"valid_targets_min": 498
},
{
"epoch": 6.180030257186082,
"grad_norm": 0.5455898884169155,
"learning_rate": 1.6549899377190448e-06,
"loss": 0.1575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1335110366344452,
"step": 4085,
"valid_targets_mean": 3511.6,
"valid_targets_min": 457
},
{
"epoch": 6.187594553706505,
"grad_norm": 0.4098562706112613,
"learning_rate": 1.6250693760761072e-06,
"loss": 0.1453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14616535604000092,
"step": 4090,
"valid_targets_mean": 5443.2,
"valid_targets_min": 894
},
{
"epoch": 6.195158850226929,
"grad_norm": 0.5540401439486693,
"learning_rate": 1.5954102974611218e-06,
"loss": 0.1566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18993410468101501,
"step": 4095,
"valid_targets_mean": 4211.4,
"valid_targets_min": 662
},
{
"epoch": 6.202723146747353,
"grad_norm": 0.4054113810918477,
"learning_rate": 1.5660131239353037e-06,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15200453996658325,
"step": 4100,
"valid_targets_mean": 5708.1,
"valid_targets_min": 1104
},
{
"epoch": 6.210287443267776,
"grad_norm": 0.590958853321242,
"learning_rate": 1.536878273832858e-06,
"loss": 0.1447,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16703468561172485,
"step": 4105,
"valid_targets_mean": 4328.2,
"valid_targets_min": 619
},
{
"epoch": 6.2178517397882,
"grad_norm": 0.4431701530215047,
"learning_rate": 1.5080061617550157e-06,
"loss": 0.1547,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16911979019641876,
"step": 4110,
"valid_targets_mean": 5307.1,
"valid_targets_min": 801
},
{
"epoch": 6.225416036308624,
"grad_norm": 0.447619549856025,
"learning_rate": 1.4793971985641298e-06,
"loss": 0.1655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16727328300476074,
"step": 4115,
"valid_targets_mean": 5365.2,
"valid_targets_min": 1941
},
{
"epoch": 6.2329803328290465,
"grad_norm": 0.49490312967592337,
"learning_rate": 1.45105179137784e-06,
"loss": 0.1532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16049346327781677,
"step": 4120,
"valid_targets_mean": 4772.8,
"valid_targets_min": 971
},
{
"epoch": 6.24054462934947,
"grad_norm": 0.5002729276708221,
"learning_rate": 1.4229703435632702e-06,
"loss": 0.1445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15890288352966309,
"step": 4125,
"valid_targets_mean": 4810.2,
"valid_targets_min": 871
},
{
"epoch": 6.248108925869894,
"grad_norm": 0.3972740664066531,
"learning_rate": 1.395153254731285e-06,
"loss": 0.1467,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1513948142528534,
"step": 4130,
"valid_targets_mean": 5640.1,
"valid_targets_min": 714
},
{
"epoch": 6.2556732223903175,
"grad_norm": 0.43980618632091506,
"learning_rate": 1.367600920730816e-06,
"loss": 0.174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1656402349472046,
"step": 4135,
"valid_targets_mean": 5542.3,
"valid_targets_min": 1749
},
{
"epoch": 6.263237518910741,
"grad_norm": 0.4443207443673087,
"learning_rate": 1.3403137336432193e-06,
"loss": 0.1659,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1583198606967926,
"step": 4140,
"valid_targets_mean": 5384.4,
"valid_targets_min": 753
},
{
"epoch": 6.270801815431165,
"grad_norm": 0.4753683286569819,
"learning_rate": 1.313292081776698e-06,
"loss": 0.149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17670109868049622,
"step": 4145,
"valid_targets_mean": 4728.7,
"valid_targets_min": 488
},
{
"epoch": 6.278366111951589,
"grad_norm": 0.4969598551390092,
"learning_rate": 1.286536349660783e-06,
"loss": 0.1538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14761213958263397,
"step": 4150,
"valid_targets_mean": 3709.7,
"valid_targets_min": 645
},
{
"epoch": 6.285930408472012,
"grad_norm": 0.5059874781677619,
"learning_rate": 1.2600469180408403e-06,
"loss": 0.1421,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1481596827507019,
"step": 4155,
"valid_targets_mean": 4018.0,
"valid_targets_min": 342
},
{
"epoch": 6.293494704992436,
"grad_norm": 0.41740987872915114,
"learning_rate": 1.2338241638726811e-06,
"loss": 0.1543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16702906787395477,
"step": 4160,
"valid_targets_mean": 6024.6,
"valid_targets_min": 581
},
{
"epoch": 6.30105900151286,
"grad_norm": 0.4637071225113284,
"learning_rate": 1.2078684603171787e-06,
"loss": 0.1477,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.139248326420784,
"step": 4165,
"valid_targets_mean": 4567.2,
"valid_targets_min": 1063
},
{
"epoch": 6.308623298033283,
"grad_norm": 0.5155678448385924,
"learning_rate": 1.1821801767349616e-06,
"loss": 0.1574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15290087461471558,
"step": 4170,
"valid_targets_mean": 4242.0,
"valid_targets_min": 654
},
{
"epoch": 6.316187594553707,
"grad_norm": 0.5065606805513911,
"learning_rate": 1.1567596786811652e-06,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13100755214691162,
"step": 4175,
"valid_targets_mean": 3437.8,
"valid_targets_min": 858
},
{
"epoch": 6.32375189107413,
"grad_norm": 0.44032005356083065,
"learning_rate": 1.1316073279002172e-06,
"loss": 0.1487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14807850122451782,
"step": 4180,
"valid_targets_mean": 4680.6,
"valid_targets_min": 522
},
{
"epoch": 6.331316187594553,
"grad_norm": 0.4547949954293122,
"learning_rate": 1.1067234823206951e-06,
"loss": 0.1545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14795613288879395,
"step": 4185,
"valid_targets_mean": 4760.6,
"valid_targets_min": 476
},
{
"epoch": 6.338880484114977,
"grad_norm": 0.4554441505241382,
"learning_rate": 1.0821084960502404e-06,
"loss": 0.1641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1481642872095108,
"step": 4190,
"valid_targets_mean": 4714.2,
"valid_targets_min": 2218
},
{
"epoch": 6.346444780635401,
"grad_norm": 0.4378844494460036,
"learning_rate": 1.0577627193705098e-06,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16023436188697815,
"step": 4195,
"valid_targets_mean": 4950.8,
"valid_targets_min": 698
},
{
"epoch": 6.354009077155824,
"grad_norm": 0.41590217934510926,
"learning_rate": 1.0336864987321938e-06,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13555586338043213,
"step": 4200,
"valid_targets_mean": 5161.0,
"valid_targets_min": 2019
},
{
"epoch": 6.361573373676248,
"grad_norm": 0.5143664594370752,
"learning_rate": 1.0098801767500842e-06,
"loss": 0.1465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1585438847541809,
"step": 4205,
"valid_targets_mean": 4201.8,
"valid_targets_min": 2109
},
{
"epoch": 6.369137670196672,
"grad_norm": 0.4399131246610985,
"learning_rate": 9.863440921982104e-07,
"loss": 0.1448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13819454610347748,
"step": 4210,
"valid_targets_mean": 4746.9,
"valid_targets_min": 747
},
{
"epoch": 6.376701966717095,
"grad_norm": 0.8335656415915854,
"learning_rate": 9.630785800049947e-07,
"loss": 0.1534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16780400276184082,
"step": 4215,
"valid_targets_mean": 4925.7,
"valid_targets_min": 746
},
{
"epoch": 6.384266263237519,
"grad_norm": 0.4067684611911977,
"learning_rate": 9.40083971248511e-07,
"loss": 0.1561,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1596384346485138,
"step": 4220,
"valid_targets_mean": 6230.5,
"valid_targets_min": 587
},
{
"epoch": 6.391830559757943,
"grad_norm": 0.43309543072557627,
"learning_rate": 9.173605931517526e-07,
"loss": 0.152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15254181623458862,
"step": 4225,
"valid_targets_mean": 5193.5,
"valid_targets_min": 551
},
{
"epoch": 6.3993948562783665,
"grad_norm": 0.4574867684924863,
"learning_rate": 8.949087690780023e-07,
"loss": 0.1648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15973302721977234,
"step": 4230,
"valid_targets_mean": 4612.9,
"valid_targets_min": 506
},
{
"epoch": 6.406959152798789,
"grad_norm": 0.4542653244014224,
"learning_rate": 8.727288185262029e-07,
"loss": 0.1687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1596071720123291,
"step": 4235,
"valid_targets_mean": 4488.4,
"valid_targets_min": 416
},
{
"epoch": 6.414523449319213,
"grad_norm": 0.4572109475990556,
"learning_rate": 8.508210571264186e-07,
"loss": 0.1458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14880454540252686,
"step": 4240,
"valid_targets_mean": 5173.1,
"valid_targets_min": 716
},
{
"epoch": 6.422087745839637,
"grad_norm": 0.6070546959330988,
"learning_rate": 8.291857966353545e-07,
"loss": 0.1734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16235873103141785,
"step": 4245,
"valid_targets_mean": 3878.2,
"valid_targets_min": 434
},
{
"epoch": 6.42965204236006,
"grad_norm": 0.5670598499888627,
"learning_rate": 8.078233449319128e-07,
"loss": 0.1622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16082099080085754,
"step": 4250,
"valid_targets_mean": 3953.2,
"valid_targets_min": 511
},
{
"epoch": 6.437216338880484,
"grad_norm": 0.41041322824939125,
"learning_rate": 7.867340060128037e-07,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13654690980911255,
"step": 4255,
"valid_targets_mean": 5684.5,
"valid_targets_min": 361
},
{
"epoch": 6.444780635400908,
"grad_norm": 0.4199160542149558,
"learning_rate": 7.659180799882371e-07,
"loss": 0.1583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15124070644378662,
"step": 4260,
"valid_targets_mean": 5140.1,
"valid_targets_min": 332
},
{
"epoch": 6.452344931921331,
"grad_norm": 0.4939206548010923,
"learning_rate": 7.453758630776398e-07,
"loss": 0.1463,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16383801400661469,
"step": 4265,
"valid_targets_mean": 4354.5,
"valid_targets_min": 850
},
{
"epoch": 6.459909228441755,
"grad_norm": 0.4501260238297891,
"learning_rate": 7.25107647605432e-07,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15669146180152893,
"step": 4270,
"valid_targets_mean": 5121.8,
"valid_targets_min": 677
},
{
"epoch": 6.467473524962179,
"grad_norm": 0.4734703379153941,
"learning_rate": 7.051137219968885e-07,
"loss": 0.1505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14317908883094788,
"step": 4275,
"valid_targets_mean": 4474.1,
"valid_targets_min": 571
},
{
"epoch": 6.475037821482602,
"grad_norm": 0.4564012604214816,
"learning_rate": 6.853943707740218e-07,
"loss": 0.1516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12744159996509552,
"step": 4280,
"valid_targets_mean": 4480.9,
"valid_targets_min": 1132
},
{
"epoch": 6.482602118003026,
"grad_norm": 0.4721394856153527,
"learning_rate": 6.659498745515258e-07,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1510826200246811,
"step": 4285,
"valid_targets_mean": 4945.0,
"valid_targets_min": 706
},
{
"epoch": 6.49016641452345,
"grad_norm": 0.5177102676493053,
"learning_rate": 6.467805100328117e-07,
"loss": 0.1442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14990335702896118,
"step": 4290,
"valid_targets_mean": 4293.1,
"valid_targets_min": 496
},
{
"epoch": 6.497730711043873,
"grad_norm": 0.4743441140245587,
"learning_rate": 6.278865500060271e-07,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18568217754364014,
"step": 4295,
"valid_targets_mean": 4790.9,
"valid_targets_min": 1246
},
{
"epoch": 6.505295007564296,
"grad_norm": 0.46507859849231403,
"learning_rate": 6.092682633402103e-07,
"loss": 0.1494,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14523780345916748,
"step": 4300,
"valid_targets_mean": 5654.4,
"valid_targets_min": 1877
},
{
"epoch": 6.51285930408472,
"grad_norm": 0.43490921069799204,
"learning_rate": 5.909259149814505e-07,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1442725956439972,
"step": 4305,
"valid_targets_mean": 5352.5,
"valid_targets_min": 474
},
{
"epoch": 6.5204236006051435,
"grad_norm": 0.4707066879537463,
"learning_rate": 5.728597659491142e-07,
"loss": 0.1635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1738138496875763,
"step": 4310,
"valid_targets_mean": 4893.9,
"valid_targets_min": 254
},
{
"epoch": 6.527987897125567,
"grad_norm": 0.4241793853464637,
"learning_rate": 5.550700733321379e-07,
"loss": 0.1737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1556629091501236,
"step": 4315,
"valid_targets_mean": 5057.2,
"valid_targets_min": 2822
},
{
"epoch": 6.535552193645991,
"grad_norm": 0.46368809571656755,
"learning_rate": 5.375570902853633e-07,
"loss": 0.1516,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13116100430488586,
"step": 4320,
"valid_targets_mean": 4321.1,
"valid_targets_min": 507
},
{
"epoch": 6.5431164901664145,
"grad_norm": 0.5052781045290954,
"learning_rate": 5.203210660259439e-07,
"loss": 0.1603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16794294118881226,
"step": 4325,
"valid_targets_mean": 4214.9,
"valid_targets_min": 611
},
{
"epoch": 6.550680786686838,
"grad_norm": 0.5073596132262154,
"learning_rate": 5.033622458297859e-07,
"loss": 0.165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1713084876537323,
"step": 4330,
"valid_targets_mean": 4483.1,
"valid_targets_min": 929
},
{
"epoch": 6.558245083207262,
"grad_norm": 0.4964554507482467,
"learning_rate": 4.866808710280691e-07,
"loss": 0.1437,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1499142050743103,
"step": 4335,
"valid_targets_mean": 4372.1,
"valid_targets_min": 486
},
{
"epoch": 6.5658093797276855,
"grad_norm": 0.519199836361022,
"learning_rate": 4.702771790038041e-07,
"loss": 0.1496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1542699635028839,
"step": 4340,
"valid_targets_mean": 3608.7,
"valid_targets_min": 520
},
{
"epoch": 6.573373676248109,
"grad_norm": 0.5427545547266298,
"learning_rate": 4.5415140318846306e-07,
"loss": 0.1537,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18496286869049072,
"step": 4345,
"valid_targets_mean": 4414.1,
"valid_targets_min": 769
},
{
"epoch": 6.580937972768533,
"grad_norm": 0.4891244974517963,
"learning_rate": 4.383037730586481e-07,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1510729044675827,
"step": 4350,
"valid_targets_mean": 4612.4,
"valid_targets_min": 345
},
{
"epoch": 6.588502269288956,
"grad_norm": 0.4882037237746936,
"learning_rate": 4.227345141328343e-07,
"loss": 0.1509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17036430537700653,
"step": 4355,
"valid_targets_mean": 5320.2,
"valid_targets_min": 1887
},
{
"epoch": 6.59606656580938,
"grad_norm": 0.4307780734929585,
"learning_rate": 4.074438479681564e-07,
"loss": 0.1556,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1584295928478241,
"step": 4360,
"valid_targets_mean": 5430.9,
"valid_targets_min": 927
},
{
"epoch": 6.603630862329803,
"grad_norm": 0.4772782028419242,
"learning_rate": 3.924319921572561e-07,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1360929310321808,
"step": 4365,
"valid_targets_mean": 3927.8,
"valid_targets_min": 688
},
{
"epoch": 6.611195158850227,
"grad_norm": 0.50833656176906,
"learning_rate": 3.7769916032518227e-07,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16856953501701355,
"step": 4370,
"valid_targets_mean": 4089.0,
"valid_targets_min": 711
},
{
"epoch": 6.61875945537065,
"grad_norm": 0.656485093888422,
"learning_rate": 3.63245562126362e-07,
"loss": 0.1571,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15266793966293335,
"step": 4375,
"valid_targets_mean": 5172.1,
"valid_targets_min": 642
},
{
"epoch": 6.626323751891074,
"grad_norm": 0.4561975368678506,
"learning_rate": 3.490714032416032e-07,
"loss": 0.1679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.183062344789505,
"step": 4380,
"valid_targets_mean": 5307.6,
"valid_targets_min": 1195
},
{
"epoch": 6.633888048411498,
"grad_norm": 0.7110131773558642,
"learning_rate": 3.351768853751769e-07,
"loss": 0.1487,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13424867391586304,
"step": 4385,
"valid_targets_mean": 4276.8,
"valid_targets_min": 509
},
{
"epoch": 6.641452344931921,
"grad_norm": 0.4678252102427936,
"learning_rate": 3.2156220625194633e-07,
"loss": 0.1577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14004451036453247,
"step": 4390,
"valid_targets_mean": 5015.1,
"valid_targets_min": 1259
},
{
"epoch": 6.649016641452345,
"grad_norm": 0.4246923427532061,
"learning_rate": 3.082275596145445e-07,
"loss": 0.1562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17100787162780762,
"step": 4395,
"valid_targets_mean": 5502.5,
"valid_targets_min": 2260
},
{
"epoch": 6.656580937972769,
"grad_norm": 0.5330628132067585,
"learning_rate": 2.951731352206322e-07,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1702652871608734,
"step": 4400,
"valid_targets_mean": 3936.1,
"valid_targets_min": 665
},
{
"epoch": 6.664145234493192,
"grad_norm": 0.4965404997875294,
"learning_rate": 2.8239911884018423e-07,
"loss": 0.1584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16452646255493164,
"step": 4405,
"valid_targets_mean": 4274.4,
"valid_targets_min": 877
},
{
"epoch": 6.671709531013616,
"grad_norm": 0.4915934752549612,
"learning_rate": 2.69905692252852e-07,
"loss": 0.1502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15462955832481384,
"step": 4410,
"valid_targets_mean": 4155.4,
"valid_targets_min": 632
},
{
"epoch": 6.67927382753404,
"grad_norm": 0.4336803794043365,
"learning_rate": 2.576930332453742e-07,
"loss": 0.1625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18209487199783325,
"step": 4415,
"valid_targets_mean": 6130.0,
"valid_targets_min": 637
},
{
"epoch": 6.6868381240544625,
"grad_norm": 0.4812053413355094,
"learning_rate": 2.4576131560905216e-07,
"loss": 0.1549,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16345643997192383,
"step": 4420,
"valid_targets_mean": 4934.9,
"valid_targets_min": 977
},
{
"epoch": 6.694402420574886,
"grad_norm": 0.49964213190276036,
"learning_rate": 2.341107091372674e-07,
"loss": 0.1677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17566847801208496,
"step": 4425,
"valid_targets_mean": 4736.9,
"valid_targets_min": 923
},
{
"epoch": 6.70196671709531,
"grad_norm": 0.4652703083015772,
"learning_rate": 2.2274137962307264e-07,
"loss": 0.1465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14961759746074677,
"step": 4430,
"valid_targets_mean": 4612.9,
"valid_targets_min": 1135
},
{
"epoch": 6.709531013615734,
"grad_norm": 0.43970643901140566,
"learning_rate": 2.1165348885683557e-07,
"loss": 0.1617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1801401823759079,
"step": 4435,
"valid_targets_mean": 5360.0,
"valid_targets_min": 805
},
{
"epoch": 6.717095310136157,
"grad_norm": 0.5006540034502627,
"learning_rate": 2.0084719462392544e-07,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15871846675872803,
"step": 4440,
"valid_targets_mean": 4147.4,
"valid_targets_min": 740
},
{
"epoch": 6.724659606656581,
"grad_norm": 0.4655065162357877,
"learning_rate": 1.903226507024769e-07,
"loss": 0.1554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17267106473445892,
"step": 4445,
"valid_targets_mean": 4900.9,
"valid_targets_min": 994
},
{
"epoch": 6.732223903177005,
"grad_norm": 0.4776542317912404,
"learning_rate": 1.800800068611941e-07,
"loss": 0.1619,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14296205341815948,
"step": 4450,
"valid_targets_mean": 4429.6,
"valid_targets_min": 644
},
{
"epoch": 6.739788199697428,
"grad_norm": 0.4645194361477701,
"learning_rate": 1.7011940885723222e-07,
"loss": 0.1593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.158104807138443,
"step": 4455,
"valid_targets_mean": 4528.9,
"valid_targets_min": 719
},
{
"epoch": 6.747352496217852,
"grad_norm": 0.463140877582521,
"learning_rate": 1.60440998434106e-07,
"loss": 0.164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15552181005477905,
"step": 4460,
"valid_targets_mean": 4513.7,
"valid_targets_min": 333
},
{
"epoch": 6.754916792738276,
"grad_norm": 0.4310101427133752,
"learning_rate": 1.5104491331968674e-07,
"loss": 0.1552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15951894223690033,
"step": 4465,
"valid_targets_mean": 5195.2,
"valid_targets_min": 814
},
{
"epoch": 6.762481089258699,
"grad_norm": 0.48515138640133515,
"learning_rate": 1.4193128722423954e-07,
"loss": 0.1586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1668251007795334,
"step": 4470,
"valid_targets_mean": 4821.4,
"valid_targets_min": 1072
},
{
"epoch": 6.770045385779122,
"grad_norm": 0.46924780947969497,
"learning_rate": 1.3310024983851367e-07,
"loss": 0.1551,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14621658623218536,
"step": 4475,
"valid_targets_mean": 4700.8,
"valid_targets_min": 578
},
{
"epoch": 6.777609682299547,
"grad_norm": 0.47997006639888423,
"learning_rate": 1.2455192683189955e-07,
"loss": 0.1485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1525563895702362,
"step": 4480,
"valid_targets_mean": 4628.7,
"valid_targets_min": 749
},
{
"epoch": 6.785173978819969,
"grad_norm": 0.44729024533554707,
"learning_rate": 1.1628643985064802e-07,
"loss": 0.1515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1606258600950241,
"step": 4485,
"valid_targets_mean": 5041.1,
"valid_targets_min": 2257
},
{
"epoch": 6.792738275340393,
"grad_norm": 0.5567659415227543,
"learning_rate": 1.0830390651613399e-07,
"loss": 0.1588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1706101894378662,
"step": 4490,
"valid_targets_mean": 3684.8,
"valid_targets_min": 533
},
{
"epoch": 6.800302571860817,
"grad_norm": 0.44905642734474416,
"learning_rate": 1.0060444042317984e-07,
"loss": 0.1618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1561523973941803,
"step": 4495,
"valid_targets_mean": 5226.9,
"valid_targets_min": 2218
},
{
"epoch": 6.80786686838124,
"grad_norm": 0.44526000556057144,
"learning_rate": 9.318815113843915e-08,
"loss": 0.1581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14291979372501373,
"step": 4500,
"valid_targets_mean": 4976.4,
"valid_targets_min": 970
},
{
"epoch": 6.815431164901664,
"grad_norm": 0.41389807910948084,
"learning_rate": 8.605514419884442e-08,
"loss": 0.147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1524887979030609,
"step": 4505,
"valid_targets_mean": 5439.3,
"valid_targets_min": 2445
},
{
"epoch": 6.822995461422088,
"grad_norm": 0.573972759244845,
"learning_rate": 7.92055211100995e-08,
"loss": 0.1546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14557316899299622,
"step": 4510,
"valid_targets_mean": 4493.8,
"valid_targets_min": 1014
},
{
"epoch": 6.8305597579425115,
"grad_norm": 0.49554661750919793,
"learning_rate": 7.263937934523402e-08,
"loss": 0.15,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.146365225315094,
"step": 4515,
"valid_targets_mean": 4681.9,
"valid_targets_min": 662
},
{
"epoch": 6.838124054462935,
"grad_norm": 0.41268242005804795,
"learning_rate": 6.635681234321789e-08,
"loss": 0.1544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12661297619342804,
"step": 4520,
"valid_targets_mean": 5688.6,
"valid_targets_min": 672
},
{
"epoch": 6.845688350983359,
"grad_norm": 0.5245346275052402,
"learning_rate": 6.035790950764008e-08,
"loss": 0.1459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15378622710704803,
"step": 4525,
"valid_targets_mean": 3729.6,
"valid_targets_min": 435
},
{
"epoch": 6.8532526475037825,
"grad_norm": 0.536981712222097,
"learning_rate": 5.464275620542081e-08,
"loss": 0.1592,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16862401366233826,
"step": 4530,
"valid_targets_mean": 4265.4,
"valid_targets_min": 617
},
{
"epoch": 6.860816944024206,
"grad_norm": 0.661040289886661,
"learning_rate": 4.921143376560355e-08,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19529613852500916,
"step": 4535,
"valid_targets_mean": 4173.4,
"valid_targets_min": 903
},
{
"epoch": 6.868381240544629,
"grad_norm": 0.4025079338035215,
"learning_rate": 4.4064019478207154e-08,
"loss": 0.1444,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14101910591125488,
"step": 4540,
"valid_targets_mean": 5818.1,
"valid_targets_min": 527
},
{
"epoch": 6.875945537065053,
"grad_norm": 0.4700049710206088,
"learning_rate": 3.920058659310666e-08,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16515228152275085,
"step": 4545,
"valid_targets_mean": 4960.9,
"valid_targets_min": 620
},
{
"epoch": 6.883509833585476,
"grad_norm": 0.4603067526871369,
"learning_rate": 3.4621204319011946e-08,
"loss": 0.1493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14470770955085754,
"step": 4550,
"valid_targets_mean": 4982.2,
"valid_targets_min": 831
},
{
"epoch": 6.8910741301059,
"grad_norm": 0.4673350592645921,
"learning_rate": 3.032593782246629e-08,
"loss": 0.1578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14939948916435242,
"step": 4555,
"valid_targets_mean": 4254.9,
"valid_targets_min": 987
},
{
"epoch": 6.898638426626324,
"grad_norm": 0.4517397456464997,
"learning_rate": 2.6314848226927094e-08,
"loss": 0.1453,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15728193521499634,
"step": 4560,
"valid_targets_mean": 4525.2,
"valid_targets_min": 711
},
{
"epoch": 6.906202723146747,
"grad_norm": 0.5117006909099115,
"learning_rate": 2.258799261189326e-08,
"loss": 0.1506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17386361956596375,
"step": 4565,
"valid_targets_mean": 4593.4,
"valid_targets_min": 630
},
{
"epoch": 6.913767019667171,
"grad_norm": 0.41306104008904443,
"learning_rate": 1.9145424012096957e-08,
"loss": 0.1525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15774936974048615,
"step": 4570,
"valid_targets_mean": 6134.3,
"valid_targets_min": 2953
},
{
"epoch": 6.921331316187595,
"grad_norm": 0.40696459882097896,
"learning_rate": 1.5987191416744208e-08,
"loss": 0.1611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1495034098625183,
"step": 4575,
"valid_targets_mean": 6611.8,
"valid_targets_min": 1330
},
{
"epoch": 6.928895612708018,
"grad_norm": 0.47931424197263106,
"learning_rate": 1.3113339768817679e-08,
"loss": 0.1486,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16390691697597504,
"step": 4580,
"valid_targets_mean": 4471.8,
"valid_targets_min": 723
},
{
"epoch": 6.936459909228442,
"grad_norm": 0.4461599389375818,
"learning_rate": 1.0523909964441636e-08,
"loss": 0.1495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15007872879505157,
"step": 4585,
"valid_targets_mean": 4946.4,
"valid_targets_min": 738
},
{
"epoch": 6.944024205748866,
"grad_norm": 0.430644073341138,
"learning_rate": 8.218938852295744e-09,
"loss": 0.1484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11911873519420624,
"step": 4590,
"valid_targets_mean": 5387.9,
"valid_targets_min": 681
},
{
"epoch": 6.9515885022692885,
"grad_norm": 0.544666118636178,
"learning_rate": 6.1984592330954776e-09,
"loss": 0.1391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12848445773124695,
"step": 4595,
"valid_targets_mean": 4979.9,
"valid_targets_min": 364
},
{
"epoch": 6.959152798789713,
"grad_norm": 0.47313846425247624,
"learning_rate": 4.4624998591191735e-09,
"loss": 0.1507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.164044588804245,
"step": 4600,
"valid_targets_mean": 4802.0,
"valid_targets_min": 1697
},
{
"epoch": 6.966717095310136,
"grad_norm": 0.5499679479102836,
"learning_rate": 3.0110854337994654e-09,
"loss": 0.1599,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1561359018087387,
"step": 4605,
"valid_targets_mean": 3980.2,
"valid_targets_min": 711
},
{
"epoch": 6.9742813918305595,
"grad_norm": 0.47453995839514496,
"learning_rate": 1.8442366113791132e-09,
"loss": 0.1616,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16566257178783417,
"step": 4610,
"valid_targets_mean": 4593.8,
"valid_targets_min": 932
},
{
"epoch": 6.981845688350983,
"grad_norm": 0.4033635076972133,
"learning_rate": 9.619699966090245e-10,
"loss": 0.1608,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15273799002170563,
"step": 4615,
"valid_targets_mean": 6477.4,
"valid_targets_min": 1671
},
{
"epoch": 6.989409984871407,
"grad_norm": 0.45663261359056423,
"learning_rate": 3.642981445173277e-10,
"loss": 0.1482,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14979088306427002,
"step": 4620,
"valid_targets_mean": 4614.1,
"valid_targets_min": 625
},
{
"epoch": 6.9969742813918305,
"grad_norm": 0.42449100353688324,
"learning_rate": 5.1229560225074525e-11,
"loss": 0.1511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13834691047668457,
"step": 4625,
"valid_targets_mean": 5519.8,
"valid_targets_min": 2736
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13807812333106995,
"step": 4627,
"total_flos": 1697568073121792.0,
"train_loss": 0.19562295946828587,
"train_runtime": 28413.4165,
"train_samples_per_second": 2.604,
"train_steps_per_second": 0.163,
"valid_targets_mean": 4912.6,
"valid_targets_min": 607
}
],
"logging_steps": 5,
"max_steps": 4627,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1697568073121792.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}