penfever's picture
End of training
f5f3bc8 verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 3850,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.009099181073703366,
"grad_norm": 14.786740346535169,
"learning_rate": 4.155844155844156e-07,
"loss": 0.7964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4239060580730438,
"step": 5,
"valid_targets_mean": 3328.6,
"valid_targets_min": 1920
},
{
"epoch": 0.018198362147406732,
"grad_norm": 16.012612850793044,
"learning_rate": 9.350649350649352e-07,
"loss": 0.7542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43628671765327454,
"step": 10,
"valid_targets_mean": 4038.5,
"valid_targets_min": 510
},
{
"epoch": 0.0272975432211101,
"grad_norm": 11.637341370322037,
"learning_rate": 1.4545454545454546e-06,
"loss": 0.6985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25581756234169006,
"step": 15,
"valid_targets_mean": 2830.5,
"valid_targets_min": 1594
},
{
"epoch": 0.036396724294813464,
"grad_norm": 9.205480878961371,
"learning_rate": 1.9740259740259743e-06,
"loss": 0.7378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43626388907432556,
"step": 20,
"valid_targets_mean": 2573.2,
"valid_targets_min": 503
},
{
"epoch": 0.04549590536851683,
"grad_norm": 6.503069240270076,
"learning_rate": 2.4935064935064936e-06,
"loss": 0.6758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3213389217853546,
"step": 25,
"valid_targets_mean": 3504.4,
"valid_targets_min": 562
},
{
"epoch": 0.0545950864422202,
"grad_norm": 5.450861291416442,
"learning_rate": 3.0129870129870133e-06,
"loss": 0.6141,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31898123025894165,
"step": 30,
"valid_targets_mean": 3968.9,
"valid_targets_min": 2624
},
{
"epoch": 0.06369426751592357,
"grad_norm": 4.3390051294027145,
"learning_rate": 3.532467532467533e-06,
"loss": 0.5348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29908043146133423,
"step": 35,
"valid_targets_mean": 3511.2,
"valid_targets_min": 1657
},
{
"epoch": 0.07279344858962693,
"grad_norm": 1.7434242750268414,
"learning_rate": 4.051948051948053e-06,
"loss": 0.4927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2466040551662445,
"step": 40,
"valid_targets_mean": 4462.8,
"valid_targets_min": 862
},
{
"epoch": 0.0818926296633303,
"grad_norm": 1.3123142041030291,
"learning_rate": 4.571428571428572e-06,
"loss": 0.4902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24911117553710938,
"step": 45,
"valid_targets_mean": 4395.0,
"valid_targets_min": 2994
},
{
"epoch": 0.09099181073703366,
"grad_norm": 1.0370754476225932,
"learning_rate": 5.090909090909091e-06,
"loss": 0.4637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21570774912834167,
"step": 50,
"valid_targets_mean": 3738.4,
"valid_targets_min": 601
},
{
"epoch": 0.10009099181073704,
"grad_norm": 1.0104012155244833,
"learning_rate": 5.6103896103896105e-06,
"loss": 0.4562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24701082706451416,
"step": 55,
"valid_targets_mean": 2790.5,
"valid_targets_min": 1528
},
{
"epoch": 0.1091901728844404,
"grad_norm": 0.7663704291957927,
"learning_rate": 6.129870129870131e-06,
"loss": 0.4542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23319780826568604,
"step": 60,
"valid_targets_mean": 4510.6,
"valid_targets_min": 1800
},
{
"epoch": 0.11828935395814377,
"grad_norm": 0.8498028917774307,
"learning_rate": 6.64935064935065e-06,
"loss": 0.4485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24339726567268372,
"step": 65,
"valid_targets_mean": 3079.8,
"valid_targets_min": 1365
},
{
"epoch": 0.12738853503184713,
"grad_norm": 0.7238294258812147,
"learning_rate": 7.16883116883117e-06,
"loss": 0.4281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18463903665542603,
"step": 70,
"valid_targets_mean": 2951.8,
"valid_targets_min": 306
},
{
"epoch": 0.1364877161055505,
"grad_norm": 0.7422498404553763,
"learning_rate": 7.68831168831169e-06,
"loss": 0.4167,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2971900403499603,
"step": 75,
"valid_targets_mean": 5033.6,
"valid_targets_min": 705
},
{
"epoch": 0.14558689717925385,
"grad_norm": 0.7477819199483188,
"learning_rate": 8.20779220779221e-06,
"loss": 0.4342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19027340412139893,
"step": 80,
"valid_targets_mean": 2463.9,
"valid_targets_min": 287
},
{
"epoch": 0.15468607825295724,
"grad_norm": 0.7810954141754345,
"learning_rate": 8.727272727272728e-06,
"loss": 0.4291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21374209225177765,
"step": 85,
"valid_targets_mean": 2681.8,
"valid_targets_min": 1059
},
{
"epoch": 0.1637852593266606,
"grad_norm": 0.736357169889036,
"learning_rate": 9.246753246753248e-06,
"loss": 0.411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24572578072547913,
"step": 90,
"valid_targets_mean": 3635.2,
"valid_targets_min": 1665
},
{
"epoch": 0.17288444040036396,
"grad_norm": 0.601778477867443,
"learning_rate": 9.766233766233766e-06,
"loss": 0.4094,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20906668901443481,
"step": 95,
"valid_targets_mean": 4694.9,
"valid_targets_min": 2787
},
{
"epoch": 0.18198362147406733,
"grad_norm": 0.7108557287411013,
"learning_rate": 1.0285714285714285e-05,
"loss": 0.4183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23694711923599243,
"step": 100,
"valid_targets_mean": 3789.9,
"valid_targets_min": 2115
},
{
"epoch": 0.1910828025477707,
"grad_norm": 0.7213642248877461,
"learning_rate": 1.0805194805194805e-05,
"loss": 0.3775,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17074792087078094,
"step": 105,
"valid_targets_mean": 2586.1,
"valid_targets_min": 188
},
{
"epoch": 0.20018198362147407,
"grad_norm": 0.5465254431332037,
"learning_rate": 1.1324675324675325e-05,
"loss": 0.3878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18964694440364838,
"step": 110,
"valid_targets_mean": 3826.4,
"valid_targets_min": 1437
},
{
"epoch": 0.20928116469517744,
"grad_norm": 0.6290670154418285,
"learning_rate": 1.1844155844155845e-05,
"loss": 0.3946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17479845881462097,
"step": 115,
"valid_targets_mean": 3998.0,
"valid_targets_min": 501
},
{
"epoch": 0.2183803457688808,
"grad_norm": 0.7219274776090822,
"learning_rate": 1.2363636363636364e-05,
"loss": 0.3796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22305920720100403,
"step": 120,
"valid_targets_mean": 3191.8,
"valid_targets_min": 1186
},
{
"epoch": 0.22747952684258416,
"grad_norm": 0.6217810003610046,
"learning_rate": 1.2883116883116884e-05,
"loss": 0.3889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23009517788887024,
"step": 125,
"valid_targets_mean": 4508.2,
"valid_targets_min": 2876
},
{
"epoch": 0.23657870791628755,
"grad_norm": 0.7528270014107937,
"learning_rate": 1.3402597402597404e-05,
"loss": 0.4085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2731509804725647,
"step": 130,
"valid_targets_mean": 4044.8,
"valid_targets_min": 191
},
{
"epoch": 0.2456778889899909,
"grad_norm": 0.773354064973906,
"learning_rate": 1.3922077922077924e-05,
"loss": 0.4325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24367764592170715,
"step": 135,
"valid_targets_mean": 2869.1,
"valid_targets_min": 276
},
{
"epoch": 0.25477707006369427,
"grad_norm": 0.6366461975764265,
"learning_rate": 1.4441558441558442e-05,
"loss": 0.3849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2264237254858017,
"step": 140,
"valid_targets_mean": 4120.5,
"valid_targets_min": 297
},
{
"epoch": 0.26387625113739765,
"grad_norm": 0.73407765075352,
"learning_rate": 1.4961038961038962e-05,
"loss": 0.3789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24225257337093353,
"step": 145,
"valid_targets_mean": 3395.4,
"valid_targets_min": 2194
},
{
"epoch": 0.272975432211101,
"grad_norm": 0.528975542490164,
"learning_rate": 1.548051948051948e-05,
"loss": 0.3669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15162131190299988,
"step": 150,
"valid_targets_mean": 5184.5,
"valid_targets_min": 1548
},
{
"epoch": 0.2820746132848044,
"grad_norm": 0.6407623243411594,
"learning_rate": 1.6000000000000003e-05,
"loss": 0.3807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17568965256214142,
"step": 155,
"valid_targets_mean": 3090.6,
"valid_targets_min": 1391
},
{
"epoch": 0.2911737943585077,
"grad_norm": 0.5598898794356707,
"learning_rate": 1.651948051948052e-05,
"loss": 0.3768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18702304363250732,
"step": 160,
"valid_targets_mean": 4726.5,
"valid_targets_min": 1965
},
{
"epoch": 0.3002729754322111,
"grad_norm": 0.80253866312149,
"learning_rate": 1.703896103896104e-05,
"loss": 0.3835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20537051558494568,
"step": 165,
"valid_targets_mean": 3467.9,
"valid_targets_min": 1035
},
{
"epoch": 0.3093721565059145,
"grad_norm": 0.617856603797492,
"learning_rate": 1.7558441558441558e-05,
"loss": 0.3794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21695730090141296,
"step": 170,
"valid_targets_mean": 4163.9,
"valid_targets_min": 2707
},
{
"epoch": 0.3184713375796178,
"grad_norm": 0.6035798544318993,
"learning_rate": 1.807792207792208e-05,
"loss": 0.3703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15242548286914825,
"step": 175,
"valid_targets_mean": 3452.9,
"valid_targets_min": 863
},
{
"epoch": 0.3275705186533212,
"grad_norm": 0.7205194191830786,
"learning_rate": 1.8597402597402598e-05,
"loss": 0.3566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22975976765155792,
"step": 180,
"valid_targets_mean": 3661.2,
"valid_targets_min": 1386
},
{
"epoch": 0.33666969972702454,
"grad_norm": 0.664114211118228,
"learning_rate": 1.9116883116883117e-05,
"loss": 0.3906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1819133758544922,
"step": 185,
"valid_targets_mean": 3520.2,
"valid_targets_min": 302
},
{
"epoch": 0.34576888080072793,
"grad_norm": 0.630988318809503,
"learning_rate": 1.963636363636364e-05,
"loss": 0.361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1779000461101532,
"step": 190,
"valid_targets_mean": 3337.4,
"valid_targets_min": 2080
},
{
"epoch": 0.3548680618744313,
"grad_norm": 0.657730355236433,
"learning_rate": 2.0155844155844157e-05,
"loss": 0.3542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17508140206336975,
"step": 195,
"valid_targets_mean": 3508.1,
"valid_targets_min": 1803
},
{
"epoch": 0.36396724294813465,
"grad_norm": 0.5665992228116543,
"learning_rate": 2.0675324675324675e-05,
"loss": 0.3336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14676086604595184,
"step": 200,
"valid_targets_mean": 7127.0,
"valid_targets_min": 1887
},
{
"epoch": 0.37306642402183804,
"grad_norm": 0.6282569130705208,
"learning_rate": 2.1194805194805194e-05,
"loss": 0.3454,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19846948981285095,
"step": 205,
"valid_targets_mean": 3845.4,
"valid_targets_min": 545
},
{
"epoch": 0.3821656050955414,
"grad_norm": 0.6716368289981851,
"learning_rate": 2.1714285714285715e-05,
"loss": 0.3542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20502102375030518,
"step": 210,
"valid_targets_mean": 4379.2,
"valid_targets_min": 1637
},
{
"epoch": 0.39126478616924476,
"grad_norm": 0.586040871093467,
"learning_rate": 2.2233766233766234e-05,
"loss": 0.3325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20062410831451416,
"step": 215,
"valid_targets_mean": 4620.4,
"valid_targets_min": 306
},
{
"epoch": 0.40036396724294815,
"grad_norm": 0.7116115352531075,
"learning_rate": 2.2753246753246752e-05,
"loss": 0.355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20102885365486145,
"step": 220,
"valid_targets_mean": 4042.2,
"valid_targets_min": 692
},
{
"epoch": 0.4094631483166515,
"grad_norm": 0.7593643012524895,
"learning_rate": 2.3272727272727274e-05,
"loss": 0.3669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16333557665348053,
"step": 225,
"valid_targets_mean": 2727.2,
"valid_targets_min": 1471
},
{
"epoch": 0.41856232939035487,
"grad_norm": 0.6436238397243124,
"learning_rate": 2.3792207792207793e-05,
"loss": 0.377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19011452794075012,
"step": 230,
"valid_targets_mean": 3853.6,
"valid_targets_min": 327
},
{
"epoch": 0.42766151046405826,
"grad_norm": 0.49381503876442573,
"learning_rate": 2.4311688311688314e-05,
"loss": 0.3322,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1791185438632965,
"step": 235,
"valid_targets_mean": 6669.8,
"valid_targets_min": 4161
},
{
"epoch": 0.4367606915377616,
"grad_norm": 0.7562039996015982,
"learning_rate": 2.4831168831168833e-05,
"loss": 0.3279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1556703746318817,
"step": 240,
"valid_targets_mean": 2839.9,
"valid_targets_min": 690
},
{
"epoch": 0.445859872611465,
"grad_norm": 0.6948851833431993,
"learning_rate": 2.535064935064935e-05,
"loss": 0.3472,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16435737907886505,
"step": 245,
"valid_targets_mean": 3262.5,
"valid_targets_min": 1379
},
{
"epoch": 0.4549590536851683,
"grad_norm": 0.58823239503998,
"learning_rate": 2.5870129870129873e-05,
"loss": 0.3371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18383200466632843,
"step": 250,
"valid_targets_mean": 4217.0,
"valid_targets_min": 1857
},
{
"epoch": 0.4640582347588717,
"grad_norm": 0.7146593511175929,
"learning_rate": 2.638961038961039e-05,
"loss": 0.3456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20923785865306854,
"step": 255,
"valid_targets_mean": 3851.0,
"valid_targets_min": 2105
},
{
"epoch": 0.4731574158325751,
"grad_norm": 0.639172708679333,
"learning_rate": 2.690909090909091e-05,
"loss": 0.3481,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16769519448280334,
"step": 260,
"valid_targets_mean": 3705.9,
"valid_targets_min": 1050
},
{
"epoch": 0.4822565969062784,
"grad_norm": 0.5819486451804095,
"learning_rate": 2.742857142857143e-05,
"loss": 0.3405,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1527741402387619,
"step": 265,
"valid_targets_mean": 3778.8,
"valid_targets_min": 1858
},
{
"epoch": 0.4913557779799818,
"grad_norm": 0.7052096499331427,
"learning_rate": 2.794805194805195e-05,
"loss": 0.3661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16779346764087677,
"step": 270,
"valid_targets_mean": 2560.2,
"valid_targets_min": 979
},
{
"epoch": 0.5004549590536852,
"grad_norm": 0.6155479988948123,
"learning_rate": 2.8467532467532472e-05,
"loss": 0.3386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17713932693004608,
"step": 275,
"valid_targets_mean": 4008.5,
"valid_targets_min": 1179
},
{
"epoch": 0.5095541401273885,
"grad_norm": 0.7222593319271032,
"learning_rate": 2.898701298701299e-05,
"loss": 0.3627,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18285799026489258,
"step": 280,
"valid_targets_mean": 2894.9,
"valid_targets_min": 1384
},
{
"epoch": 0.5186533212010919,
"grad_norm": 0.5061744009962925,
"learning_rate": 2.950649350649351e-05,
"loss": 0.3327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11711747944355011,
"step": 285,
"valid_targets_mean": 4999.4,
"valid_targets_min": 506
},
{
"epoch": 0.5277525022747953,
"grad_norm": 0.628458589369126,
"learning_rate": 3.002597402597403e-05,
"loss": 0.3524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20639720559120178,
"step": 290,
"valid_targets_mean": 3854.2,
"valid_targets_min": 1366
},
{
"epoch": 0.5368516833484986,
"grad_norm": 0.7356451176164959,
"learning_rate": 3.054545454545455e-05,
"loss": 0.3704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17715367674827576,
"step": 295,
"valid_targets_mean": 2221.9,
"valid_targets_min": 159
},
{
"epoch": 0.545950864422202,
"grad_norm": 0.6834528754923809,
"learning_rate": 3.106493506493507e-05,
"loss": 0.3664,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.202093243598938,
"step": 300,
"valid_targets_mean": 3654.0,
"valid_targets_min": 2125
},
{
"epoch": 0.5550500454959054,
"grad_norm": 0.644798154871265,
"learning_rate": 3.158441558441559e-05,
"loss": 0.3375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17941009998321533,
"step": 305,
"valid_targets_mean": 4599.6,
"valid_targets_min": 1266
},
{
"epoch": 0.5641492265696088,
"grad_norm": 0.6306840599749488,
"learning_rate": 3.210389610389611e-05,
"loss": 0.3457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1706070601940155,
"step": 310,
"valid_targets_mean": 3753.9,
"valid_targets_min": 867
},
{
"epoch": 0.5732484076433121,
"grad_norm": 0.6591743834234475,
"learning_rate": 3.2623376623376626e-05,
"loss": 0.3473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17178833484649658,
"step": 315,
"valid_targets_mean": 3608.0,
"valid_targets_min": 402
},
{
"epoch": 0.5823475887170154,
"grad_norm": 0.6834492202812368,
"learning_rate": 3.314285714285715e-05,
"loss": 0.3601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16191285848617554,
"step": 320,
"valid_targets_mean": 2754.0,
"valid_targets_min": 287
},
{
"epoch": 0.5914467697907189,
"grad_norm": 0.6218165451057371,
"learning_rate": 3.366233766233766e-05,
"loss": 0.3288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18606127798557281,
"step": 325,
"valid_targets_mean": 4163.6,
"valid_targets_min": 1883
},
{
"epoch": 0.6005459508644222,
"grad_norm": 0.6971555869668246,
"learning_rate": 3.4181818181818185e-05,
"loss": 0.3588,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1653805673122406,
"step": 330,
"valid_targets_mean": 3056.8,
"valid_targets_min": 286
},
{
"epoch": 0.6096451319381255,
"grad_norm": 0.6694568351469594,
"learning_rate": 3.47012987012987e-05,
"loss": 0.3542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18698689341545105,
"step": 335,
"valid_targets_mean": 3503.6,
"valid_targets_min": 352
},
{
"epoch": 0.618744313011829,
"grad_norm": 0.7602070220543796,
"learning_rate": 3.522077922077922e-05,
"loss": 0.3574,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18287214636802673,
"step": 340,
"valid_targets_mean": 3039.4,
"valid_targets_min": 902
},
{
"epoch": 0.6278434940855323,
"grad_norm": 1.4136824233595235,
"learning_rate": 3.5740259740259743e-05,
"loss": 0.3515,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17238737642765045,
"step": 345,
"valid_targets_mean": 2872.9,
"valid_targets_min": 872
},
{
"epoch": 0.6369426751592356,
"grad_norm": 0.5035685691094948,
"learning_rate": 3.625974025974026e-05,
"loss": 0.3246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1299327313899994,
"step": 350,
"valid_targets_mean": 3888.1,
"valid_targets_min": 811
},
{
"epoch": 0.6460418562329391,
"grad_norm": 0.7509236623969442,
"learning_rate": 3.677922077922078e-05,
"loss": 0.3434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16455626487731934,
"step": 355,
"valid_targets_mean": 2435.2,
"valid_targets_min": 382
},
{
"epoch": 0.6551410373066424,
"grad_norm": 0.7267357043550218,
"learning_rate": 3.72987012987013e-05,
"loss": 0.3339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15680286288261414,
"step": 360,
"valid_targets_mean": 2537.6,
"valid_targets_min": 723
},
{
"epoch": 0.6642402183803457,
"grad_norm": 0.5882397350664301,
"learning_rate": 3.7818181818181824e-05,
"loss": 0.3445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17925706505775452,
"step": 365,
"valid_targets_mean": 3746.2,
"valid_targets_min": 174
},
{
"epoch": 0.6733393994540491,
"grad_norm": 0.6701257363851001,
"learning_rate": 3.833766233766234e-05,
"loss": 0.3429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15250617265701294,
"step": 370,
"valid_targets_mean": 3226.2,
"valid_targets_min": 534
},
{
"epoch": 0.6824385805277525,
"grad_norm": 0.7709420665796557,
"learning_rate": 3.885714285714286e-05,
"loss": 0.3363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19574809074401855,
"step": 375,
"valid_targets_mean": 2969.6,
"valid_targets_min": 579
},
{
"epoch": 0.6915377616014559,
"grad_norm": 0.7321311016328584,
"learning_rate": 3.937662337662338e-05,
"loss": 0.3474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18352022767066956,
"step": 380,
"valid_targets_mean": 3078.8,
"valid_targets_min": 246
},
{
"epoch": 0.7006369426751592,
"grad_norm": 0.5227688266969235,
"learning_rate": 3.98961038961039e-05,
"loss": 0.3135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1240387111902237,
"step": 385,
"valid_targets_mean": 5729.1,
"valid_targets_min": 148
},
{
"epoch": 0.7097361237488626,
"grad_norm": 0.6634696872428075,
"learning_rate": 3.999986847364818e-05,
"loss": 0.3455,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14379724860191345,
"step": 390,
"valid_targets_mean": 3921.5,
"valid_targets_min": 2435
},
{
"epoch": 0.718835304822566,
"grad_norm": 0.6786231321488037,
"learning_rate": 3.999933415080877e-05,
"loss": 0.3428,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15791067481040955,
"step": 395,
"valid_targets_mean": 2961.2,
"valid_targets_min": 1549
},
{
"epoch": 0.7279344858962693,
"grad_norm": 0.7042840913170564,
"learning_rate": 3.999838882205719e-05,
"loss": 0.3347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17206677794456482,
"step": 400,
"valid_targets_mean": 4209.1,
"valid_targets_min": 295
},
{
"epoch": 0.7370336669699727,
"grad_norm": 0.776618106056019,
"learning_rate": 3.999703250682087e-05,
"loss": 0.3471,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1754663586616516,
"step": 405,
"valid_targets_mean": 2778.5,
"valid_targets_min": 513
},
{
"epoch": 0.7461328480436761,
"grad_norm": 0.6821666886795281,
"learning_rate": 3.9995265232973414e-05,
"loss": 0.321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13924285769462585,
"step": 410,
"valid_targets_mean": 3779.0,
"valid_targets_min": 270
},
{
"epoch": 0.7552320291173794,
"grad_norm": 0.6028714659678347,
"learning_rate": 3.9993087036834034e-05,
"loss": 0.3242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1615755558013916,
"step": 415,
"valid_targets_mean": 3375.9,
"valid_targets_min": 2078
},
{
"epoch": 0.7643312101910829,
"grad_norm": 0.629543345625808,
"learning_rate": 3.9990497963166797e-05,
"loss": 0.3329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1638343334197998,
"step": 420,
"valid_targets_mean": 3765.9,
"valid_targets_min": 1599
},
{
"epoch": 0.7734303912647862,
"grad_norm": 0.6579488775198418,
"learning_rate": 3.99874980651797e-05,
"loss": 0.3283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14738169312477112,
"step": 425,
"valid_targets_mean": 3576.5,
"valid_targets_min": 2775
},
{
"epoch": 0.7825295723384895,
"grad_norm": 0.6561952681802788,
"learning_rate": 3.998408740452359e-05,
"loss": 0.3288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16806158423423767,
"step": 430,
"valid_targets_mean": 3370.6,
"valid_targets_min": 388
},
{
"epoch": 0.7916287534121929,
"grad_norm": 0.7592724078668787,
"learning_rate": 3.998026605129088e-05,
"loss": 0.342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21901732683181763,
"step": 435,
"valid_targets_mean": 3533.4,
"valid_targets_min": 433
},
{
"epoch": 0.8007279344858963,
"grad_norm": 0.7391353010655607,
"learning_rate": 3.997603408401413e-05,
"loss": 0.3378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1867692768573761,
"step": 440,
"valid_targets_mean": 4258.1,
"valid_targets_min": 2031
},
{
"epoch": 0.8098271155595996,
"grad_norm": 0.7795273567250613,
"learning_rate": 3.997139158966441e-05,
"loss": 0.3335,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13619282841682434,
"step": 445,
"valid_targets_mean": 2759.1,
"valid_targets_min": 1005
},
{
"epoch": 0.818926296633303,
"grad_norm": 0.6562343920190629,
"learning_rate": 3.996633866364953e-05,
"loss": 0.3274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18688486516475677,
"step": 450,
"valid_targets_mean": 4256.5,
"valid_targets_min": 2352
},
{
"epoch": 0.8280254777070064,
"grad_norm": 0.6567770384652188,
"learning_rate": 3.996087540981206e-05,
"loss": 0.3392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1674097329378128,
"step": 455,
"valid_targets_mean": 3862.6,
"valid_targets_min": 1844
},
{
"epoch": 0.8371246587807097,
"grad_norm": 0.43691333266562116,
"learning_rate": 3.9955001940427236e-05,
"loss": 0.3385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13044530153274536,
"step": 460,
"valid_targets_mean": 7291.9,
"valid_targets_min": 1771
},
{
"epoch": 0.8462238398544131,
"grad_norm": 0.5118948109279933,
"learning_rate": 3.99487183762006e-05,
"loss": 0.308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12879431247711182,
"step": 465,
"valid_targets_mean": 4598.5,
"valid_targets_min": 776
},
{
"epoch": 0.8553230209281165,
"grad_norm": 0.8074499299412539,
"learning_rate": 3.994202484626555e-05,
"loss": 0.3267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14642921090126038,
"step": 470,
"valid_targets_mean": 2749.0,
"valid_targets_min": 1419
},
{
"epoch": 0.8644222020018199,
"grad_norm": 0.46974985023916216,
"learning_rate": 3.993492148818069e-05,
"loss": 0.3302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10927803814411163,
"step": 475,
"valid_targets_mean": 3984.2,
"valid_targets_min": 2741
},
{
"epoch": 0.8735213830755232,
"grad_norm": 0.5801889932724914,
"learning_rate": 3.992740844792699e-05,
"loss": 0.3269,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16290982067584991,
"step": 480,
"valid_targets_mean": 3765.0,
"valid_targets_min": 2484
},
{
"epoch": 0.8826205641492265,
"grad_norm": 0.7885165014083056,
"learning_rate": 3.991948587990479e-05,
"loss": 0.338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1817663013935089,
"step": 485,
"valid_targets_mean": 3399.4,
"valid_targets_min": 332
},
{
"epoch": 0.89171974522293,
"grad_norm": 0.6491169797538565,
"learning_rate": 3.991115394693061e-05,
"loss": 0.3351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18687278032302856,
"step": 490,
"valid_targets_mean": 4333.0,
"valid_targets_min": 3067
},
{
"epoch": 0.9008189262966333,
"grad_norm": 0.6388245302934621,
"learning_rate": 3.990241282023385e-05,
"loss": 0.3066,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.171747088432312,
"step": 495,
"valid_targets_mean": 3816.8,
"valid_targets_min": 1782
},
{
"epoch": 0.9099181073703366,
"grad_norm": 0.9397629711325225,
"learning_rate": 3.989326267945323e-05,
"loss": 0.3338,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1524638682603836,
"step": 500,
"valid_targets_mean": 2860.0,
"valid_targets_min": 1797
},
{
"epoch": 0.9190172884440401,
"grad_norm": 0.5993283056073379,
"learning_rate": 3.98837037126331e-05,
"loss": 0.3366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1285330355167389,
"step": 505,
"valid_targets_mean": 3083.9,
"valid_targets_min": 344
},
{
"epoch": 0.9281164695177434,
"grad_norm": 0.6429169438989089,
"learning_rate": 3.98737361162196e-05,
"loss": 0.349,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15727660059928894,
"step": 510,
"valid_targets_mean": 3575.6,
"valid_targets_min": 590
},
{
"epoch": 0.9372156505914467,
"grad_norm": 0.6432681607328898,
"learning_rate": 3.986336009505659e-05,
"loss": 0.3,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.134327232837677,
"step": 515,
"valid_targets_mean": 2672.4,
"valid_targets_min": 378
},
{
"epoch": 0.9463148316651502,
"grad_norm": 0.5634556848468228,
"learning_rate": 3.985257586238149e-05,
"loss": 0.3458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1891605108976364,
"step": 520,
"valid_targets_mean": 4462.9,
"valid_targets_min": 2757
},
{
"epoch": 0.9554140127388535,
"grad_norm": 0.7126742924631625,
"learning_rate": 3.984138363982084e-05,
"loss": 0.3403,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16645973920822144,
"step": 525,
"valid_targets_mean": 2579.2,
"valid_targets_min": 303
},
{
"epoch": 0.9645131938125568,
"grad_norm": 0.5297879582892905,
"learning_rate": 3.982978365738578e-05,
"loss": 0.3148,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10891679674386978,
"step": 530,
"valid_targets_mean": 4010.6,
"valid_targets_min": 2391
},
{
"epoch": 0.9736123748862603,
"grad_norm": 0.6474325926954897,
"learning_rate": 3.981777615346731e-05,
"loss": 0.3209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1598714292049408,
"step": 535,
"valid_targets_mean": 3160.5,
"valid_targets_min": 1483
},
{
"epoch": 0.9827115559599636,
"grad_norm": 0.6380981419738545,
"learning_rate": 3.980536137483141e-05,
"loss": 0.3326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15230050683021545,
"step": 540,
"valid_targets_mean": 3283.4,
"valid_targets_min": 418
},
{
"epoch": 0.991810737033667,
"grad_norm": 0.6228267400147609,
"learning_rate": 3.9792539576613934e-05,
"loss": 0.3276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1523316502571106,
"step": 545,
"valid_targets_mean": 2762.2,
"valid_targets_min": 988
},
{
"epoch": 1.0,
"grad_norm": 0.7703107249289565,
"learning_rate": 3.9779311022315405e-05,
"loss": 0.334,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3257380425930023,
"step": 550,
"valid_targets_mean": 4005.5,
"valid_targets_min": 552
},
{
"epoch": 1.0090991810737033,
"grad_norm": 0.6564463452360433,
"learning_rate": 3.976567598379558e-05,
"loss": 0.3199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16916556656360626,
"step": 555,
"valid_targets_mean": 3139.6,
"valid_targets_min": 557
},
{
"epoch": 1.0181983621474067,
"grad_norm": 0.6316598177475052,
"learning_rate": 3.975163474126785e-05,
"loss": 0.314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1529175043106079,
"step": 560,
"valid_targets_mean": 3807.1,
"valid_targets_min": 748
},
{
"epoch": 1.02729754322111,
"grad_norm": 0.5512261147650673,
"learning_rate": 3.9737187583293505e-05,
"loss": 0.302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11598987877368927,
"step": 565,
"valid_targets_mean": 3748.8,
"valid_targets_min": 1146
},
{
"epoch": 1.0363967242948136,
"grad_norm": 0.5664752755228538,
"learning_rate": 3.9722334806775806e-05,
"loss": 0.3217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12348569184541702,
"step": 570,
"valid_targets_mean": 3140.4,
"valid_targets_min": 1894
},
{
"epoch": 1.0454959053685169,
"grad_norm": 0.6383017456860482,
"learning_rate": 3.9707076716953866e-05,
"loss": 0.3028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15872514247894287,
"step": 575,
"valid_targets_mean": 4805.6,
"valid_targets_min": 1894
},
{
"epoch": 1.0545950864422202,
"grad_norm": 0.5375002734811841,
"learning_rate": 3.969141362739636e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1593000888824463,
"step": 580,
"valid_targets_mean": 4595.2,
"valid_targets_min": 2395
},
{
"epoch": 1.0636942675159236,
"grad_norm": 0.5566540119334547,
"learning_rate": 3.967534585999515e-05,
"loss": 0.3154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12608671188354492,
"step": 585,
"valid_targets_mean": 3549.9,
"valid_targets_min": 402
},
{
"epoch": 1.0727934485896269,
"grad_norm": 0.5858299909987527,
"learning_rate": 3.965887374495859e-05,
"loss": 0.2855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15359722077846527,
"step": 590,
"valid_targets_mean": 4215.9,
"valid_targets_min": 501
},
{
"epoch": 1.0818926296633302,
"grad_norm": 0.5380275782190423,
"learning_rate": 3.964199762080478e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1915718913078308,
"step": 595,
"valid_targets_mean": 5193.9,
"valid_targets_min": 1867
},
{
"epoch": 1.0909918107370338,
"grad_norm": 1.3584511182550558,
"learning_rate": 3.9624717834354606e-05,
"loss": 0.3112,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17153777182102203,
"step": 600,
"valid_targets_mean": 3738.6,
"valid_targets_min": 1454
},
{
"epoch": 1.100090991810737,
"grad_norm": 0.559010500557733,
"learning_rate": 3.9607034740724615e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11709210276603699,
"step": 605,
"valid_targets_mean": 3672.4,
"valid_targets_min": 388
},
{
"epoch": 1.1091901728844404,
"grad_norm": 0.6702458849968536,
"learning_rate": 3.958894870331971e-05,
"loss": 0.3029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15884870290756226,
"step": 610,
"valid_targets_mean": 3277.5,
"valid_targets_min": 1322
},
{
"epoch": 1.1182893539581438,
"grad_norm": 0.6566718317921177,
"learning_rate": 3.9570460093825664e-05,
"loss": 0.3032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13488319516181946,
"step": 615,
"valid_targets_mean": 3118.4,
"valid_targets_min": 991
},
{
"epoch": 1.127388535031847,
"grad_norm": 0.5392787236116686,
"learning_rate": 3.9551569292201536e-05,
"loss": 0.3105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12678071856498718,
"step": 620,
"valid_targets_mean": 5099.2,
"valid_targets_min": 2259
},
{
"epoch": 1.1364877161055504,
"grad_norm": 0.5439955061560059,
"learning_rate": 3.9532276686671804e-05,
"loss": 0.2998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17293554544448853,
"step": 625,
"valid_targets_mean": 5169.0,
"valid_targets_min": 858
},
{
"epoch": 1.1455868971792538,
"grad_norm": 0.5854445058276169,
"learning_rate": 3.951258267371841e-05,
"loss": 0.3012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.132243812084198,
"step": 630,
"valid_targets_mean": 2877.4,
"valid_targets_min": 1308
},
{
"epoch": 1.1546860782529573,
"grad_norm": 0.5041148775156069,
"learning_rate": 3.9492487658072615e-05,
"loss": 0.3091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09935662150382996,
"step": 635,
"valid_targets_mean": 3389.1,
"valid_targets_min": 690
},
{
"epoch": 1.1637852593266607,
"grad_norm": 0.44735914114363684,
"learning_rate": 3.947199205270668e-05,
"loss": 0.2936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10296198725700378,
"step": 640,
"valid_targets_mean": 5112.4,
"valid_targets_min": 1001
},
{
"epoch": 1.172884440400364,
"grad_norm": 0.5201900009933367,
"learning_rate": 3.9451096278825386e-05,
"loss": 0.2938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16323642432689667,
"step": 645,
"valid_targets_mean": 5439.1,
"valid_targets_min": 2591
},
{
"epoch": 1.1819836214740673,
"grad_norm": 0.5540042968486397,
"learning_rate": 3.942980076585735e-05,
"loss": 0.2944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1331024318933487,
"step": 650,
"valid_targets_mean": 4330.9,
"valid_targets_min": 1426
},
{
"epoch": 1.1910828025477707,
"grad_norm": 0.667990204314806,
"learning_rate": 3.940810595144624e-05,
"loss": 0.3258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17009712755680084,
"step": 655,
"valid_targets_mean": 4543.8,
"valid_targets_min": 2084
},
{
"epoch": 1.200181983621474,
"grad_norm": 0.5266945348745354,
"learning_rate": 3.938601228144173e-05,
"loss": 0.3017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15906137228012085,
"step": 660,
"valid_targets_mean": 4344.6,
"valid_targets_min": 2687
},
{
"epoch": 1.2092811646951773,
"grad_norm": 0.7452722762074235,
"learning_rate": 3.9363520209890405e-05,
"loss": 0.3122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17923469841480255,
"step": 665,
"valid_targets_mean": 3565.0,
"valid_targets_min": 1291
},
{
"epoch": 1.2183803457688809,
"grad_norm": 0.5906857173983012,
"learning_rate": 3.9340630199026365e-05,
"loss": 0.3121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14141051471233368,
"step": 670,
"valid_targets_mean": 3291.1,
"valid_targets_min": 1233
},
{
"epoch": 1.2274795268425842,
"grad_norm": 0.6496938598519507,
"learning_rate": 3.931734271926176e-05,
"loss": 0.2952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15126341581344604,
"step": 675,
"valid_targets_mean": 3045.4,
"valid_targets_min": 236
},
{
"epoch": 1.2365787079162875,
"grad_norm": 0.5486756887499763,
"learning_rate": 3.929365824917712e-05,
"loss": 0.3211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12430839240550995,
"step": 680,
"valid_targets_mean": 3235.9,
"valid_targets_min": 293
},
{
"epoch": 1.2456778889899909,
"grad_norm": 0.6798422752091549,
"learning_rate": 3.9269577275511504e-05,
"loss": 0.2986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16678652167320251,
"step": 685,
"valid_targets_mean": 3219.2,
"valid_targets_min": 1768
},
{
"epoch": 1.2547770700636942,
"grad_norm": 0.5514632289376944,
"learning_rate": 3.924510029315253e-05,
"loss": 0.2955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14286918938159943,
"step": 690,
"valid_targets_mean": 4353.2,
"valid_targets_min": 640
},
{
"epoch": 1.2638762511373978,
"grad_norm": 0.5624165020198547,
"learning_rate": 3.922022780512614e-05,
"loss": 0.3092,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14001207053661346,
"step": 695,
"valid_targets_mean": 3567.9,
"valid_targets_min": 175
},
{
"epoch": 1.2729754322111009,
"grad_norm": 0.7326351561063902,
"learning_rate": 3.919496032258637e-05,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17794157564640045,
"step": 700,
"valid_targets_mean": 4092.0,
"valid_targets_min": 3099
},
{
"epoch": 1.2820746132848044,
"grad_norm": 0.6387174425772494,
"learning_rate": 3.9169298364804716e-05,
"loss": 0.2998,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18912354111671448,
"step": 705,
"valid_targets_mean": 3796.1,
"valid_targets_min": 1231
},
{
"epoch": 1.2911737943585078,
"grad_norm": 0.6358201723562807,
"learning_rate": 3.914324245915956e-05,
"loss": 0.3088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17825400829315186,
"step": 710,
"valid_targets_mean": 3973.0,
"valid_targets_min": 1168
},
{
"epoch": 1.300272975432211,
"grad_norm": 0.7306352957917734,
"learning_rate": 3.91167931411253e-05,
"loss": 0.3107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13277125358581543,
"step": 715,
"valid_targets_mean": 3033.8,
"valid_targets_min": 544
},
{
"epoch": 1.3093721565059144,
"grad_norm": 0.5766296412620744,
"learning_rate": 3.908995095426134e-05,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13581085205078125,
"step": 720,
"valid_targets_mean": 3316.8,
"valid_targets_min": 1310
},
{
"epoch": 1.3184713375796178,
"grad_norm": 0.8249621873775245,
"learning_rate": 3.90627164502009e-05,
"loss": 0.2943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1622616946697235,
"step": 725,
"valid_targets_mean": 4480.9,
"valid_targets_min": 2230
},
{
"epoch": 1.3275705186533213,
"grad_norm": 0.6193536191489676,
"learning_rate": 3.903509018863974e-05,
"loss": 0.3189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17137649655342102,
"step": 730,
"valid_targets_mean": 3858.5,
"valid_targets_min": 1147
},
{
"epoch": 1.3366696997270244,
"grad_norm": 0.6532042961114637,
"learning_rate": 3.90070727373246e-05,
"loss": 0.3137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1350535899400711,
"step": 735,
"valid_targets_mean": 2866.0,
"valid_targets_min": 493
},
{
"epoch": 1.345768880800728,
"grad_norm": 0.4861900826239269,
"learning_rate": 3.897866467204155e-05,
"loss": 0.3039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11634202301502228,
"step": 740,
"valid_targets_mean": 2838.1,
"valid_targets_min": 304
},
{
"epoch": 1.3548680618744313,
"grad_norm": 0.713209570991044,
"learning_rate": 3.894986657660418e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19738173484802246,
"step": 745,
"valid_targets_mean": 3062.8,
"valid_targets_min": 166
},
{
"epoch": 1.3639672429481347,
"grad_norm": 0.6296705554955353,
"learning_rate": 3.892067904284154e-05,
"loss": 0.2966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12983810901641846,
"step": 750,
"valid_targets_mean": 2600.9,
"valid_targets_min": 241
},
{
"epoch": 1.373066424021838,
"grad_norm": 0.5361889757739225,
"learning_rate": 3.889110267058608e-05,
"loss": 0.3042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15422046184539795,
"step": 755,
"valid_targets_mean": 4254.5,
"valid_targets_min": 2720
},
{
"epoch": 1.3821656050955413,
"grad_norm": 0.5803866643895204,
"learning_rate": 3.886113806766121e-05,
"loss": 0.3039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14216673374176025,
"step": 760,
"valid_targets_mean": 3402.6,
"valid_targets_min": 601
},
{
"epoch": 1.3912647861692449,
"grad_norm": 0.5729756325028772,
"learning_rate": 3.883078584986888e-05,
"loss": 0.3024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13551153242588043,
"step": 765,
"valid_targets_mean": 3336.5,
"valid_targets_min": 2241
},
{
"epoch": 1.4003639672429482,
"grad_norm": 0.6263881007967305,
"learning_rate": 3.8800046640976916e-05,
"loss": 0.3073,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15259312093257904,
"step": 770,
"valid_targets_mean": 3664.9,
"valid_targets_min": 1487
},
{
"epoch": 1.4094631483166515,
"grad_norm": 0.6180611235058632,
"learning_rate": 3.876892107270616e-05,
"loss": 0.3087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12695425748825073,
"step": 775,
"valid_targets_mean": 3159.2,
"valid_targets_min": 379
},
{
"epoch": 1.4185623293903549,
"grad_norm": 0.559623144458965,
"learning_rate": 3.873740978471755e-05,
"loss": 0.3101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18561246991157532,
"step": 780,
"valid_targets_mean": 4742.5,
"valid_targets_min": 965
},
{
"epoch": 1.4276615104640582,
"grad_norm": 0.4243966512830656,
"learning_rate": 3.8705513424598934e-05,
"loss": 0.3037,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10521087050437927,
"step": 785,
"valid_targets_mean": 3032.1,
"valid_targets_min": 1392
},
{
"epoch": 1.4367606915377615,
"grad_norm": 0.624333407768036,
"learning_rate": 3.8673232647851756e-05,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1458563506603241,
"step": 790,
"valid_targets_mean": 3420.6,
"valid_targets_min": 346
},
{
"epoch": 1.4458598726114649,
"grad_norm": 0.5646564966792745,
"learning_rate": 3.8640568117877594e-05,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1571834534406662,
"step": 795,
"valid_targets_mean": 4051.5,
"valid_targets_min": 2398
},
{
"epoch": 1.4549590536851684,
"grad_norm": 0.5670849272463157,
"learning_rate": 3.8607520505964574e-05,
"loss": 0.3015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1635785698890686,
"step": 800,
"valid_targets_mean": 4177.8,
"valid_targets_min": 2180
},
{
"epoch": 1.4640582347588718,
"grad_norm": 0.6420218837308556,
"learning_rate": 3.857409049127348e-05,
"loss": 0.3207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15793652832508087,
"step": 805,
"valid_targets_mean": 3131.4,
"valid_targets_min": 1480
},
{
"epoch": 1.473157415832575,
"grad_norm": 0.6343008579526399,
"learning_rate": 3.8540278760823866e-05,
"loss": 0.3036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16844598948955536,
"step": 810,
"valid_targets_mean": 3513.1,
"valid_targets_min": 335
},
{
"epoch": 1.4822565969062784,
"grad_norm": 0.548504727537003,
"learning_rate": 3.8506086009479934e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13627293705940247,
"step": 815,
"valid_targets_mean": 3978.2,
"valid_targets_min": 2587
},
{
"epoch": 1.4913557779799818,
"grad_norm": 0.6522144344848967,
"learning_rate": 3.8471512939936224e-05,
"loss": 0.2944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1826554834842682,
"step": 820,
"valid_targets_mean": 3473.9,
"valid_targets_min": 891
},
{
"epoch": 1.5004549590536853,
"grad_norm": 0.47235032448464315,
"learning_rate": 3.843656026270319e-05,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10905256867408752,
"step": 825,
"valid_targets_mean": 4995.2,
"valid_targets_min": 255
},
{
"epoch": 1.5095541401273884,
"grad_norm": 0.5919677581523133,
"learning_rate": 3.840122869609258e-05,
"loss": 0.2962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1688118577003479,
"step": 830,
"valid_targets_mean": 3939.0,
"valid_targets_min": 2195
},
{
"epoch": 1.518653321201092,
"grad_norm": 0.6120851821796398,
"learning_rate": 3.8365518966202724e-05,
"loss": 0.2793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1763344705104828,
"step": 835,
"valid_targets_mean": 3543.9,
"valid_targets_min": 1824
},
{
"epoch": 1.5277525022747953,
"grad_norm": 0.5494270450729506,
"learning_rate": 3.832943180690356e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10270395129919052,
"step": 840,
"valid_targets_mean": 3121.2,
"valid_targets_min": 469
},
{
"epoch": 1.5368516833484986,
"grad_norm": 0.668549792242741,
"learning_rate": 3.829296795982156e-05,
"loss": 0.303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1624075323343277,
"step": 845,
"valid_targets_mean": 3347.9,
"valid_targets_min": 1757
},
{
"epoch": 1.545950864422202,
"grad_norm": 0.6025824994023757,
"learning_rate": 3.8256128174324515e-05,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13117438554763794,
"step": 850,
"valid_targets_mean": 3289.5,
"valid_targets_min": 2407
},
{
"epoch": 1.5550500454959053,
"grad_norm": 1.5587470663669738,
"learning_rate": 3.82189132075061e-05,
"loss": 0.2833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17107094824314117,
"step": 855,
"valid_targets_mean": 3623.4,
"valid_targets_min": 457
},
{
"epoch": 1.5641492265696089,
"grad_norm": 0.665859516324618,
"learning_rate": 3.818132382417037e-05,
"loss": 0.2962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16790863871574402,
"step": 860,
"valid_targets_mean": 3379.4,
"valid_targets_min": 352
},
{
"epoch": 1.573248407643312,
"grad_norm": 0.6963496071560168,
"learning_rate": 3.8143360796815964e-05,
"loss": 0.3039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16974878311157227,
"step": 865,
"valid_targets_mean": 3827.0,
"valid_targets_min": 1539
},
{
"epoch": 1.5823475887170155,
"grad_norm": 0.41729879716752555,
"learning_rate": 3.81050249056203e-05,
"loss": 0.2879,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11725392192602158,
"step": 870,
"valid_targets_mean": 7242.0,
"valid_targets_min": 1288
},
{
"epoch": 1.5914467697907189,
"grad_norm": 0.5866727554490438,
"learning_rate": 3.8066316938423495e-05,
"loss": 0.2997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20750758051872253,
"step": 875,
"valid_targets_mean": 5255.9,
"valid_targets_min": 2124
},
{
"epoch": 1.6005459508644222,
"grad_norm": 0.5863686910007585,
"learning_rate": 3.8027237690712206e-05,
"loss": 0.3098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10066068172454834,
"step": 880,
"valid_targets_mean": 2762.9,
"valid_targets_min": 1092
},
{
"epoch": 1.6096451319381255,
"grad_norm": 0.6167527707800907,
"learning_rate": 3.798778796560326e-05,
"loss": 0.2901,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16851675510406494,
"step": 885,
"valid_targets_mean": 3696.9,
"valid_targets_min": 1240
},
{
"epoch": 1.6187443130118289,
"grad_norm": 0.6924917088244582,
"learning_rate": 3.794796857382717e-05,
"loss": 0.2978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13787582516670227,
"step": 890,
"valid_targets_mean": 2862.2,
"valid_targets_min": 1659
},
{
"epoch": 1.6278434940855324,
"grad_norm": 0.5789838916428676,
"learning_rate": 3.790778033371145e-05,
"loss": 0.3023,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11418955028057098,
"step": 895,
"valid_targets_mean": 3481.0,
"valid_targets_min": 348
},
{
"epoch": 1.6369426751592355,
"grad_norm": 0.7106975900014304,
"learning_rate": 3.786722407116379e-05,
"loss": 0.3085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12953606247901917,
"step": 900,
"valid_targets_mean": 2206.0,
"valid_targets_min": 312
},
{
"epoch": 1.646041856232939,
"grad_norm": 0.6336291450885424,
"learning_rate": 3.782630061965515e-05,
"loss": 0.3064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15805183351039886,
"step": 905,
"valid_targets_mean": 3122.5,
"valid_targets_min": 1578
},
{
"epoch": 1.6551410373066424,
"grad_norm": 0.483971331402685,
"learning_rate": 3.778501082020255e-05,
"loss": 0.261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09273171424865723,
"step": 910,
"valid_targets_mean": 3567.9,
"valid_targets_min": 1520
},
{
"epoch": 1.6642402183803457,
"grad_norm": 0.5149368407010124,
"learning_rate": 3.7743355521351814e-05,
"loss": 0.2758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11179894208908081,
"step": 915,
"valid_targets_mean": 5487.8,
"valid_targets_min": 2348
},
{
"epoch": 1.673339399454049,
"grad_norm": 0.5917668119100274,
"learning_rate": 3.7701335579160147e-05,
"loss": 0.2961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1767260581254959,
"step": 920,
"valid_targets_mean": 4154.2,
"valid_targets_min": 2792
},
{
"epoch": 1.6824385805277524,
"grad_norm": 0.7652973549943375,
"learning_rate": 3.7658951857178544e-05,
"loss": 0.3086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17313481867313385,
"step": 925,
"valid_targets_mean": 3225.0,
"valid_targets_min": 1253
},
{
"epoch": 1.691537761601456,
"grad_norm": 0.5994539780074473,
"learning_rate": 3.7616205226434005e-05,
"loss": 0.2772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1413244605064392,
"step": 930,
"valid_targets_mean": 3994.2,
"valid_targets_min": 2883
},
{
"epoch": 1.700636942675159,
"grad_norm": 0.5395727379224268,
"learning_rate": 3.7573096565411694e-05,
"loss": 0.2902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13815945386886597,
"step": 935,
"valid_targets_mean": 4574.5,
"valid_targets_min": 3154
},
{
"epoch": 1.7097361237488626,
"grad_norm": 0.598304083632461,
"learning_rate": 3.7529626760036814e-05,
"loss": 0.3026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13133779168128967,
"step": 940,
"valid_targets_mean": 3710.1,
"valid_targets_min": 1871
},
{
"epoch": 1.718835304822566,
"grad_norm": 0.6169878314374032,
"learning_rate": 3.7485796703656475e-05,
"loss": 0.301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19230428338050842,
"step": 945,
"valid_targets_mean": 4477.2,
"valid_targets_min": 2484
},
{
"epoch": 1.7279344858962693,
"grad_norm": 0.6494778619925592,
"learning_rate": 3.7441607297021254e-05,
"loss": 0.3127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18376144766807556,
"step": 950,
"valid_targets_mean": 3503.4,
"valid_targets_min": 689
},
{
"epoch": 1.7370336669699729,
"grad_norm": 0.5287904809918028,
"learning_rate": 3.7397059448266786e-05,
"loss": 0.2877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15362298488616943,
"step": 955,
"valid_targets_mean": 4776.2,
"valid_targets_min": 2511
},
{
"epoch": 1.746132848043676,
"grad_norm": 0.6494659791119134,
"learning_rate": 3.735215407289498e-05,
"loss": 0.2944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18310752511024475,
"step": 960,
"valid_targets_mean": 4014.9,
"valid_targets_min": 1611
},
{
"epoch": 1.7552320291173795,
"grad_norm": 0.5731006048795201,
"learning_rate": 3.730689209375533e-05,
"loss": 0.3011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18742819130420685,
"step": 965,
"valid_targets_mean": 4962.2,
"valid_targets_min": 2034
},
{
"epoch": 1.7643312101910829,
"grad_norm": 0.5506132886158287,
"learning_rate": 3.726127444102583e-05,
"loss": 0.2814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15207810699939728,
"step": 970,
"valid_targets_mean": 4009.9,
"valid_targets_min": 1103
},
{
"epoch": 1.7734303912647862,
"grad_norm": 0.4278231884632061,
"learning_rate": 3.721530205219395e-05,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10765276849269867,
"step": 975,
"valid_targets_mean": 5876.9,
"valid_targets_min": 283
},
{
"epoch": 1.7825295723384895,
"grad_norm": 0.5432370249962426,
"learning_rate": 3.716897587203733e-05,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15847131609916687,
"step": 980,
"valid_targets_mean": 4284.6,
"valid_targets_min": 2093
},
{
"epoch": 1.7916287534121929,
"grad_norm": 0.5409964771591507,
"learning_rate": 3.712229685260434e-05,
"loss": 0.3063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1669999659061432,
"step": 985,
"valid_targets_mean": 4959.6,
"valid_targets_min": 1444
},
{
"epoch": 1.8007279344858964,
"grad_norm": 0.5124178526933512,
"learning_rate": 3.707526595319459e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14999991655349731,
"step": 990,
"valid_targets_mean": 4784.5,
"valid_targets_min": 1865
},
{
"epoch": 1.8098271155595995,
"grad_norm": 0.48227382336098407,
"learning_rate": 3.7027884140339144e-05,
"loss": 0.2965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12232952564954758,
"step": 995,
"valid_targets_mean": 3921.4,
"valid_targets_min": 1567
},
{
"epoch": 1.818926296633303,
"grad_norm": 0.5838105781492224,
"learning_rate": 3.698015238778066e-05,
"loss": 0.2801,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12059933692216873,
"step": 1000,
"valid_targets_mean": 2937.2,
"valid_targets_min": 281
},
{
"epoch": 1.8280254777070064,
"grad_norm": 0.5443419726188922,
"learning_rate": 3.693207167645344e-05,
"loss": 0.2814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13547688722610474,
"step": 1005,
"valid_targets_mean": 3484.6,
"valid_targets_min": 1610
},
{
"epoch": 1.8371246587807097,
"grad_norm": 0.6629227757168609,
"learning_rate": 3.6883642994463194e-05,
"loss": 0.2925,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14396211504936218,
"step": 1010,
"valid_targets_mean": 2764.6,
"valid_targets_min": 1192
},
{
"epoch": 1.846223839854413,
"grad_norm": 0.5769994708000856,
"learning_rate": 3.6834867337066805e-05,
"loss": 0.2974,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15609201788902283,
"step": 1015,
"valid_targets_mean": 4123.5,
"valid_targets_min": 1895
},
{
"epoch": 1.8553230209281164,
"grad_norm": 0.626324397009088,
"learning_rate": 3.678574570665181e-05,
"loss": 0.2836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11908911168575287,
"step": 1020,
"valid_targets_mean": 2649.9,
"valid_targets_min": 1653
},
{
"epoch": 1.86442220200182,
"grad_norm": 0.633036325528964,
"learning_rate": 3.673627911271586e-05,
"loss": 0.2953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11095995455980301,
"step": 1025,
"valid_targets_mean": 3540.4,
"valid_targets_min": 1594
},
{
"epoch": 1.873521383075523,
"grad_norm": 0.6333066712978032,
"learning_rate": 3.668646857184591e-05,
"loss": 0.3157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15657323598861694,
"step": 1030,
"valid_targets_mean": 2872.5,
"valid_targets_min": 969
},
{
"epoch": 1.8826205641492266,
"grad_norm": 0.5660080861885046,
"learning_rate": 3.663631510769739e-05,
"loss": 0.3093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1922149509191513,
"step": 1035,
"valid_targets_mean": 4844.6,
"valid_targets_min": 1568
},
{
"epoch": 1.89171974522293,
"grad_norm": 0.7412294025780711,
"learning_rate": 3.658581975097311e-05,
"loss": 0.3016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17560440301895142,
"step": 1040,
"valid_targets_mean": 3082.6,
"valid_targets_min": 330
},
{
"epoch": 1.9008189262966333,
"grad_norm": 0.555376644130959,
"learning_rate": 3.653498353940215e-05,
"loss": 0.2961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16862821578979492,
"step": 1045,
"valid_targets_mean": 3799.9,
"valid_targets_min": 1053
},
{
"epoch": 1.9099181073703366,
"grad_norm": 0.5686697582781365,
"learning_rate": 3.648380751771846e-05,
"loss": 0.2948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18659132719039917,
"step": 1050,
"valid_targets_mean": 4709.6,
"valid_targets_min": 2665
},
{
"epoch": 1.91901728844404,
"grad_norm": 0.5600510837685639,
"learning_rate": 3.6432292737639426e-05,
"loss": 0.2813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15304958820343018,
"step": 1055,
"valid_targets_mean": 4016.4,
"valid_targets_min": 2083
},
{
"epoch": 1.9281164695177435,
"grad_norm": 0.5777594563764268,
"learning_rate": 3.638044025784425e-05,
"loss": 0.2946,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14716693758964539,
"step": 1060,
"valid_targets_mean": 3776.5,
"valid_targets_min": 282
},
{
"epoch": 1.9372156505914466,
"grad_norm": 0.7107526464676869,
"learning_rate": 3.63282511439522e-05,
"loss": 0.2967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15589915215969086,
"step": 1065,
"valid_targets_mean": 2547.8,
"valid_targets_min": 503
},
{
"epoch": 1.9463148316651502,
"grad_norm": 0.6533274131286898,
"learning_rate": 3.627572646850069e-05,
"loss": 0.296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12605586647987366,
"step": 1070,
"valid_targets_mean": 2884.5,
"valid_targets_min": 184
},
{
"epoch": 1.9554140127388535,
"grad_norm": 0.5095962807954009,
"learning_rate": 3.6222867310923296e-05,
"loss": 0.3,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13677296042442322,
"step": 1075,
"valid_targets_mean": 4426.5,
"valid_targets_min": 1530
},
{
"epoch": 1.9645131938125568,
"grad_norm": 0.5431060924066419,
"learning_rate": 3.6169674757527466e-05,
"loss": 0.2869,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13465212285518646,
"step": 1080,
"valid_targets_mean": 3468.8,
"valid_targets_min": 1512
},
{
"epoch": 1.9736123748862604,
"grad_norm": 0.508309995874022,
"learning_rate": 3.61161499014723e-05,
"loss": 0.2896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1512061208486557,
"step": 1085,
"valid_targets_mean": 4771.5,
"valid_targets_min": 3037
},
{
"epoch": 1.9827115559599635,
"grad_norm": 0.563426896365882,
"learning_rate": 3.606229384274604e-05,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1543359011411667,
"step": 1090,
"valid_targets_mean": 4113.5,
"valid_targets_min": 1392
},
{
"epoch": 1.991810737033667,
"grad_norm": 0.5744094191621176,
"learning_rate": 3.600810768814345e-05,
"loss": 0.2972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1515529453754425,
"step": 1095,
"valid_targets_mean": 4293.8,
"valid_targets_min": 1114
},
{
"epoch": 2.0,
"grad_norm": 0.7949063431983748,
"learning_rate": 3.595359255124311e-05,
"loss": 0.3044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3090308606624603,
"step": 1100,
"valid_targets_mean": 4015.4,
"valid_targets_min": 2457
},
{
"epoch": 2.0090991810737036,
"grad_norm": 0.6751657595795937,
"learning_rate": 3.589874955238449e-05,
"loss": 0.2748,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15675446391105652,
"step": 1105,
"valid_targets_mean": 4197.4,
"valid_targets_min": 1874
},
{
"epoch": 2.0181983621474067,
"grad_norm": 0.6454281420919674,
"learning_rate": 3.5843579818644956e-05,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.139465793967247,
"step": 1110,
"valid_targets_mean": 3443.8,
"valid_targets_min": 683
},
{
"epoch": 2.02729754322111,
"grad_norm": 0.4294367360499809,
"learning_rate": 3.5788084483816587e-05,
"loss": 0.2697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08601902425289154,
"step": 1115,
"valid_targets_mean": 6044.8,
"valid_targets_min": 293
},
{
"epoch": 2.0363967242948133,
"grad_norm": 0.6474434008705867,
"learning_rate": 3.573226468838289e-05,
"loss": 0.2756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15890777111053467,
"step": 1120,
"valid_targets_mean": 4120.4,
"valid_targets_min": 2236
},
{
"epoch": 2.045495905368517,
"grad_norm": 0.6607678287468948,
"learning_rate": 3.567612157949536e-05,
"loss": 0.2764,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13646885752677917,
"step": 1125,
"valid_targets_mean": 3556.9,
"valid_targets_min": 2256
},
{
"epoch": 2.05459508644222,
"grad_norm": 0.6001404112466459,
"learning_rate": 3.561965631094988e-05,
"loss": 0.2759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1463991105556488,
"step": 1130,
"valid_targets_mean": 4032.1,
"valid_targets_min": 1838
},
{
"epoch": 2.0636942675159236,
"grad_norm": 0.5395091924578818,
"learning_rate": 3.556287004316305e-05,
"loss": 0.2375,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12247171252965927,
"step": 1135,
"valid_targets_mean": 3741.5,
"valid_targets_min": 1198
},
{
"epoch": 2.072793448589627,
"grad_norm": 0.5912809755997814,
"learning_rate": 3.5505763943148324e-05,
"loss": 0.2636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14579446613788605,
"step": 1140,
"valid_targets_mean": 4449.2,
"valid_targets_min": 2512
},
{
"epoch": 2.08189262966333,
"grad_norm": 0.5639172171971991,
"learning_rate": 3.544833918449199e-05,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12566199898719788,
"step": 1145,
"valid_targets_mean": 3620.0,
"valid_targets_min": 726
},
{
"epoch": 2.0909918107370338,
"grad_norm": 0.5348382118034839,
"learning_rate": 3.5390596947329124e-05,
"loss": 0.2615,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14052331447601318,
"step": 1150,
"valid_targets_mean": 4695.1,
"valid_targets_min": 3057
},
{
"epoch": 2.100090991810737,
"grad_norm": 0.5616636512428199,
"learning_rate": 3.5332538418319254e-05,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08257120102643967,
"step": 1155,
"valid_targets_mean": 2379.0,
"valid_targets_min": 382
},
{
"epoch": 2.1091901728844404,
"grad_norm": 0.5992218870310196,
"learning_rate": 3.527416479062205e-05,
"loss": 0.2721,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1420498937368393,
"step": 1160,
"valid_targets_mean": 3988.2,
"valid_targets_min": 1040
},
{
"epoch": 2.1182893539581436,
"grad_norm": 0.6456667062309294,
"learning_rate": 3.521547726387275e-05,
"loss": 0.2635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12069796770811081,
"step": 1165,
"valid_targets_mean": 2920.1,
"valid_targets_min": 282
},
{
"epoch": 2.127388535031847,
"grad_norm": 0.716226667426586,
"learning_rate": 3.515647704415754e-05,
"loss": 0.2672,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10610539466142654,
"step": 1170,
"valid_targets_mean": 2205.1,
"valid_targets_min": 330
},
{
"epoch": 2.1364877161055507,
"grad_norm": 0.5716159999832333,
"learning_rate": 3.509716534398873e-05,
"loss": 0.2813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11310961842536926,
"step": 1175,
"valid_targets_mean": 3156.5,
"valid_targets_min": 1663
},
{
"epoch": 2.1455868971792538,
"grad_norm": 0.6345606982139681,
"learning_rate": 3.503754338227989e-05,
"loss": 0.2779,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1598322093486786,
"step": 1180,
"valid_targets_mean": 4152.5,
"valid_targets_min": 373
},
{
"epoch": 2.1546860782529573,
"grad_norm": 0.6444097109585533,
"learning_rate": 3.497761238432073e-05,
"loss": 0.2708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1359652876853943,
"step": 1185,
"valid_targets_mean": 3126.6,
"valid_targets_min": 1108
},
{
"epoch": 2.1637852593266604,
"grad_norm": 0.5743362772516076,
"learning_rate": 3.4917373581752e-05,
"loss": 0.2539,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15441018342971802,
"step": 1190,
"valid_targets_mean": 4133.0,
"valid_targets_min": 1427
},
{
"epoch": 2.172884440400364,
"grad_norm": 0.5804857594862529,
"learning_rate": 3.4856828212540094e-05,
"loss": 0.2577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10116176307201385,
"step": 1195,
"valid_targets_mean": 3043.6,
"valid_targets_min": 302
},
{
"epoch": 2.1819836214740675,
"grad_norm": 0.5706299053526133,
"learning_rate": 3.4795977520951684e-05,
"loss": 0.2593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11291206628084183,
"step": 1200,
"valid_targets_mean": 3438.2,
"valid_targets_min": 250
},
{
"epoch": 2.1910828025477707,
"grad_norm": 0.6307638349852748,
"learning_rate": 3.47348227575281e-05,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17008806765079498,
"step": 1205,
"valid_targets_mean": 4208.5,
"valid_targets_min": 1336
},
{
"epoch": 2.200181983621474,
"grad_norm": 0.6618907052519223,
"learning_rate": 3.467336517905966e-05,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13128957152366638,
"step": 1210,
"valid_targets_mean": 2842.1,
"valid_targets_min": 201
},
{
"epoch": 2.2092811646951773,
"grad_norm": 0.5658986082884031,
"learning_rate": 3.46116060485598e-05,
"loss": 0.26,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1362631469964981,
"step": 1215,
"valid_targets_mean": 4190.9,
"valid_targets_min": 324
},
{
"epoch": 2.218380345768881,
"grad_norm": 0.5348818447353793,
"learning_rate": 3.4549546635239167e-05,
"loss": 0.2741,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11287876963615417,
"step": 1220,
"valid_targets_mean": 3727.4,
"valid_targets_min": 2818
},
{
"epoch": 2.227479526842584,
"grad_norm": 0.6385706591191282,
"learning_rate": 3.448718821447953e-05,
"loss": 0.2698,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12544016540050507,
"step": 1225,
"valid_targets_mean": 3231.2,
"valid_targets_min": 979
},
{
"epoch": 2.2365787079162875,
"grad_norm": 0.7819910500944424,
"learning_rate": 3.442453206780751e-05,
"loss": 0.2781,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16756212711334229,
"step": 1230,
"valid_targets_mean": 4297.6,
"valid_targets_min": 2240
},
{
"epoch": 2.245677888989991,
"grad_norm": 0.6080355702316727,
"learning_rate": 3.4361579482868325e-05,
"loss": 0.2686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13607972860336304,
"step": 1235,
"valid_targets_mean": 3773.0,
"valid_targets_min": 2000
},
{
"epoch": 2.254777070063694,
"grad_norm": 0.7152228635802768,
"learning_rate": 3.429833175339927e-05,
"loss": 0.2633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1547776311635971,
"step": 1240,
"valid_targets_mean": 3546.6,
"valid_targets_min": 573
},
{
"epoch": 2.2638762511373978,
"grad_norm": 0.4914702585050212,
"learning_rate": 3.423479017920317e-05,
"loss": 0.2612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1395949423313141,
"step": 1245,
"valid_targets_mean": 4476.6,
"valid_targets_min": 2453
},
{
"epoch": 2.272975432211101,
"grad_norm": 0.5690362474952183,
"learning_rate": 3.4170956066121616e-05,
"loss": 0.2645,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1314096301794052,
"step": 1250,
"valid_targets_mean": 3731.1,
"valid_targets_min": 313
},
{
"epoch": 2.2820746132848044,
"grad_norm": 0.6288288462340934,
"learning_rate": 3.410683072600818e-05,
"loss": 0.2803,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14974285662174225,
"step": 1255,
"valid_targets_mean": 3642.4,
"valid_targets_min": 1186
},
{
"epoch": 2.2911737943585075,
"grad_norm": 0.6119487602662945,
"learning_rate": 3.4042415476701434e-05,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14314958453178406,
"step": 1260,
"valid_targets_mean": 3669.4,
"valid_targets_min": 1599
},
{
"epoch": 2.300272975432211,
"grad_norm": 0.671669349060168,
"learning_rate": 3.397771164199787e-05,
"loss": 0.2434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11376748979091644,
"step": 1265,
"valid_targets_mean": 3127.4,
"valid_targets_min": 148
},
{
"epoch": 2.3093721565059147,
"grad_norm": 0.8943752547371007,
"learning_rate": 3.3912720551624684e-05,
"loss": 0.2519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12145446240901947,
"step": 1270,
"valid_targets_mean": 3842.5,
"valid_targets_min": 414
},
{
"epoch": 2.3184713375796178,
"grad_norm": 0.5656946255603227,
"learning_rate": 3.384744354121246e-05,
"loss": 0.2601,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11813884228467941,
"step": 1275,
"valid_targets_mean": 3730.5,
"valid_targets_min": 2429
},
{
"epoch": 2.3275705186533213,
"grad_norm": 0.7149215078350728,
"learning_rate": 3.3781881952267715e-05,
"loss": 0.258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15160393714904785,
"step": 1280,
"valid_targets_mean": 2399.2,
"valid_targets_min": 270
},
{
"epoch": 2.3366696997270244,
"grad_norm": 0.5280911417580575,
"learning_rate": 3.3716037132145354e-05,
"loss": 0.2674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13931462168693542,
"step": 1285,
"valid_targets_mean": 5500.1,
"valid_targets_min": 304
},
{
"epoch": 2.345768880800728,
"grad_norm": 0.5450007462035853,
"learning_rate": 3.3649910434020934e-05,
"loss": 0.2734,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14486107230186462,
"step": 1290,
"valid_targets_mean": 4728.0,
"valid_targets_min": 1757
},
{
"epoch": 2.3548680618744315,
"grad_norm": 0.5206771266132671,
"learning_rate": 3.35835032168629e-05,
"loss": 0.2704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11571803689002991,
"step": 1295,
"valid_targets_mean": 4034.5,
"valid_targets_min": 850
},
{
"epoch": 2.3639672429481347,
"grad_norm": 0.5980886546519958,
"learning_rate": 3.351681684540462e-05,
"loss": 0.2702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1225738599896431,
"step": 1300,
"valid_targets_mean": 3550.4,
"valid_targets_min": 352
},
{
"epoch": 2.373066424021838,
"grad_norm": 0.6270451107929509,
"learning_rate": 3.3449852690116375e-05,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10917264223098755,
"step": 1305,
"valid_targets_mean": 2968.6,
"valid_targets_min": 240
},
{
"epoch": 2.3821656050955413,
"grad_norm": 0.4647051724658464,
"learning_rate": 3.3382612127177166e-05,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1091746836900711,
"step": 1310,
"valid_targets_mean": 4024.8,
"valid_targets_min": 1696
},
{
"epoch": 2.391264786169245,
"grad_norm": 0.6011078170019583,
"learning_rate": 3.331509653844644e-05,
"loss": 0.2371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1194903701543808,
"step": 1315,
"valid_targets_mean": 3338.9,
"valid_targets_min": 164
},
{
"epoch": 2.400363967242948,
"grad_norm": 0.6174349839198626,
"learning_rate": 3.324730731143571e-05,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1434527039527893,
"step": 1320,
"valid_targets_mean": 3696.2,
"valid_targets_min": 1616
},
{
"epoch": 2.4094631483166515,
"grad_norm": 0.7158219129507043,
"learning_rate": 3.317924583927999e-05,
"loss": 0.2506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17214879393577576,
"step": 1325,
"valid_targets_mean": 3366.8,
"valid_targets_min": 326
},
{
"epoch": 2.4185623293903546,
"grad_norm": 0.6189432134650674,
"learning_rate": 3.311091352070924e-05,
"loss": 0.2644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13491564989089966,
"step": 1330,
"valid_targets_mean": 3157.6,
"valid_targets_min": 1814
},
{
"epoch": 2.427661510464058,
"grad_norm": 0.659452736598218,
"learning_rate": 3.3042311760019554e-05,
"loss": 0.2733,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13368107378482819,
"step": 1335,
"valid_targets_mean": 3190.8,
"valid_targets_min": 557
},
{
"epoch": 2.4367606915377618,
"grad_norm": 0.5820175017066158,
"learning_rate": 3.297344196704431e-05,
"loss": 0.253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14730173349380493,
"step": 1340,
"valid_targets_mean": 4446.1,
"valid_targets_min": 1305
},
{
"epoch": 2.445859872611465,
"grad_norm": 0.64079393332815,
"learning_rate": 3.2904305557125265e-05,
"loss": 0.2732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17309501767158508,
"step": 1345,
"valid_targets_mean": 4094.2,
"valid_targets_min": 2282
},
{
"epoch": 2.4549590536851684,
"grad_norm": 0.7018821745777597,
"learning_rate": 3.2834903951083363e-05,
"loss": 0.2771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16230127215385437,
"step": 1350,
"valid_targets_mean": 3237.2,
"valid_targets_min": 1578
},
{
"epoch": 2.4640582347588715,
"grad_norm": 0.5965681886862967,
"learning_rate": 3.27652385751896e-05,
"loss": 0.2546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1440294235944748,
"step": 1355,
"valid_targets_mean": 4534.4,
"valid_targets_min": 3064
},
{
"epoch": 2.473157415832575,
"grad_norm": 0.6376682960206415,
"learning_rate": 3.269531086113573e-05,
"loss": 0.2753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10924984514713287,
"step": 1360,
"valid_targets_mean": 3105.8,
"valid_targets_min": 262
},
{
"epoch": 2.4822565969062786,
"grad_norm": 0.5685224339416516,
"learning_rate": 3.262512224600478e-05,
"loss": 0.2563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11022941768169403,
"step": 1365,
"valid_targets_mean": 3321.5,
"valid_targets_min": 1122
},
{
"epoch": 2.4913557779799818,
"grad_norm": 0.4679822971053616,
"learning_rate": 3.2554674172241565e-05,
"loss": 0.2566,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10667596012353897,
"step": 1370,
"valid_targets_mean": 6181.6,
"valid_targets_min": 1169
},
{
"epoch": 2.5004549590536853,
"grad_norm": 0.6124226942623071,
"learning_rate": 3.2483968087623026e-05,
"loss": 0.2681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14309075474739075,
"step": 1375,
"valid_targets_mean": 3384.4,
"valid_targets_min": 274
},
{
"epoch": 2.5095541401273884,
"grad_norm": 0.6247095676280948,
"learning_rate": 3.241300544522848e-05,
"loss": 0.2685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1395222246646881,
"step": 1380,
"valid_targets_mean": 3201.8,
"valid_targets_min": 2156
},
{
"epoch": 2.518653321201092,
"grad_norm": 0.5328578793777622,
"learning_rate": 3.234178770340975e-05,
"loss": 0.2557,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08864390850067139,
"step": 1385,
"valid_targets_mean": 4039.1,
"valid_targets_min": 286
},
{
"epoch": 2.5277525022747955,
"grad_norm": 0.4773123951813783,
"learning_rate": 3.227031632576122e-05,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13746377825737,
"step": 1390,
"valid_targets_mean": 6369.5,
"valid_targets_min": 2005
},
{
"epoch": 2.5368516833484986,
"grad_norm": 0.6004745142765648,
"learning_rate": 3.219859278108972e-05,
"loss": 0.2679,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12306511402130127,
"step": 1395,
"valid_targets_mean": 3561.5,
"valid_targets_min": 238
},
{
"epoch": 2.5459508644222018,
"grad_norm": 0.6878586191935012,
"learning_rate": 3.212661854338438e-05,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16240370273590088,
"step": 1400,
"valid_targets_mean": 3584.8,
"valid_targets_min": 1052
},
{
"epoch": 2.5550500454959053,
"grad_norm": 0.5824202233287424,
"learning_rate": 3.20543950917863e-05,
"loss": 0.2626,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13346585631370544,
"step": 1405,
"valid_targets_mean": 2869.1,
"valid_targets_min": 2043
},
{
"epoch": 2.564149226569609,
"grad_norm": 0.680238515947865,
"learning_rate": 3.1981923910558164e-05,
"loss": 0.2769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15468516945838928,
"step": 1410,
"valid_targets_mean": 3367.0,
"valid_targets_min": 1629
},
{
"epoch": 2.573248407643312,
"grad_norm": 0.5202125549195913,
"learning_rate": 3.190920648905376e-05,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10637877881526947,
"step": 1415,
"valid_targets_mean": 3411.2,
"valid_targets_min": 297
},
{
"epoch": 2.5823475887170155,
"grad_norm": 0.5817714257013601,
"learning_rate": 3.183624432168736e-05,
"loss": 0.253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11493627727031708,
"step": 1420,
"valid_targets_mean": 3214.5,
"valid_targets_min": 1573
},
{
"epoch": 2.5914467697907186,
"grad_norm": 0.5458489312850151,
"learning_rate": 3.1763038907902976e-05,
"loss": 0.2737,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10880685597658157,
"step": 1425,
"valid_targets_mean": 3591.6,
"valid_targets_min": 633
},
{
"epoch": 2.600545950864422,
"grad_norm": 0.5542156910126472,
"learning_rate": 3.16895917521436e-05,
"loss": 0.2465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13165003061294556,
"step": 1430,
"valid_targets_mean": 4754.2,
"valid_targets_min": 3017
},
{
"epoch": 2.6096451319381258,
"grad_norm": 0.6533595108199927,
"learning_rate": 3.161590436382023e-05,
"loss": 0.2768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1214178055524826,
"step": 1435,
"valid_targets_mean": 2685.4,
"valid_targets_min": 355
},
{
"epoch": 2.618744313011829,
"grad_norm": 0.5111980360739798,
"learning_rate": 3.1541978257280915e-05,
"loss": 0.2575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12494254857301712,
"step": 1440,
"valid_targets_mean": 5197.2,
"valid_targets_min": 2480
},
{
"epoch": 2.6278434940855324,
"grad_norm": 0.5763523371672339,
"learning_rate": 3.1467814951779564e-05,
"loss": 0.2686,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09673012048006058,
"step": 1445,
"valid_targets_mean": 2934.5,
"valid_targets_min": 640
},
{
"epoch": 2.6369426751592355,
"grad_norm": 0.7378840239597381,
"learning_rate": 3.139341597144478e-05,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11686737090349197,
"step": 1450,
"valid_targets_mean": 3688.1,
"valid_targets_min": 414
},
{
"epoch": 2.646041856232939,
"grad_norm": 0.5926896588467113,
"learning_rate": 3.13187828452485e-05,
"loss": 0.2758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13565243780612946,
"step": 1455,
"valid_targets_mean": 3212.2,
"valid_targets_min": 303
},
{
"epoch": 2.6551410373066426,
"grad_norm": 0.5485940410600364,
"learning_rate": 3.1243917106974583e-05,
"loss": 0.2685,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13510656356811523,
"step": 1460,
"valid_targets_mean": 3864.6,
"valid_targets_min": 2506
},
{
"epoch": 2.6642402183803457,
"grad_norm": 0.6320710190885632,
"learning_rate": 3.116882029518732e-05,
"loss": 0.2673,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15843375027179718,
"step": 1465,
"valid_targets_mean": 3470.5,
"valid_targets_min": 1637
},
{
"epoch": 2.673339399454049,
"grad_norm": 0.6126966480462319,
"learning_rate": 3.109349395319976e-05,
"loss": 0.2791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15615004301071167,
"step": 1470,
"valid_targets_mean": 3915.4,
"valid_targets_min": 1532
},
{
"epoch": 2.6824385805277524,
"grad_norm": 0.5686770606117241,
"learning_rate": 3.101793962904205e-05,
"loss": 0.2586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1370496153831482,
"step": 1475,
"valid_targets_mean": 4079.1,
"valid_targets_min": 919
},
{
"epoch": 2.691537761601456,
"grad_norm": 0.5856441860541246,
"learning_rate": 3.094215887542957e-05,
"loss": 0.2669,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.110836461186409,
"step": 1480,
"valid_targets_mean": 2751.5,
"valid_targets_min": 1269
},
{
"epoch": 2.700636942675159,
"grad_norm": 0.6233578615196819,
"learning_rate": 3.086615324973107e-05,
"loss": 0.2708,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15025722980499268,
"step": 1485,
"valid_targets_mean": 3894.9,
"valid_targets_min": 312
},
{
"epoch": 2.7097361237488626,
"grad_norm": 0.536781802707285,
"learning_rate": 3.07899243139366e-05,
"loss": 0.2633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09888775646686554,
"step": 1490,
"valid_targets_mean": 3418.4,
"valid_targets_min": 844
},
{
"epoch": 2.7188353048225657,
"grad_norm": 0.6866854486013821,
"learning_rate": 3.0713473634625507e-05,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12067543715238571,
"step": 1495,
"valid_targets_mean": 3014.2,
"valid_targets_min": 643
},
{
"epoch": 2.7279344858962693,
"grad_norm": 0.6751006196997635,
"learning_rate": 3.0636802782934146e-05,
"loss": 0.2542,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1544184535741806,
"step": 1500,
"valid_targets_mean": 2988.5,
"valid_targets_min": 1152
},
{
"epoch": 2.737033666969973,
"grad_norm": 0.442079678607608,
"learning_rate": 3.055991333452364e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1539030522108078,
"step": 1505,
"valid_targets_mean": 6319.1,
"valid_targets_min": 1834
},
{
"epoch": 2.746132848043676,
"grad_norm": 0.5873539144786856,
"learning_rate": 3.0482806869547495e-05,
"loss": 0.2536,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1154666393995285,
"step": 1510,
"valid_targets_mean": 3250.0,
"valid_targets_min": 991
},
{
"epoch": 2.7552320291173795,
"grad_norm": 0.5752182793640411,
"learning_rate": 3.0405484972619116e-05,
"loss": 0.2677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14140355587005615,
"step": 1515,
"valid_targets_mean": 4366.2,
"valid_targets_min": 1602
},
{
"epoch": 2.7643312101910826,
"grad_norm": 0.726912967043729,
"learning_rate": 3.0327949232779242e-05,
"loss": 0.2677,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13592445850372314,
"step": 1520,
"valid_targets_mean": 3295.1,
"valid_targets_min": 2203
},
{
"epoch": 2.773430391264786,
"grad_norm": 0.6215196361746996,
"learning_rate": 3.0250201243463297e-05,
"loss": 0.2581,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16549277305603027,
"step": 1525,
"valid_targets_mean": 3900.1,
"valid_targets_min": 1860
},
{
"epoch": 2.7825295723384897,
"grad_norm": 0.5415517684578123,
"learning_rate": 3.0172242602468637e-05,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12296943366527557,
"step": 1530,
"valid_targets_mean": 4461.1,
"valid_targets_min": 820
},
{
"epoch": 2.791628753412193,
"grad_norm": 0.4749079544937464,
"learning_rate": 3.009407491192172e-05,
"loss": 0.2651,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09805374592542648,
"step": 1535,
"valid_targets_mean": 4534.9,
"valid_targets_min": 1317
},
{
"epoch": 2.8007279344858964,
"grad_norm": 0.5380978879739551,
"learning_rate": 3.0015699778245177e-05,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11909287422895432,
"step": 1540,
"valid_targets_mean": 3597.5,
"valid_targets_min": 311
},
{
"epoch": 2.8098271155595995,
"grad_norm": 0.6019469943728163,
"learning_rate": 2.9937118812124796e-05,
"loss": 0.2713,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13189806044101715,
"step": 1545,
"valid_targets_mean": 3001.1,
"valid_targets_min": 2021
},
{
"epoch": 2.818926296633303,
"grad_norm": 0.6243801288042384,
"learning_rate": 2.9858333628476423e-05,
"loss": 0.2442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16052299737930298,
"step": 1550,
"valid_targets_mean": 4131.5,
"valid_targets_min": 2309
},
{
"epoch": 2.8280254777070066,
"grad_norm": 0.7862122605057308,
"learning_rate": 2.977934584641278e-05,
"loss": 0.27,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12268385291099548,
"step": 1555,
"valid_targets_mean": 1729.8,
"valid_targets_min": 275
},
{
"epoch": 2.8371246587807097,
"grad_norm": 0.5889590266099785,
"learning_rate": 2.9700157089210174e-05,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.133815199136734,
"step": 1560,
"valid_targets_mean": 4164.0,
"valid_targets_min": 169
},
{
"epoch": 2.846223839854413,
"grad_norm": 0.5718002161440873,
"learning_rate": 2.9620768984275163e-05,
"loss": 0.2607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13359403610229492,
"step": 1565,
"valid_targets_mean": 3803.5,
"valid_targets_min": 2257
},
{
"epoch": 2.8553230209281164,
"grad_norm": 0.5008652494906181,
"learning_rate": 2.9541183163111076e-05,
"loss": 0.2631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10507234930992126,
"step": 1570,
"valid_targets_mean": 3964.6,
"valid_targets_min": 2507
},
{
"epoch": 2.86442220200182,
"grad_norm": 0.5010428450320672,
"learning_rate": 2.9461401261284536e-05,
"loss": 0.2534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1268589198589325,
"step": 1575,
"valid_targets_mean": 5799.9,
"valid_targets_min": 2969
},
{
"epoch": 2.873521383075523,
"grad_norm": 0.58820416909119,
"learning_rate": 2.9381424918391775e-05,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10214714705944061,
"step": 1580,
"valid_targets_mean": 2422.4,
"valid_targets_min": 261
},
{
"epoch": 2.8826205641492266,
"grad_norm": 0.5880343496175168,
"learning_rate": 2.9301255778025014e-05,
"loss": 0.2704,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1449739933013916,
"step": 1585,
"valid_targets_mean": 4025.0,
"valid_targets_min": 2526
},
{
"epoch": 2.8917197452229297,
"grad_norm": 0.6036710857573726,
"learning_rate": 2.9220895487738627e-05,
"loss": 0.2617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13294830918312073,
"step": 1590,
"valid_targets_mean": 2878.0,
"valid_targets_min": 1298
},
{
"epoch": 2.9008189262966333,
"grad_norm": 0.6020483772824585,
"learning_rate": 2.9140345699015328e-05,
"loss": 0.2699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12777581810951233,
"step": 1595,
"valid_targets_mean": 3732.0,
"valid_targets_min": 1366
},
{
"epoch": 2.909918107370337,
"grad_norm": 0.6714113794998876,
"learning_rate": 2.905960806723219e-05,
"loss": 0.286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13986052572727203,
"step": 1600,
"valid_targets_mean": 3049.1,
"valid_targets_min": 1681
},
{
"epoch": 2.91901728844404,
"grad_norm": 0.4996309143387443,
"learning_rate": 2.8978684251626652e-05,
"loss": 0.2661,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1562909185886383,
"step": 1605,
"valid_targets_mean": 6508.9,
"valid_targets_min": 3385
},
{
"epoch": 2.9281164695177435,
"grad_norm": 0.5506771309751523,
"learning_rate": 2.8897575915262418e-05,
"loss": 0.2496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13283151388168335,
"step": 1610,
"valid_targets_mean": 4325.6,
"valid_targets_min": 1944
},
{
"epoch": 2.9372156505914466,
"grad_norm": 0.566063666317329,
"learning_rate": 2.8816284724995273e-05,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09932658076286316,
"step": 1615,
"valid_targets_mean": 2903.8,
"valid_targets_min": 493
},
{
"epoch": 2.94631483166515,
"grad_norm": 0.5468189644584138,
"learning_rate": 2.8734812351438823e-05,
"loss": 0.2622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11008670181035995,
"step": 1620,
"valid_targets_mean": 3202.6,
"valid_targets_min": 938
},
{
"epoch": 2.9554140127388537,
"grad_norm": 0.5886448368356968,
"learning_rate": 2.8653160468930168e-05,
"loss": 0.2618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1270906925201416,
"step": 1625,
"valid_targets_mean": 3301.6,
"valid_targets_min": 248
},
{
"epoch": 2.964513193812557,
"grad_norm": 0.6003432400545452,
"learning_rate": 2.85713307554955e-05,
"loss": 0.2674,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15293045341968536,
"step": 1630,
"valid_targets_mean": 3731.0,
"valid_targets_min": 1299
},
{
"epoch": 2.9736123748862604,
"grad_norm": 0.5216458066693334,
"learning_rate": 2.8489324892815604e-05,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10243799537420273,
"step": 1635,
"valid_targets_mean": 4290.9,
"valid_targets_min": 2556
},
{
"epoch": 2.9827115559599635,
"grad_norm": 0.647682228722322,
"learning_rate": 2.8407144566191315e-05,
"loss": 0.2641,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11987321078777313,
"step": 1640,
"valid_targets_mean": 2687.5,
"valid_targets_min": 331
},
{
"epoch": 2.991810737033667,
"grad_norm": 0.5956168466588846,
"learning_rate": 2.8324791464508856e-05,
"loss": 0.2804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12937332689762115,
"step": 1645,
"valid_targets_mean": 3305.0,
"valid_targets_min": 1403
},
{
"epoch": 3.0,
"grad_norm": 0.9029027098902189,
"learning_rate": 2.824226728020516e-05,
"loss": 0.2554,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30957484245300293,
"step": 1650,
"valid_targets_mean": 3302.6,
"valid_targets_min": 1365
},
{
"epoch": 3.0090991810737036,
"grad_norm": 0.6627737045647052,
"learning_rate": 2.8159573709233074e-05,
"loss": 0.2479,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1534401923418045,
"step": 1655,
"valid_targets_mean": 3602.0,
"valid_targets_min": 685
},
{
"epoch": 3.0181983621474067,
"grad_norm": 0.6291036345714702,
"learning_rate": 2.80767124510265e-05,
"loss": 0.2109,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12472149729728699,
"step": 1660,
"valid_targets_mean": 3638.4,
"valid_targets_min": 1366
},
{
"epoch": 3.02729754322111,
"grad_norm": 0.5541449376554247,
"learning_rate": 2.7993685208465483e-05,
"loss": 0.2474,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1034252867102623,
"step": 1665,
"valid_targets_mean": 4169.1,
"valid_targets_min": 1226
},
{
"epoch": 3.0363967242948133,
"grad_norm": 0.6778018211647409,
"learning_rate": 2.7910493687841213e-05,
"loss": 0.2465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13861678540706635,
"step": 1670,
"valid_targets_mean": 4292.2,
"valid_targets_min": 1284
},
{
"epoch": 3.045495905368517,
"grad_norm": 0.6258555524981517,
"learning_rate": 2.7827139598820947e-05,
"loss": 0.2359,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10056846588850021,
"step": 1675,
"valid_targets_mean": 2452.4,
"valid_targets_min": 1017
},
{
"epoch": 3.05459508644222,
"grad_norm": 0.5339850920139807,
"learning_rate": 2.774362465441288e-05,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10936719179153442,
"step": 1680,
"valid_targets_mean": 4660.5,
"valid_targets_min": 313
},
{
"epoch": 3.0636942675159236,
"grad_norm": 0.6071416816239227,
"learning_rate": 2.7659950570930956e-05,
"loss": 0.2209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10698353499174118,
"step": 1685,
"valid_targets_mean": 2520.0,
"valid_targets_min": 328
},
{
"epoch": 3.072793448589627,
"grad_norm": 0.5865148303237524,
"learning_rate": 2.7576119067959565e-05,
"loss": 0.2398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09415340423583984,
"step": 1690,
"valid_targets_mean": 3474.0,
"valid_targets_min": 1947
},
{
"epoch": 3.08189262966333,
"grad_norm": 0.6516039766541762,
"learning_rate": 2.7492131868318247e-05,
"loss": 0.2305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10586540400981903,
"step": 1695,
"valid_targets_mean": 2984.5,
"valid_targets_min": 1568
},
{
"epoch": 3.0909918107370338,
"grad_norm": 0.5753829853634493,
"learning_rate": 2.7407990698026227e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13014456629753113,
"step": 1700,
"valid_targets_mean": 4518.5,
"valid_targets_min": 298
},
{
"epoch": 3.100090991810737,
"grad_norm": 0.712305406096257,
"learning_rate": 2.7323697286266998e-05,
"loss": 0.2451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15478244423866272,
"step": 1705,
"valid_targets_mean": 3958.9,
"valid_targets_min": 1431
},
{
"epoch": 3.1091901728844404,
"grad_norm": 0.5603421184349171,
"learning_rate": 2.7239253365352774e-05,
"loss": 0.2337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1260107159614563,
"step": 1710,
"valid_targets_mean": 4813.8,
"valid_targets_min": 2219
},
{
"epoch": 3.1182893539581436,
"grad_norm": 0.6945149678969376,
"learning_rate": 2.7154660670688867e-05,
"loss": 0.2387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1382228136062622,
"step": 1715,
"valid_targets_mean": 2869.9,
"valid_targets_min": 1752
},
{
"epoch": 3.127388535031847,
"grad_norm": 0.6608358333888942,
"learning_rate": 2.706992094073803e-05,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1332719475030899,
"step": 1720,
"valid_targets_mean": 3072.0,
"valid_targets_min": 2326
},
{
"epoch": 3.1364877161055507,
"grad_norm": 0.5884814788647655,
"learning_rate": 2.6985035916984746e-05,
"loss": 0.2488,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1449941098690033,
"step": 1725,
"valid_targets_mean": 5181.2,
"valid_targets_min": 3160
},
{
"epoch": 3.1455868971792538,
"grad_norm": 0.5685308536656252,
"learning_rate": 2.6900007343899414e-05,
"loss": 0.2331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11001268029212952,
"step": 1730,
"valid_targets_mean": 4469.2,
"valid_targets_min": 2386
},
{
"epoch": 3.1546860782529573,
"grad_norm": 0.692558286911919,
"learning_rate": 2.6814836968902535e-05,
"loss": 0.2378,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14557890594005585,
"step": 1735,
"valid_targets_mean": 3579.2,
"valid_targets_min": 1998
},
{
"epoch": 3.1637852593266604,
"grad_norm": 0.589001169535335,
"learning_rate": 2.6729526542328755e-05,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11505816876888275,
"step": 1740,
"valid_targets_mean": 4077.8,
"valid_targets_min": 1171
},
{
"epoch": 3.172884440400364,
"grad_norm": 0.5372069609633437,
"learning_rate": 2.6644077817390933e-05,
"loss": 0.2351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11513690650463104,
"step": 1745,
"valid_targets_mean": 4349.6,
"valid_targets_min": 2454
},
{
"epoch": 3.1819836214740675,
"grad_norm": 0.6140011398548391,
"learning_rate": 2.6558492550144092e-05,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13439062237739563,
"step": 1750,
"valid_targets_mean": 4064.9,
"valid_targets_min": 2142
},
{
"epoch": 3.1910828025477707,
"grad_norm": 0.5956060584442296,
"learning_rate": 2.6472772499449323e-05,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08770699054002762,
"step": 1755,
"valid_targets_mean": 2663.2,
"valid_targets_min": 1140
},
{
"epoch": 3.200181983621474,
"grad_norm": 0.6430662067017598,
"learning_rate": 2.6386919426937655e-05,
"loss": 0.2365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1511210948228836,
"step": 1760,
"valid_targets_mean": 3950.0,
"valid_targets_min": 545
},
{
"epoch": 3.2092811646951773,
"grad_norm": 0.5351581599278695,
"learning_rate": 2.6300935096973858e-05,
"loss": 0.2525,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11395445466041565,
"step": 1765,
"valid_targets_mean": 4045.6,
"valid_targets_min": 2197
},
{
"epoch": 3.218380345768881,
"grad_norm": 0.6904452232059044,
"learning_rate": 2.6214821276620157e-05,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12120945751667023,
"step": 1770,
"valid_targets_mean": 3098.6,
"valid_targets_min": 250
},
{
"epoch": 3.227479526842584,
"grad_norm": 0.5777775090819005,
"learning_rate": 2.6128579735599924e-05,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08591067045927048,
"step": 1775,
"valid_targets_mean": 1854.9,
"valid_targets_min": 276
},
{
"epoch": 3.2365787079162875,
"grad_norm": 0.5250787648078289,
"learning_rate": 2.6042212246261337e-05,
"loss": 0.2391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10418880730867386,
"step": 1780,
"valid_targets_mean": 3393.4,
"valid_targets_min": 1993
},
{
"epoch": 3.245677888989991,
"grad_norm": 0.6748695446147454,
"learning_rate": 2.595572058354092e-05,
"loss": 0.2215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11711028218269348,
"step": 1785,
"valid_targets_mean": 3478.6,
"valid_targets_min": 1383
},
{
"epoch": 3.254777070063694,
"grad_norm": 0.680006289788221,
"learning_rate": 2.5869106524927096e-05,
"loss": 0.2415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13660980761051178,
"step": 1790,
"valid_targets_mean": 3546.8,
"valid_targets_min": 260
},
{
"epoch": 3.2638762511373978,
"grad_norm": 0.6203082184778486,
"learning_rate": 2.5782371850423627e-05,
"loss": 0.2297,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.133883997797966,
"step": 1795,
"valid_targets_mean": 4430.2,
"valid_targets_min": 3003
},
{
"epoch": 3.272975432211101,
"grad_norm": 0.592304583983555,
"learning_rate": 2.5695518342513047e-05,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11032648384571075,
"step": 1800,
"valid_targets_mean": 3791.2,
"valid_targets_min": 2560
},
{
"epoch": 3.2820746132848044,
"grad_norm": 0.6615154368059429,
"learning_rate": 2.5608547786120056e-05,
"loss": 0.235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10840634256601334,
"step": 1805,
"valid_targets_mean": 3448.1,
"valid_targets_min": 965
},
{
"epoch": 3.2911737943585075,
"grad_norm": 0.6061214028536877,
"learning_rate": 2.55214619685748e-05,
"loss": 0.2385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11647415161132812,
"step": 1810,
"valid_targets_mean": 3058.6,
"valid_targets_min": 251
},
{
"epoch": 3.300272975432211,
"grad_norm": 0.612922757802074,
"learning_rate": 2.5434262679576157e-05,
"loss": 0.226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12078569084405899,
"step": 1815,
"valid_targets_mean": 4058.1,
"valid_targets_min": 275
},
{
"epoch": 3.3093721565059147,
"grad_norm": 0.7106121648750277,
"learning_rate": 2.5346951711154946e-05,
"loss": 0.2506,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10854356735944748,
"step": 1820,
"valid_targets_mean": 2593.4,
"valid_targets_min": 324
},
{
"epoch": 3.3184713375796178,
"grad_norm": 0.6913113203702447,
"learning_rate": 2.5259530857637125e-05,
"loss": 0.2351,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13775470852851868,
"step": 1825,
"valid_targets_mean": 3313.2,
"valid_targets_min": 2581
},
{
"epoch": 3.3275705186533213,
"grad_norm": 0.682855819822667,
"learning_rate": 2.5172001915606883e-05,
"loss": 0.2305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14159566164016724,
"step": 1830,
"valid_targets_mean": 3209.6,
"valid_targets_min": 496
},
{
"epoch": 3.3366696997270244,
"grad_norm": 0.5972089007845723,
"learning_rate": 2.5084366683869746e-05,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09136951714754105,
"step": 1835,
"valid_targets_mean": 2752.5,
"valid_targets_min": 1878
},
{
"epoch": 3.345768880800728,
"grad_norm": 0.6302061631973847,
"learning_rate": 2.4996626963415577e-05,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09223796427249908,
"step": 1840,
"valid_targets_mean": 2731.0,
"valid_targets_min": 289
},
{
"epoch": 3.3548680618744315,
"grad_norm": 0.635200704727907,
"learning_rate": 2.4908784557381616e-05,
"loss": 0.2341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12977059185504913,
"step": 1845,
"valid_targets_mean": 3390.6,
"valid_targets_min": 1780
},
{
"epoch": 3.3639672429481347,
"grad_norm": 0.616785501369989,
"learning_rate": 2.4820841271015364e-05,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12457115948200226,
"step": 1850,
"valid_targets_mean": 4544.5,
"valid_targets_min": 2092
},
{
"epoch": 3.373066424021838,
"grad_norm": 0.5691230207719173,
"learning_rate": 2.4732798911637525e-05,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10241171717643738,
"step": 1855,
"valid_targets_mean": 3519.0,
"valid_targets_min": 274
},
{
"epoch": 3.3821656050955413,
"grad_norm": 0.6705750722839043,
"learning_rate": 2.4644659288604853e-05,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08712461590766907,
"step": 1860,
"valid_targets_mean": 1878.9,
"valid_targets_min": 253
},
{
"epoch": 3.391264786169245,
"grad_norm": 0.6859178535407267,
"learning_rate": 2.4556424213272955e-05,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10289760679006577,
"step": 1865,
"valid_targets_mean": 2637.1,
"valid_targets_min": 411
},
{
"epoch": 3.400363967242948,
"grad_norm": 0.6468930323424454,
"learning_rate": 2.4468095498959086e-05,
"loss": 0.2248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12468135356903076,
"step": 1870,
"valid_targets_mean": 3236.8,
"valid_targets_min": 341
},
{
"epoch": 3.4094631483166515,
"grad_norm": 0.6573233362355302,
"learning_rate": 2.4379674960904867e-05,
"loss": 0.2412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1340944617986679,
"step": 1875,
"valid_targets_mean": 3330.8,
"valid_targets_min": 785
},
{
"epoch": 3.4185623293903546,
"grad_norm": 0.6857110616562382,
"learning_rate": 2.4291164416238994e-05,
"loss": 0.2342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13505122065544128,
"step": 1880,
"valid_targets_mean": 3543.1,
"valid_targets_min": 1663
},
{
"epoch": 3.427661510464058,
"grad_norm": 0.5745741235715318,
"learning_rate": 2.4202565683939872e-05,
"loss": 0.2423,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1247991994023323,
"step": 1885,
"valid_targets_mean": 4356.1,
"valid_targets_min": 1386
},
{
"epoch": 3.4367606915377618,
"grad_norm": 0.626758290724901,
"learning_rate": 2.411388058479827e-05,
"loss": 0.2253,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12153643369674683,
"step": 1890,
"valid_targets_mean": 3427.8,
"valid_targets_min": 1926
},
{
"epoch": 3.445859872611465,
"grad_norm": 0.6666850067429048,
"learning_rate": 2.402511094137987e-05,
"loss": 0.2139,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14569628238677979,
"step": 1895,
"valid_targets_mean": 4079.9,
"valid_targets_min": 2271
},
{
"epoch": 3.4549590536851684,
"grad_norm": 0.6201028472502161,
"learning_rate": 2.3936258577987807e-05,
"loss": 0.2317,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13898374140262604,
"step": 1900,
"valid_targets_mean": 3923.2,
"valid_targets_min": 1147
},
{
"epoch": 3.4640582347588715,
"grad_norm": 0.5393992734649197,
"learning_rate": 2.3847325320625223e-05,
"loss": 0.2384,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11783619225025177,
"step": 1905,
"valid_targets_mean": 4982.4,
"valid_targets_min": 2594
},
{
"epoch": 3.473157415832575,
"grad_norm": 0.6058665738384407,
"learning_rate": 2.3758312996957676e-05,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11445163190364838,
"step": 1910,
"valid_targets_mean": 3420.1,
"valid_targets_min": 1665
},
{
"epoch": 3.4822565969062786,
"grad_norm": 0.569106347802839,
"learning_rate": 2.366922343627565e-05,
"loss": 0.2201,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1065153181552887,
"step": 1915,
"valid_targets_mean": 3185.2,
"valid_targets_min": 1122
},
{
"epoch": 3.4913557779799818,
"grad_norm": 0.6711360787435348,
"learning_rate": 2.358005846945689e-05,
"loss": 0.2336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13603505492210388,
"step": 1920,
"valid_targets_mean": 3550.5,
"valid_targets_min": 1731
},
{
"epoch": 3.5004549590536853,
"grad_norm": 0.6029423817813914,
"learning_rate": 2.349081992892885e-05,
"loss": 0.2365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1385492980480194,
"step": 1925,
"valid_targets_mean": 4586.5,
"valid_targets_min": 2817
},
{
"epoch": 3.5095541401273884,
"grad_norm": 0.5721952870442969,
"learning_rate": 2.3401509648630954e-05,
"loss": 0.2385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10515997558832169,
"step": 1930,
"valid_targets_mean": 4997.0,
"valid_targets_min": 3277
},
{
"epoch": 3.518653321201092,
"grad_norm": 0.6669379189824646,
"learning_rate": 2.331212946397698e-05,
"loss": 0.2434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12849804759025574,
"step": 1935,
"valid_targets_mean": 3554.0,
"valid_targets_min": 1566
},
{
"epoch": 3.5277525022747955,
"grad_norm": 0.5582718810153309,
"learning_rate": 2.3222681211817287e-05,
"loss": 0.2386,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10624731332063675,
"step": 1940,
"valid_targets_mean": 4358.5,
"valid_targets_min": 2948
},
{
"epoch": 3.5368516833484986,
"grad_norm": 0.6109402511946427,
"learning_rate": 2.31331667304011e-05,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11600244790315628,
"step": 1945,
"valid_targets_mean": 3243.4,
"valid_targets_min": 1742
},
{
"epoch": 3.5459508644222018,
"grad_norm": 0.6223125409986712,
"learning_rate": 2.3043587859338735e-05,
"loss": 0.2238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11614356935024261,
"step": 1950,
"valid_targets_mean": 3193.0,
"valid_targets_min": 1706
},
{
"epoch": 3.5550500454959053,
"grad_norm": 0.7483186029922464,
"learning_rate": 2.2953946439563736e-05,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1298794150352478,
"step": 1955,
"valid_targets_mean": 2468.0,
"valid_targets_min": 931
},
{
"epoch": 3.564149226569609,
"grad_norm": 0.5256637837739685,
"learning_rate": 2.286424431329513e-05,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08543480932712555,
"step": 1960,
"valid_targets_mean": 3995.2,
"valid_targets_min": 635
},
{
"epoch": 3.573248407643312,
"grad_norm": 0.6920745965137178,
"learning_rate": 2.277448332399949e-05,
"loss": 0.2228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14779648184776306,
"step": 1965,
"valid_targets_mean": 3713.6,
"valid_targets_min": 362
},
{
"epoch": 3.5823475887170155,
"grad_norm": 0.6731284896447256,
"learning_rate": 2.2684665316353112e-05,
"loss": 0.2414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.136958509683609,
"step": 1970,
"valid_targets_mean": 3991.2,
"valid_targets_min": 2124
},
{
"epoch": 3.5914467697907186,
"grad_norm": 0.5687167935216879,
"learning_rate": 2.2594792136204037e-05,
"loss": 0.2388,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1017768532037735,
"step": 1975,
"valid_targets_mean": 3863.9,
"valid_targets_min": 2661
},
{
"epoch": 3.600545950864422,
"grad_norm": 0.5722468143481457,
"learning_rate": 2.250486563053419e-05,
"loss": 0.2411,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13285937905311584,
"step": 1980,
"valid_targets_mean": 4369.8,
"valid_targets_min": 336
},
{
"epoch": 3.6096451319381258,
"grad_norm": 0.6478782120428274,
"learning_rate": 2.241488764742135e-05,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11048940569162369,
"step": 1985,
"valid_targets_mean": 3022.1,
"valid_targets_min": 204
},
{
"epoch": 3.618744313011829,
"grad_norm": 0.7168992027139708,
"learning_rate": 2.232486003600126e-05,
"loss": 0.2209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1075039803981781,
"step": 1990,
"valid_targets_mean": 3019.2,
"valid_targets_min": 1241
},
{
"epoch": 3.6278434940855324,
"grad_norm": 0.6570252469182816,
"learning_rate": 2.223478464642952e-05,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11854603886604309,
"step": 1995,
"valid_targets_mean": 3483.4,
"valid_targets_min": 1784
},
{
"epoch": 3.6369426751592355,
"grad_norm": 0.6144475955980022,
"learning_rate": 2.2144663329843653e-05,
"loss": 0.2339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13097110390663147,
"step": 2000,
"valid_targets_mean": 3481.0,
"valid_targets_min": 905
},
{
"epoch": 3.646041856232939,
"grad_norm": 0.6052858271327498,
"learning_rate": 2.205449793832502e-05,
"loss": 0.2284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10313941538333893,
"step": 2005,
"valid_targets_mean": 2982.5,
"valid_targets_min": 1198
},
{
"epoch": 3.6551410373066426,
"grad_norm": 0.44991266551208103,
"learning_rate": 2.1964290324860746e-05,
"loss": 0.216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0842527225613594,
"step": 2010,
"valid_targets_mean": 3413.9,
"valid_targets_min": 1441
},
{
"epoch": 3.6642402183803457,
"grad_norm": 0.6071858600053288,
"learning_rate": 2.1874042343305685e-05,
"loss": 0.2497,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13529914617538452,
"step": 2015,
"valid_targets_mean": 4147.6,
"valid_targets_min": 1343
},
{
"epoch": 3.673339399454049,
"grad_norm": 0.47499136647666873,
"learning_rate": 2.1783755848344276e-05,
"loss": 0.222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09141851961612701,
"step": 2020,
"valid_targets_mean": 5427.8,
"valid_targets_min": 1521
},
{
"epoch": 3.6824385805277524,
"grad_norm": 0.6369533030675754,
"learning_rate": 2.1693432695452467e-05,
"loss": 0.2503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0990004688501358,
"step": 2025,
"valid_targets_mean": 3742.5,
"valid_targets_min": 2285
},
{
"epoch": 3.691537761601456,
"grad_norm": 0.5840261880984583,
"learning_rate": 2.1603074740859534e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14113259315490723,
"step": 2030,
"valid_targets_mean": 4586.0,
"valid_targets_min": 2810
},
{
"epoch": 3.700636942675159,
"grad_norm": 0.6175870857155759,
"learning_rate": 2.1512683841509982e-05,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1321922242641449,
"step": 2035,
"valid_targets_mean": 4026.5,
"valid_targets_min": 1495
},
{
"epoch": 3.7097361237488626,
"grad_norm": 0.6077331223001471,
"learning_rate": 2.1422261855025357e-05,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13017022609710693,
"step": 2040,
"valid_targets_mean": 3657.9,
"valid_targets_min": 938
},
{
"epoch": 3.7188353048225657,
"grad_norm": 0.5264657471184423,
"learning_rate": 2.133181063966608e-05,
"loss": 0.2257,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1340341866016388,
"step": 2045,
"valid_targets_mean": 5327.8,
"valid_targets_min": 2985
},
{
"epoch": 3.7279344858962693,
"grad_norm": 0.47835522815598563,
"learning_rate": 2.1241332054293243e-05,
"loss": 0.2368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10275916755199432,
"step": 2050,
"valid_targets_mean": 4582.0,
"valid_targets_min": 1621
},
{
"epoch": 3.737033666969973,
"grad_norm": 0.6090285873450105,
"learning_rate": 2.115082795833044e-05,
"loss": 0.2339,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13608521223068237,
"step": 2055,
"valid_targets_mean": 4380.6,
"valid_targets_min": 1129
},
{
"epoch": 3.746132848043676,
"grad_norm": 0.6171346398603881,
"learning_rate": 2.1060300211725496e-05,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06999486684799194,
"step": 2060,
"valid_targets_mean": 2120.9,
"valid_targets_min": 264
},
{
"epoch": 3.7552320291173795,
"grad_norm": 0.5078775221738135,
"learning_rate": 2.096975067491233e-05,
"loss": 0.2142,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07993730902671814,
"step": 2065,
"valid_targets_mean": 3289.5,
"valid_targets_min": 1058
},
{
"epoch": 3.7643312101910826,
"grad_norm": 0.5666497704776816,
"learning_rate": 2.087918120877263e-05,
"loss": 0.2361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10957177728414536,
"step": 2070,
"valid_targets_mean": 3678.8,
"valid_targets_min": 2266
},
{
"epoch": 3.773430391264786,
"grad_norm": 0.6118108100047842,
"learning_rate": 2.0788593674597663e-05,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12245075404644012,
"step": 2075,
"valid_targets_mean": 4218.4,
"valid_targets_min": 2510
},
{
"epoch": 3.7825295723384897,
"grad_norm": 0.568781777071965,
"learning_rate": 2.0697989934050025e-05,
"loss": 0.2336,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12045073509216309,
"step": 2080,
"valid_targets_mean": 4220.2,
"valid_targets_min": 788
},
{
"epoch": 3.791628753412193,
"grad_norm": 0.5974784123285087,
"learning_rate": 2.0607371849125345e-05,
"loss": 0.2272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1365862637758255,
"step": 2085,
"valid_targets_mean": 4663.0,
"valid_targets_min": 2105
},
{
"epoch": 3.8007279344858964,
"grad_norm": 0.6015774380183622,
"learning_rate": 2.0516741282114062e-05,
"loss": 0.2324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11920566111803055,
"step": 2090,
"valid_targets_mean": 4117.2,
"valid_targets_min": 918
},
{
"epoch": 3.8098271155595995,
"grad_norm": 0.5784731444927348,
"learning_rate": 2.0426100095563132e-05,
"loss": 0.2286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11204256862401962,
"step": 2095,
"valid_targets_mean": 3581.0,
"valid_targets_min": 1857
},
{
"epoch": 3.818926296633303,
"grad_norm": 0.6283724815642847,
"learning_rate": 2.0335450152237742e-05,
"loss": 0.2348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12869086861610413,
"step": 2100,
"valid_targets_mean": 3699.2,
"valid_targets_min": 323
},
{
"epoch": 3.8280254777070066,
"grad_norm": 0.642415100550998,
"learning_rate": 2.0244793315083043e-05,
"loss": 0.2458,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14838621020317078,
"step": 2105,
"valid_targets_mean": 4103.6,
"valid_targets_min": 1857
},
{
"epoch": 3.8371246587807097,
"grad_norm": 0.611330076891204,
"learning_rate": 2.0154131447185876e-05,
"loss": 0.2371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1300453096628189,
"step": 2110,
"valid_targets_mean": 4131.9,
"valid_targets_min": 2222
},
{
"epoch": 3.846223839854413,
"grad_norm": 0.6382028796568355,
"learning_rate": 2.0063466411736447e-05,
"loss": 0.2385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12640610337257385,
"step": 2115,
"valid_targets_mean": 3200.0,
"valid_targets_min": 1079
},
{
"epoch": 3.8553230209281164,
"grad_norm": 0.592317547174707,
"learning_rate": 1.997280007199008e-05,
"loss": 0.2202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14620466530323029,
"step": 2120,
"valid_targets_mean": 4840.1,
"valid_targets_min": 2407
},
{
"epoch": 3.86442220200182,
"grad_norm": 0.5955652421896328,
"learning_rate": 1.9882134291228877e-05,
"loss": 0.2247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12693578004837036,
"step": 2125,
"valid_targets_mean": 3716.4,
"valid_targets_min": 2313
},
{
"epoch": 3.873521383075523,
"grad_norm": 0.45425164985864347,
"learning_rate": 1.9791470932723486e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06094308942556381,
"step": 2130,
"valid_targets_mean": 2929.5,
"valid_targets_min": 406
},
{
"epoch": 3.8826205641492266,
"grad_norm": 0.5746326658191223,
"learning_rate": 1.9700811859694734e-05,
"loss": 0.2153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12974999845027924,
"step": 2135,
"valid_targets_mean": 4884.5,
"valid_targets_min": 1969
},
{
"epoch": 3.8917197452229297,
"grad_norm": 0.6158150136679469,
"learning_rate": 1.961015893527541e-05,
"loss": 0.24,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1246422678232193,
"step": 2140,
"valid_targets_mean": 3744.6,
"valid_targets_min": 271
},
{
"epoch": 3.9008189262966333,
"grad_norm": 0.5134096098504591,
"learning_rate": 1.9519514022471933e-05,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10631200671195984,
"step": 2145,
"valid_targets_mean": 5187.0,
"valid_targets_min": 2402
},
{
"epoch": 3.909918107370337,
"grad_norm": 0.6462071879791262,
"learning_rate": 1.942887898412608e-05,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10570937395095825,
"step": 2150,
"valid_targets_mean": 3218.5,
"valid_targets_min": 693
},
{
"epoch": 3.91901728844404,
"grad_norm": 0.6127776684285441,
"learning_rate": 1.9338255682876682e-05,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09252439439296722,
"step": 2155,
"valid_targets_mean": 3153.1,
"valid_targets_min": 293
},
{
"epoch": 3.9281164695177435,
"grad_norm": 0.7186098539492584,
"learning_rate": 1.924764598112138e-05,
"loss": 0.2252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08831615746021271,
"step": 2160,
"valid_targets_mean": 2062.8,
"valid_targets_min": 311
},
{
"epoch": 3.9372156505914466,
"grad_norm": 0.6015779882414538,
"learning_rate": 1.9157051740978326e-05,
"loss": 0.2304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08883961290121078,
"step": 2165,
"valid_targets_mean": 2913.9,
"valid_targets_min": 866
},
{
"epoch": 3.94631483166515,
"grad_norm": 0.7661092923072249,
"learning_rate": 1.9066474824247913e-05,
"loss": 0.2451,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11353622376918793,
"step": 2170,
"valid_targets_mean": 4695.0,
"valid_targets_min": 2684
},
{
"epoch": 3.9554140127388537,
"grad_norm": 0.6358343088472361,
"learning_rate": 1.8975917092374542e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08747850358486176,
"step": 2175,
"valid_targets_mean": 2095.9,
"valid_targets_min": 246
},
{
"epoch": 3.964513193812557,
"grad_norm": 0.6356945476266306,
"learning_rate": 1.888538040640831e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10770977288484573,
"step": 2180,
"valid_targets_mean": 3358.5,
"valid_targets_min": 1388
},
{
"epoch": 3.9736123748862604,
"grad_norm": 0.4680125277198997,
"learning_rate": 1.8794866626966834e-05,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1037270575761795,
"step": 2185,
"valid_targets_mean": 6218.2,
"valid_targets_min": 979
},
{
"epoch": 3.9827115559599635,
"grad_norm": 0.561916925920865,
"learning_rate": 1.8704377614196963e-05,
"loss": 0.2209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12491119652986526,
"step": 2190,
"valid_targets_mean": 3551.0,
"valid_targets_min": 2256
},
{
"epoch": 3.991810737033667,
"grad_norm": 0.6171678094348222,
"learning_rate": 1.8613915227736584e-05,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13132691383361816,
"step": 2195,
"valid_targets_mean": 3616.2,
"valid_targets_min": 1897
},
{
"epoch": 4.0,
"grad_norm": 0.8713646274215626,
"learning_rate": 1.852348132667635e-05,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2565116882324219,
"step": 2200,
"valid_targets_mean": 3516.8,
"valid_targets_min": 820
},
{
"epoch": 4.0090991810737036,
"grad_norm": 0.7610478323964359,
"learning_rate": 1.843307776952155e-05,
"loss": 0.2054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1043773666024208,
"step": 2205,
"valid_targets_mean": 2845.2,
"valid_targets_min": 419
},
{
"epoch": 4.018198362147407,
"grad_norm": 0.6999568780697065,
"learning_rate": 1.834270641415386e-05,
"loss": 0.2276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09883319586515427,
"step": 2210,
"valid_targets_mean": 3011.8,
"valid_targets_min": 191
},
{
"epoch": 4.02729754322111,
"grad_norm": 0.639663595129245,
"learning_rate": 1.8252369117793172e-05,
"loss": 0.2078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10715536773204803,
"step": 2215,
"valid_targets_mean": 3646.4,
"valid_targets_min": 705
},
{
"epoch": 4.036396724294813,
"grad_norm": 0.6155902648302152,
"learning_rate": 1.8162067736959454e-05,
"loss": 0.2153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08828684687614441,
"step": 2220,
"valid_targets_mean": 3454.4,
"valid_targets_min": 272
},
{
"epoch": 4.045495905368517,
"grad_norm": 0.6985946692476135,
"learning_rate": 1.8071804127434545e-05,
"loss": 0.2098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11581951379776001,
"step": 2225,
"valid_targets_mean": 2963.2,
"valid_targets_min": 343
},
{
"epoch": 4.05459508644222,
"grad_norm": 0.6305907311339457,
"learning_rate": 1.7981580144224066e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1013331338763237,
"step": 2230,
"valid_targets_mean": 3289.9,
"valid_targets_min": 1675
},
{
"epoch": 4.063694267515924,
"grad_norm": 0.5757227023580752,
"learning_rate": 1.7891397641519272e-05,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08844532072544098,
"step": 2235,
"valid_targets_mean": 3442.2,
"valid_targets_min": 462
},
{
"epoch": 4.072793448589627,
"grad_norm": 0.6815233873910455,
"learning_rate": 1.7801258472658964e-05,
"loss": 0.2011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11015966534614563,
"step": 2240,
"valid_targets_mean": 3494.4,
"valid_targets_min": 1363
},
{
"epoch": 4.08189262966333,
"grad_norm": 0.5289726572096387,
"learning_rate": 1.7711164490091365e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09975562989711761,
"step": 2245,
"valid_targets_mean": 5850.0,
"valid_targets_min": 2197
},
{
"epoch": 4.090991810737034,
"grad_norm": 0.6366132972111163,
"learning_rate": 1.7621117545336098e-05,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10522039234638214,
"step": 2250,
"valid_targets_mean": 3253.4,
"valid_targets_min": 1322
},
{
"epoch": 4.100090991810737,
"grad_norm": 0.718026894601455,
"learning_rate": 1.7531119488946107e-05,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15831488370895386,
"step": 2255,
"valid_targets_mean": 4147.0,
"valid_targets_min": 2306
},
{
"epoch": 4.10919017288444,
"grad_norm": 0.6415953800163945,
"learning_rate": 1.7441172170469634e-05,
"loss": 0.208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12810300290584564,
"step": 2260,
"valid_targets_mean": 4011.8,
"valid_targets_min": 1456
},
{
"epoch": 4.1182893539581436,
"grad_norm": 0.6763238164852513,
"learning_rate": 1.7351277438412197e-05,
"loss": 0.2117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09420953691005707,
"step": 2265,
"valid_targets_mean": 2700.8,
"valid_targets_min": 443
},
{
"epoch": 4.127388535031847,
"grad_norm": 0.6513239865451258,
"learning_rate": 1.726143714019862e-05,
"loss": 0.2098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1157243549823761,
"step": 2270,
"valid_targets_mean": 3612.5,
"valid_targets_min": 258
},
{
"epoch": 4.136487716105551,
"grad_norm": 0.669251316448323,
"learning_rate": 1.7171653122135065e-05,
"loss": 0.2144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11020094156265259,
"step": 2275,
"valid_targets_mean": 3440.4,
"valid_targets_min": 411
},
{
"epoch": 4.145586897179254,
"grad_norm": 0.6459739960236776,
"learning_rate": 1.708192722937106e-05,
"loss": 0.2024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1289825737476349,
"step": 2280,
"valid_targets_mean": 4582.9,
"valid_targets_min": 1766
},
{
"epoch": 4.154686078252957,
"grad_norm": 0.5874955425165647,
"learning_rate": 1.6992261305861635e-05,
"loss": 0.2041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0869600772857666,
"step": 2285,
"valid_targets_mean": 3355.1,
"valid_targets_min": 1226
},
{
"epoch": 4.16378525932666,
"grad_norm": 0.5381128847881688,
"learning_rate": 1.6902657194329357e-05,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10084788501262665,
"step": 2290,
"valid_targets_mean": 4416.6,
"valid_targets_min": 1936
},
{
"epoch": 4.172884440400364,
"grad_norm": 0.6222544662905637,
"learning_rate": 1.681311673622651e-05,
"loss": 0.2046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07266297936439514,
"step": 2295,
"valid_targets_mean": 2939.8,
"valid_targets_min": 291
},
{
"epoch": 4.1819836214740675,
"grad_norm": 0.6319977100323101,
"learning_rate": 1.6723641771697246e-05,
"loss": 0.2067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1194155216217041,
"step": 2300,
"valid_targets_mean": 3916.6,
"valid_targets_min": 518
},
{
"epoch": 4.191082802547771,
"grad_norm": 0.591815007892247,
"learning_rate": 1.663423413953976e-05,
"loss": 0.2171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10994294285774231,
"step": 2305,
"valid_targets_mean": 4506.1,
"valid_targets_min": 1525
},
{
"epoch": 4.200181983621474,
"grad_norm": 0.6379876571697218,
"learning_rate": 1.6544895677168483e-05,
"loss": 0.2097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08801357448101044,
"step": 2310,
"valid_targets_mean": 3171.1,
"valid_targets_min": 502
},
{
"epoch": 4.209281164695177,
"grad_norm": 0.6711685746669366,
"learning_rate": 1.6455628220576357e-05,
"loss": 0.2176,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0922049880027771,
"step": 2315,
"valid_targets_mean": 3022.6,
"valid_targets_min": 335
},
{
"epoch": 4.218380345768881,
"grad_norm": 0.6513788938326086,
"learning_rate": 1.6366433604297072e-05,
"loss": 0.2042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1115066409111023,
"step": 2320,
"valid_targets_mean": 4586.1,
"valid_targets_min": 683
},
{
"epoch": 4.227479526842584,
"grad_norm": 0.6872049756707485,
"learning_rate": 1.62773136613674e-05,
"loss": 0.2183,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11089625954627991,
"step": 2325,
"valid_targets_mean": 3216.5,
"valid_targets_min": 1052
},
{
"epoch": 4.236578707916287,
"grad_norm": 0.6140058427675289,
"learning_rate": 1.6188270223289483e-05,
"loss": 0.2024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09252717345952988,
"step": 2330,
"valid_targets_mean": 3930.9,
"valid_targets_min": 2630
},
{
"epoch": 4.245677888989991,
"grad_norm": 0.5704927973308062,
"learning_rate": 1.609930511999321e-05,
"loss": 0.2008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09383821487426758,
"step": 2335,
"valid_targets_mean": 3737.4,
"valid_targets_min": 1864
},
{
"epoch": 4.254777070063694,
"grad_norm": 0.6500476887222959,
"learning_rate": 1.6010420179798623e-05,
"loss": 0.2221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10442210733890533,
"step": 2340,
"valid_targets_mean": 3499.1,
"valid_targets_min": 1180
},
{
"epoch": 4.263876251137398,
"grad_norm": 0.6077011125705658,
"learning_rate": 1.5921617229378338e-05,
"loss": 0.2113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09526053071022034,
"step": 2345,
"valid_targets_mean": 3782.8,
"valid_targets_min": 1700
},
{
"epoch": 4.272975432211101,
"grad_norm": 0.6716438775104191,
"learning_rate": 1.583289809372e-05,
"loss": 0.2147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10904216766357422,
"step": 2350,
"valid_targets_mean": 3186.6,
"valid_targets_min": 293
},
{
"epoch": 4.282074613284804,
"grad_norm": 0.6442033894228911,
"learning_rate": 1.5744264596088763e-05,
"loss": 0.2127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09692924469709396,
"step": 2355,
"valid_targets_mean": 3195.0,
"valid_targets_min": 1919
},
{
"epoch": 4.2911737943585075,
"grad_norm": 0.605259860092484,
"learning_rate": 1.5655718557989848e-05,
"loss": 0.2081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12487993389368057,
"step": 2360,
"valid_targets_mean": 4756.9,
"valid_targets_min": 174
},
{
"epoch": 4.300272975432211,
"grad_norm": 0.6012856431758457,
"learning_rate": 1.5567261799131102e-05,
"loss": 0.2041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11706040799617767,
"step": 2365,
"valid_targets_mean": 4453.1,
"valid_targets_min": 1956
},
{
"epoch": 4.309372156505915,
"grad_norm": 0.6662252762890644,
"learning_rate": 1.5478896137385584e-05,
"loss": 0.2046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11574854701757431,
"step": 2370,
"valid_targets_mean": 4047.9,
"valid_targets_min": 1240
},
{
"epoch": 4.318471337579618,
"grad_norm": 0.6949646893771946,
"learning_rate": 1.5390623388754232e-05,
"loss": 0.2171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13453787565231323,
"step": 2375,
"valid_targets_mean": 3733.9,
"valid_targets_min": 246
},
{
"epoch": 4.327570518653321,
"grad_norm": 0.6364584731603552,
"learning_rate": 1.5302445367328507e-05,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09400258213281631,
"step": 2380,
"valid_targets_mean": 3628.4,
"valid_targets_min": 2326
},
{
"epoch": 4.336669699727024,
"grad_norm": 0.6981094613137421,
"learning_rate": 1.5214363885253156e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11428219079971313,
"step": 2385,
"valid_targets_mean": 3146.9,
"valid_targets_min": 1342
},
{
"epoch": 4.345768880800728,
"grad_norm": 0.5204287394542879,
"learning_rate": 1.5126380752688934e-05,
"loss": 0.2029,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10040925443172455,
"step": 2390,
"valid_targets_mean": 5846.6,
"valid_targets_min": 1070
},
{
"epoch": 4.3548680618744315,
"grad_norm": 0.6916260441992553,
"learning_rate": 1.503849777777543e-05,
"loss": 0.2009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12089954316616058,
"step": 2395,
"valid_targets_mean": 3570.8,
"valid_targets_min": 174
},
{
"epoch": 4.363967242948135,
"grad_norm": 0.6330493436940652,
"learning_rate": 1.4950716766593872e-05,
"loss": 0.2047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11220642179250717,
"step": 2400,
"valid_targets_mean": 4110.6,
"valid_targets_min": 2053
},
{
"epoch": 4.373066424021838,
"grad_norm": 0.721664357235738,
"learning_rate": 1.4863039523130054e-05,
"loss": 0.2024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1065458357334137,
"step": 2405,
"valid_targets_mean": 3365.8,
"valid_targets_min": 643
},
{
"epoch": 4.382165605095541,
"grad_norm": 0.6645783192296282,
"learning_rate": 1.4775467849237234e-05,
"loss": 0.2137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09038594365119934,
"step": 2410,
"valid_targets_mean": 2629.5,
"valid_targets_min": 1128
},
{
"epoch": 4.391264786169245,
"grad_norm": 0.6881468289493442,
"learning_rate": 1.468800354459912e-05,
"loss": 0.2165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10560519993305206,
"step": 2415,
"valid_targets_mean": 2953.2,
"valid_targets_min": 1138
},
{
"epoch": 4.400363967242948,
"grad_norm": 0.6931148166696036,
"learning_rate": 1.4600648406692863e-05,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11844750493764877,
"step": 2420,
"valid_targets_mean": 3428.8,
"valid_targets_min": 1667
},
{
"epoch": 4.409463148316651,
"grad_norm": 0.6526904247649924,
"learning_rate": 1.451340423075214e-05,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12365461885929108,
"step": 2425,
"valid_targets_mean": 3943.5,
"valid_targets_min": 384
},
{
"epoch": 4.418562329390355,
"grad_norm": 0.6996140130562708,
"learning_rate": 1.4426272809730248e-05,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09634485095739365,
"step": 2430,
"valid_targets_mean": 3138.9,
"valid_targets_min": 348
},
{
"epoch": 4.427661510464058,
"grad_norm": 0.737117477945688,
"learning_rate": 1.433925593426326e-05,
"loss": 0.2152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10732056200504303,
"step": 2435,
"valid_targets_mean": 3061.6,
"valid_targets_min": 1399
},
{
"epoch": 4.436760691537762,
"grad_norm": 0.7083417741605627,
"learning_rate": 1.4252355392633237e-05,
"loss": 0.2129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10135871171951294,
"step": 2440,
"valid_targets_mean": 2752.9,
"valid_targets_min": 1729
},
{
"epoch": 4.445859872611465,
"grad_norm": 0.6487462790943196,
"learning_rate": 1.4165572970731435e-05,
"loss": 0.208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11768800020217896,
"step": 2445,
"valid_targets_mean": 3779.2,
"valid_targets_min": 1305
},
{
"epoch": 4.454959053685168,
"grad_norm": 0.6223053953705814,
"learning_rate": 1.4078910452021664e-05,
"loss": 0.2145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10405602306127548,
"step": 2450,
"valid_targets_mean": 3966.5,
"valid_targets_min": 1867
},
{
"epoch": 4.4640582347588715,
"grad_norm": 0.5530441312033447,
"learning_rate": 1.3992369617503594e-05,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07695738971233368,
"step": 2455,
"valid_targets_mean": 3257.8,
"valid_targets_min": 1033
},
{
"epoch": 4.473157415832575,
"grad_norm": 0.4801472386964888,
"learning_rate": 1.3905952245676173e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07861844450235367,
"step": 2460,
"valid_targets_mean": 5649.1,
"valid_targets_min": 319
},
{
"epoch": 4.482256596906279,
"grad_norm": 0.539148660231581,
"learning_rate": 1.3819660112501054e-05,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08029848337173462,
"step": 2465,
"valid_targets_mean": 3955.0,
"valid_targets_min": 479
},
{
"epoch": 4.491355777979982,
"grad_norm": 0.6401695191719436,
"learning_rate": 1.3733494991366128e-05,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09944336116313934,
"step": 2470,
"valid_targets_mean": 3213.2,
"valid_targets_min": 1200
},
{
"epoch": 4.500454959053685,
"grad_norm": 0.5262655333217622,
"learning_rate": 1.364745865304906e-05,
"loss": 0.2122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09738464653491974,
"step": 2475,
"valid_targets_mean": 4905.0,
"valid_targets_min": 1553
},
{
"epoch": 4.509554140127388,
"grad_norm": 0.6146356778717295,
"learning_rate": 1.3561552865680899e-05,
"loss": 0.2011,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10408352315425873,
"step": 2480,
"valid_targets_mean": 3832.9,
"valid_targets_min": 2663
},
{
"epoch": 4.518653321201092,
"grad_norm": 0.7659267914126828,
"learning_rate": 1.3475779394709754e-05,
"loss": 0.2134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1010979562997818,
"step": 2485,
"valid_targets_mean": 2808.4,
"valid_targets_min": 278
},
{
"epoch": 4.5277525022747955,
"grad_norm": 0.510564342275182,
"learning_rate": 1.3390140002864481e-05,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08257513493299484,
"step": 2490,
"valid_targets_mean": 4374.2,
"valid_targets_min": 288
},
{
"epoch": 4.536851683348498,
"grad_norm": 0.6523581194287932,
"learning_rate": 1.3304636450118495e-05,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08213072270154953,
"step": 2495,
"valid_targets_mean": 2523.9,
"valid_targets_min": 296
},
{
"epoch": 4.545950864422202,
"grad_norm": 0.5793152107148682,
"learning_rate": 1.3219270493653587e-05,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08051525056362152,
"step": 2500,
"valid_targets_mean": 3704.6,
"valid_targets_min": 1690
},
{
"epoch": 4.555050045495905,
"grad_norm": 0.6131550258175434,
"learning_rate": 1.3134043887823807e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09287137538194656,
"step": 2505,
"valid_targets_mean": 3077.4,
"valid_targets_min": 1546
},
{
"epoch": 4.564149226569609,
"grad_norm": 0.7031749159784869,
"learning_rate": 1.3048958384119397e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11600330471992493,
"step": 2510,
"valid_targets_mean": 3279.9,
"valid_targets_min": 234
},
{
"epoch": 4.573248407643312,
"grad_norm": 0.7014191302183409,
"learning_rate": 1.2964015731130836e-05,
"loss": 0.2081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1107967346906662,
"step": 2515,
"valid_targets_mean": 2881.2,
"valid_targets_min": 303
},
{
"epoch": 4.582347588717015,
"grad_norm": 0.6277578775645954,
"learning_rate": 1.2879217674512865e-05,
"loss": 0.2151,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09785157442092896,
"step": 2520,
"valid_targets_mean": 3342.5,
"valid_targets_min": 1204
},
{
"epoch": 4.591446769790719,
"grad_norm": 0.5777297826894398,
"learning_rate": 1.279456595694864e-05,
"loss": 0.2064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09805427491664886,
"step": 2525,
"valid_targets_mean": 3845.9,
"valid_targets_min": 2171
},
{
"epoch": 4.600545950864422,
"grad_norm": 0.6598092832045845,
"learning_rate": 1.2710062318113887e-05,
"loss": 0.2154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11755596101284027,
"step": 2530,
"valid_targets_mean": 3864.6,
"valid_targets_min": 1366
},
{
"epoch": 4.609645131938126,
"grad_norm": 0.6671458531470443,
"learning_rate": 1.2625708494641188e-05,
"loss": 0.2144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1005607545375824,
"step": 2535,
"valid_targets_mean": 3189.8,
"valid_targets_min": 281
},
{
"epoch": 4.618744313011829,
"grad_norm": 0.6140756298428148,
"learning_rate": 1.2541506220084262e-05,
"loss": 0.2042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09862984716892242,
"step": 2540,
"valid_targets_mean": 3352.1,
"valid_targets_min": 832
},
{
"epoch": 4.627843494085532,
"grad_norm": 0.6276792709672552,
"learning_rate": 1.2457457224882356e-05,
"loss": 0.2156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12656915187835693,
"step": 2545,
"valid_targets_mean": 4384.1,
"valid_targets_min": 2344
},
{
"epoch": 4.6369426751592355,
"grad_norm": 0.5611724864069938,
"learning_rate": 1.237356323632468e-05,
"loss": 0.2194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08815105259418488,
"step": 2550,
"valid_targets_mean": 3377.1,
"valid_targets_min": 844
},
{
"epoch": 4.646041856232939,
"grad_norm": 0.5969416948846179,
"learning_rate": 1.2289825978514882e-05,
"loss": 0.1953,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1119343563914299,
"step": 2555,
"valid_targets_mean": 5220.2,
"valid_targets_min": 224
},
{
"epoch": 4.655141037306643,
"grad_norm": 0.6312969359281144,
"learning_rate": 1.2206247172335662e-05,
"loss": 0.2027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10778310894966125,
"step": 2560,
"valid_targets_mean": 3573.1,
"valid_targets_min": 1281
},
{
"epoch": 4.664240218380346,
"grad_norm": 0.6080986613871091,
"learning_rate": 1.2122828535413378e-05,
"loss": 0.2196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09418709576129913,
"step": 2565,
"valid_targets_mean": 4105.8,
"valid_targets_min": 983
},
{
"epoch": 4.673339399454049,
"grad_norm": 0.5115892671372317,
"learning_rate": 1.2039571782082762e-05,
"loss": 0.1972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09335912019014359,
"step": 2570,
"valid_targets_mean": 5629.6,
"valid_targets_min": 1092
},
{
"epoch": 4.682438580527752,
"grad_norm": 0.5143277504292695,
"learning_rate": 1.1956478623351652e-05,
"loss": 0.2062,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08968564122915268,
"step": 2575,
"valid_targets_mean": 3954.0,
"valid_targets_min": 266
},
{
"epoch": 4.691537761601456,
"grad_norm": 0.5350470272834709,
"learning_rate": 1.187355076686589e-05,
"loss": 0.2192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09997965395450592,
"step": 2580,
"valid_targets_mean": 4128.8,
"valid_targets_min": 1291
},
{
"epoch": 4.7006369426751595,
"grad_norm": 0.575219861090753,
"learning_rate": 1.1790789916874172e-05,
"loss": 0.2052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09727989137172699,
"step": 2585,
"valid_targets_mean": 4808.1,
"valid_targets_min": 1380
},
{
"epoch": 4.709736123748863,
"grad_norm": 0.4802440243107621,
"learning_rate": 1.1708197774193055e-05,
"loss": 0.2034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06863594055175781,
"step": 2590,
"valid_targets_mean": 3348.6,
"valid_targets_min": 296
},
{
"epoch": 4.718835304822566,
"grad_norm": 0.6089877547455099,
"learning_rate": 1.1625776036172006e-05,
"loss": 0.2166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11346261203289032,
"step": 2595,
"valid_targets_mean": 4466.2,
"valid_targets_min": 3012
},
{
"epoch": 4.727934485896269,
"grad_norm": 0.6172209994895129,
"learning_rate": 1.1543526396658475e-05,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0995795875787735,
"step": 2600,
"valid_targets_mean": 3648.6,
"valid_targets_min": 1229
},
{
"epoch": 4.737033666969973,
"grad_norm": 0.7217327753696113,
"learning_rate": 1.1461450545963167e-05,
"loss": 0.2136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09528639167547226,
"step": 2605,
"valid_targets_mean": 2344.5,
"valid_targets_min": 882
},
{
"epoch": 4.746132848043676,
"grad_norm": 0.5818659549176181,
"learning_rate": 1.137955017082521e-05,
"loss": 0.2093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12783287465572357,
"step": 2610,
"valid_targets_mean": 5329.2,
"valid_targets_min": 2962
},
{
"epoch": 4.755232029117379,
"grad_norm": 0.6354180951281558,
"learning_rate": 1.1297826954377587e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10776399075984955,
"step": 2615,
"valid_targets_mean": 3988.8,
"valid_targets_min": 2456
},
{
"epoch": 4.764331210191083,
"grad_norm": 0.5491068184424446,
"learning_rate": 1.1216282576112436e-05,
"loss": 0.2153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08702103793621063,
"step": 2620,
"valid_targets_mean": 4804.8,
"valid_targets_min": 1155
},
{
"epoch": 4.773430391264786,
"grad_norm": 0.6451125893227769,
"learning_rate": 1.1134918711846651e-05,
"loss": 0.197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08675537258386612,
"step": 2625,
"valid_targets_mean": 3419.2,
"valid_targets_min": 1706
},
{
"epoch": 4.78252957233849,
"grad_norm": 0.47554214997356037,
"learning_rate": 1.1053737033687346e-05,
"loss": 0.1997,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11160045862197876,
"step": 2630,
"valid_targets_mean": 6470.4,
"valid_targets_min": 2796
},
{
"epoch": 4.791628753412192,
"grad_norm": 0.6647977556732426,
"learning_rate": 1.097273920999757e-05,
"loss": 0.2081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10980549454689026,
"step": 2635,
"valid_targets_mean": 3851.6,
"valid_targets_min": 1611
},
{
"epoch": 4.800727934485896,
"grad_norm": 0.7333185609047528,
"learning_rate": 1.0891926905361948e-05,
"loss": 0.206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09020430594682693,
"step": 2640,
"valid_targets_mean": 2755.9,
"valid_targets_min": 1097
},
{
"epoch": 4.8098271155595995,
"grad_norm": 0.8175132256728149,
"learning_rate": 1.081130178055251e-05,
"loss": 0.2003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10943802446126938,
"step": 2645,
"valid_targets_mean": 3038.6,
"valid_targets_min": 649
},
{
"epoch": 4.818926296633303,
"grad_norm": 0.5704955810867999,
"learning_rate": 1.0730865492494593e-05,
"loss": 0.2025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0999983698129654,
"step": 2650,
"valid_targets_mean": 3916.9,
"valid_targets_min": 530
},
{
"epoch": 4.828025477707007,
"grad_norm": 0.5812062616005016,
"learning_rate": 1.0650619694232704e-05,
"loss": 0.197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08837728202342987,
"step": 2655,
"valid_targets_mean": 4211.1,
"valid_targets_min": 1487
},
{
"epoch": 4.837124658780709,
"grad_norm": 0.6858967753840393,
"learning_rate": 1.057056603489665e-05,
"loss": 0.2221,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08689923584461212,
"step": 2660,
"valid_targets_mean": 2381.0,
"valid_targets_min": 734
},
{
"epoch": 4.846223839854413,
"grad_norm": 0.5225583496996413,
"learning_rate": 1.0490706159667534e-05,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10315491259098053,
"step": 2665,
"valid_targets_mean": 5551.4,
"valid_targets_min": 261
},
{
"epoch": 4.855323020928116,
"grad_norm": 0.6353564860251033,
"learning_rate": 1.0411041709744063e-05,
"loss": 0.2155,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10783381760120392,
"step": 2670,
"valid_targets_mean": 3868.9,
"valid_targets_min": 1684
},
{
"epoch": 4.86442220200182,
"grad_norm": 0.5953265038631231,
"learning_rate": 1.0331574322308722e-05,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1189485713839531,
"step": 2675,
"valid_targets_mean": 5104.8,
"valid_targets_min": 3054
},
{
"epoch": 4.8735213830755235,
"grad_norm": 0.6415429927593447,
"learning_rate": 1.0252305630494201e-05,
"loss": 0.2154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12192051112651825,
"step": 2680,
"valid_targets_mean": 4007.9,
"valid_targets_min": 2307
},
{
"epoch": 4.882620564149226,
"grad_norm": 0.6184392622335321,
"learning_rate": 1.0173237263349776e-05,
"loss": 0.218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11877385526895523,
"step": 2685,
"valid_targets_mean": 4085.5,
"valid_targets_min": 2538
},
{
"epoch": 4.89171974522293,
"grad_norm": 0.7931778991412655,
"learning_rate": 1.0094370845807857e-05,
"loss": 0.2072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08358285576105118,
"step": 2690,
"valid_targets_mean": 3763.9,
"valid_targets_min": 862
},
{
"epoch": 4.900818926296633,
"grad_norm": 0.6311410360214902,
"learning_rate": 1.001570799865061e-05,
"loss": 0.2087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11487400531768799,
"step": 2695,
"valid_targets_mean": 4217.5,
"valid_targets_min": 1774
},
{
"epoch": 4.909918107370337,
"grad_norm": 0.7140049951695571,
"learning_rate": 9.937250338476607e-06,
"loss": 0.2025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10089785605669022,
"step": 2700,
"valid_targets_mean": 3144.9,
"valid_targets_min": 270
},
{
"epoch": 4.91901728844404,
"grad_norm": 0.6106766257514653,
"learning_rate": 9.858999477667656e-06,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11438564956188202,
"step": 2705,
"valid_targets_mean": 4361.9,
"valid_targets_min": 2272
},
{
"epoch": 4.928116469517743,
"grad_norm": 0.6079273725174243,
"learning_rate": 9.780957024355591e-06,
"loss": 0.2153,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12418875843286514,
"step": 2710,
"valid_targets_mean": 4085.1,
"valid_targets_min": 1507
},
{
"epoch": 4.937215650591447,
"grad_norm": 0.6640440215081552,
"learning_rate": 9.703124582389312e-06,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10496009886264801,
"step": 2715,
"valid_targets_mean": 3474.0,
"valid_targets_min": 623
},
{
"epoch": 4.94631483166515,
"grad_norm": 0.5074954317268019,
"learning_rate": 9.62550375130175e-06,
"loss": 0.2095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11362551897764206,
"step": 2720,
"valid_targets_mean": 6144.5,
"valid_targets_min": 2101
},
{
"epoch": 4.955414012738854,
"grad_norm": 0.6141137566846254,
"learning_rate": 9.548096126277058e-06,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10736232250928879,
"step": 2725,
"valid_targets_mean": 4007.6,
"valid_targets_min": 782
},
{
"epoch": 4.964513193812557,
"grad_norm": 0.7037671666670862,
"learning_rate": 9.470903298117744e-06,
"loss": 0.2149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08674223721027374,
"step": 2730,
"valid_targets_mean": 2620.1,
"valid_targets_min": 503
},
{
"epoch": 4.97361237488626,
"grad_norm": 0.6720492919968285,
"learning_rate": 9.393926853212083e-06,
"loss": 0.222,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09978747367858887,
"step": 2735,
"valid_targets_mean": 2898.4,
"valid_targets_min": 312
},
{
"epoch": 4.9827115559599635,
"grad_norm": 0.6640282659720391,
"learning_rate": 9.317168373501426e-06,
"loss": 0.2098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12521491944789886,
"step": 2740,
"valid_targets_mean": 3868.2,
"valid_targets_min": 717
},
{
"epoch": 4.991810737033667,
"grad_norm": 0.639234313775148,
"learning_rate": 9.240629436447752e-06,
"loss": 0.2084,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10244851559400558,
"step": 2745,
"valid_targets_mean": 3245.0,
"valid_targets_min": 1846
},
{
"epoch": 5.0,
"grad_norm": 0.8400368899966859,
"learning_rate": 9.164311615001202e-06,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21654963493347168,
"step": 2750,
"valid_targets_mean": 4341.1,
"valid_targets_min": 2991
},
{
"epoch": 5.0090991810737036,
"grad_norm": 0.6599564352988212,
"learning_rate": 9.08821647756778e-06,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09215378761291504,
"step": 2755,
"valid_targets_mean": 3409.8,
"valid_targets_min": 1066
},
{
"epoch": 5.018198362147407,
"grad_norm": 0.6391140878318657,
"learning_rate": 9.012345587977129e-06,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10837959498167038,
"step": 2760,
"valid_targets_mean": 3909.9,
"valid_targets_min": 1191
},
{
"epoch": 5.02729754322111,
"grad_norm": 0.6596315232469888,
"learning_rate": 8.936700505450356e-06,
"loss": 0.1846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0778820738196373,
"step": 2765,
"valid_targets_mean": 3222.8,
"valid_targets_min": 651
},
{
"epoch": 5.036396724294813,
"grad_norm": 0.6659317308109189,
"learning_rate": 8.861282784568045e-06,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09588353335857391,
"step": 2770,
"valid_targets_mean": 3816.9,
"valid_targets_min": 1487
},
{
"epoch": 5.045495905368517,
"grad_norm": 0.6408446103459217,
"learning_rate": 8.786093975238226e-06,
"loss": 0.1828,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10558507591485977,
"step": 2775,
"valid_targets_mean": 3739.4,
"valid_targets_min": 905
},
{
"epoch": 5.05459508644222,
"grad_norm": 0.6889473769582733,
"learning_rate": 8.711135622664622e-06,
"loss": 0.2025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09545275568962097,
"step": 2780,
"valid_targets_mean": 3136.0,
"valid_targets_min": 774
},
{
"epoch": 5.063694267515924,
"grad_norm": 0.6209629716703886,
"learning_rate": 8.636409267314806e-06,
"loss": 0.1969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11099449545145035,
"step": 2785,
"valid_targets_mean": 4257.4,
"valid_targets_min": 2079
},
{
"epoch": 5.072793448589627,
"grad_norm": 0.7331847549756079,
"learning_rate": 8.561916444888618e-06,
"loss": 0.1865,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07423612475395203,
"step": 2790,
"valid_targets_mean": 2260.2,
"valid_targets_min": 532
},
{
"epoch": 5.08189262966333,
"grad_norm": 0.6779516599757347,
"learning_rate": 8.487658686286533e-06,
"loss": 0.194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08769124746322632,
"step": 2795,
"valid_targets_mean": 3655.4,
"valid_targets_min": 1305
},
{
"epoch": 5.090991810737034,
"grad_norm": 0.5999220678378101,
"learning_rate": 8.413637517578246e-06,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07237271219491959,
"step": 2800,
"valid_targets_mean": 2676.8,
"valid_targets_min": 906
},
{
"epoch": 5.100090991810737,
"grad_norm": 0.644834454156687,
"learning_rate": 8.339854459971313e-06,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11657403409481049,
"step": 2805,
"valid_targets_mean": 4839.6,
"valid_targets_min": 2415
},
{
"epoch": 5.10919017288444,
"grad_norm": 0.7045688864470244,
"learning_rate": 8.266311029779843e-06,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1073337197303772,
"step": 2810,
"valid_targets_mean": 3931.5,
"valid_targets_min": 1637
},
{
"epoch": 5.1182893539581436,
"grad_norm": 0.565876863581839,
"learning_rate": 8.193008738393409e-06,
"loss": 0.1926,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0898812934756279,
"step": 2815,
"valid_targets_mean": 4452.4,
"valid_targets_min": 1995
},
{
"epoch": 5.127388535031847,
"grad_norm": 0.6506292732182613,
"learning_rate": 8.119949092245893e-06,
"loss": 0.1915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11412489414215088,
"step": 2820,
"valid_targets_mean": 4151.5,
"valid_targets_min": 1833
},
{
"epoch": 5.136487716105551,
"grad_norm": 0.5027182726275019,
"learning_rate": 8.047133592784626e-06,
"loss": 0.1777,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.052972182631492615,
"step": 2825,
"valid_targets_mean": 2347.1,
"valid_targets_min": 1377
},
{
"epoch": 5.145586897179254,
"grad_norm": 0.6458372413032774,
"learning_rate": 7.974563736439454e-06,
"loss": 0.1962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10185573995113373,
"step": 2830,
"valid_targets_mean": 3600.2,
"valid_targets_min": 1398
},
{
"epoch": 5.154686078252957,
"grad_norm": 0.6506764230442754,
"learning_rate": 7.902241014592042e-06,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10488687455654144,
"step": 2835,
"valid_targets_mean": 4610.5,
"valid_targets_min": 1416
},
{
"epoch": 5.16378525932666,
"grad_norm": 0.6436541968180498,
"learning_rate": 7.830166913545181e-06,
"loss": 0.1921,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09069611132144928,
"step": 2840,
"valid_targets_mean": 3433.5,
"valid_targets_min": 505
},
{
"epoch": 5.172884440400364,
"grad_norm": 0.4626395887872623,
"learning_rate": 7.758342914492257e-06,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06200661510229111,
"step": 2845,
"valid_targets_mean": 3226.2,
"valid_targets_min": 2125
},
{
"epoch": 5.1819836214740675,
"grad_norm": 0.7215464420250767,
"learning_rate": 7.686770493486835e-06,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1292155385017395,
"step": 2850,
"valid_targets_mean": 4119.8,
"valid_targets_min": 3043
},
{
"epoch": 5.191082802547771,
"grad_norm": 0.7567338525506948,
"learning_rate": 7.615451121412285e-06,
"loss": 0.2044,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09649307280778885,
"step": 2855,
"valid_targets_mean": 2608.2,
"valid_targets_min": 1653
},
{
"epoch": 5.200181983621474,
"grad_norm": 0.5615329874332277,
"learning_rate": 7.5443862639516e-06,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08881063759326935,
"step": 2860,
"valid_targets_mean": 4857.6,
"valid_targets_min": 1486
},
{
"epoch": 5.209281164695177,
"grad_norm": 0.6474968897106395,
"learning_rate": 7.4735773815572044e-06,
"loss": 0.1996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08092313259840012,
"step": 2865,
"valid_targets_mean": 3331.4,
"valid_targets_min": 1751
},
{
"epoch": 5.218380345768881,
"grad_norm": 0.7512014770821924,
"learning_rate": 7.403025929421026e-06,
"loss": 0.1935,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10584090650081635,
"step": 2870,
"valid_targets_mean": 3191.8,
"valid_targets_min": 418
},
{
"epoch": 5.227479526842584,
"grad_norm": 0.6171676317926769,
"learning_rate": 7.332733357444524e-06,
"loss": 0.1915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.101641945540905,
"step": 2875,
"valid_targets_mean": 4167.4,
"valid_targets_min": 1878
},
{
"epoch": 5.236578707916287,
"grad_norm": 0.6090694716523611,
"learning_rate": 7.262701110208936e-06,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1275119036436081,
"step": 2880,
"valid_targets_mean": 4991.8,
"valid_targets_min": 1623
},
{
"epoch": 5.245677888989991,
"grad_norm": 0.6487776113260872,
"learning_rate": 7.192930626945556e-06,
"loss": 0.1875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11216533184051514,
"step": 2885,
"valid_targets_mean": 4438.9,
"valid_targets_min": 287
},
{
"epoch": 5.254777070063694,
"grad_norm": 0.6935423881379369,
"learning_rate": 7.123423341506168e-06,
"loss": 0.1843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.13863793015480042,
"step": 2890,
"valid_targets_mean": 4484.0,
"valid_targets_min": 1794
},
{
"epoch": 5.263876251137398,
"grad_norm": 0.7180859077507289,
"learning_rate": 7.054180682333602e-06,
"loss": 0.2006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11712032556533813,
"step": 2895,
"valid_targets_mean": 3767.9,
"valid_targets_min": 826
},
{
"epoch": 5.272975432211101,
"grad_norm": 0.8564178897094312,
"learning_rate": 6.985204072432348e-06,
"loss": 0.1836,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10308965295553207,
"step": 2900,
"valid_targets_mean": 3870.2,
"valid_targets_min": 315
},
{
"epoch": 5.282074613284804,
"grad_norm": 0.6990237305747672,
"learning_rate": 6.916494929339315e-06,
"loss": 0.1856,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09179669618606567,
"step": 2905,
"valid_targets_mean": 3426.9,
"valid_targets_min": 2150
},
{
"epoch": 5.2911737943585075,
"grad_norm": 0.6611162751423953,
"learning_rate": 6.848054665094714e-06,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10533514618873596,
"step": 2910,
"valid_targets_mean": 4009.6,
"valid_targets_min": 2796
},
{
"epoch": 5.300272975432211,
"grad_norm": 0.632945921815168,
"learning_rate": 6.779884686213043e-06,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08963876217603683,
"step": 2915,
"valid_targets_mean": 3893.6,
"valid_targets_min": 2795
},
{
"epoch": 5.309372156505915,
"grad_norm": 0.658709053791018,
"learning_rate": 6.71198639365415e-06,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09715458005666733,
"step": 2920,
"valid_targets_mean": 4235.1,
"valid_targets_min": 2097
},
{
"epoch": 5.318471337579618,
"grad_norm": 0.6250400516126823,
"learning_rate": 6.644361182794494e-06,
"loss": 0.2024,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0602688193321228,
"step": 2925,
"valid_targets_mean": 2938.6,
"valid_targets_min": 307
},
{
"epoch": 5.327570518653321,
"grad_norm": 0.55876772270244,
"learning_rate": 6.577010443398388e-06,
"loss": 0.1906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11603139340877533,
"step": 2930,
"valid_targets_mean": 4585.6,
"valid_targets_min": 2899
},
{
"epoch": 5.336669699727024,
"grad_norm": 0.9315616265660619,
"learning_rate": 6.50993555958954e-06,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12010517716407776,
"step": 2935,
"valid_targets_mean": 3430.1,
"valid_targets_min": 316
},
{
"epoch": 5.345768880800728,
"grad_norm": 0.7204613647012345,
"learning_rate": 6.4431379098225185e-06,
"loss": 0.1951,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10857885330915451,
"step": 2940,
"valid_targets_mean": 2946.4,
"valid_targets_min": 1170
},
{
"epoch": 5.3548680618744315,
"grad_norm": 0.6296169963119035,
"learning_rate": 6.376618866854485e-06,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11538192629814148,
"step": 2945,
"valid_targets_mean": 4234.2,
"valid_targets_min": 2754
},
{
"epoch": 5.363967242948135,
"grad_norm": 0.6054462885658843,
"learning_rate": 6.310379797716946e-06,
"loss": 0.1772,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09557513147592545,
"step": 2950,
"valid_targets_mean": 3620.1,
"valid_targets_min": 2284
},
{
"epoch": 5.373066424021838,
"grad_norm": 0.654527494183749,
"learning_rate": 6.24442206368766e-06,
"loss": 0.1811,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10764510929584503,
"step": 2955,
"valid_targets_mean": 4421.6,
"valid_targets_min": 2417
},
{
"epoch": 5.382165605095541,
"grad_norm": 0.5786089054473685,
"learning_rate": 6.178747020262708e-06,
"loss": 0.1905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08632392436265945,
"step": 2960,
"valid_targets_mean": 4199.2,
"valid_targets_min": 2021
},
{
"epoch": 5.391264786169245,
"grad_norm": 0.6546097104084383,
"learning_rate": 6.1133560171285625e-06,
"loss": 0.1891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1134294718503952,
"step": 2965,
"valid_targets_mean": 4297.5,
"valid_targets_min": 373
},
{
"epoch": 5.400363967242948,
"grad_norm": 0.6646922900616847,
"learning_rate": 6.04825039813443e-06,
"loss": 0.197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11780969798564911,
"step": 2970,
"valid_targets_mean": 3949.9,
"valid_targets_min": 2606
},
{
"epoch": 5.409463148316651,
"grad_norm": 0.7577811833468597,
"learning_rate": 5.983431501264545e-06,
"loss": 0.1966,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11065106838941574,
"step": 2975,
"valid_targets_mean": 3088.9,
"valid_targets_min": 146
},
{
"epoch": 5.418562329390355,
"grad_norm": 0.7097525789137502,
"learning_rate": 5.918900658610765e-06,
"loss": 0.1897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08051986992359161,
"step": 2980,
"valid_targets_mean": 2664.9,
"valid_targets_min": 1134
},
{
"epoch": 5.427661510464058,
"grad_norm": 0.6710138217823898,
"learning_rate": 5.8546591963451226e-06,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11588048934936523,
"step": 2985,
"valid_targets_mean": 4215.2,
"valid_targets_min": 570
},
{
"epoch": 5.436760691537762,
"grad_norm": 0.6354446709712156,
"learning_rate": 5.790708434692627e-06,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09757719933986664,
"step": 2990,
"valid_targets_mean": 4249.8,
"valid_targets_min": 562
},
{
"epoch": 5.445859872611465,
"grad_norm": 0.7042148180116533,
"learning_rate": 5.727049687904076e-06,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12138056755065918,
"step": 2995,
"valid_targets_mean": 3693.6,
"valid_targets_min": 324
},
{
"epoch": 5.454959053685168,
"grad_norm": 0.7040724026167792,
"learning_rate": 5.66368426422909e-06,
"loss": 0.1847,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08605970442295074,
"step": 3000,
"valid_targets_mean": 3419.9,
"valid_targets_min": 1530
},
{
"epoch": 5.4640582347588715,
"grad_norm": 0.6446010445583191,
"learning_rate": 5.60061346588922e-06,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09227697551250458,
"step": 3005,
"valid_targets_mean": 3576.0,
"valid_targets_min": 963
},
{
"epoch": 5.473157415832575,
"grad_norm": 0.6732664608100785,
"learning_rate": 5.537838589051155e-06,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09739650785923004,
"step": 3010,
"valid_targets_mean": 3776.4,
"valid_targets_min": 1882
},
{
"epoch": 5.482256596906279,
"grad_norm": 0.7452964277656658,
"learning_rate": 5.475360923800141e-06,
"loss": 0.2027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10715839266777039,
"step": 3015,
"valid_targets_mean": 3063.9,
"valid_targets_min": 1229
},
{
"epoch": 5.491355777979982,
"grad_norm": 0.6107630351697494,
"learning_rate": 5.413181754113392e-06,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0687195211648941,
"step": 3020,
"valid_targets_mean": 3125.1,
"valid_targets_min": 1139
},
{
"epoch": 5.500454959053685,
"grad_norm": 0.7590005159280938,
"learning_rate": 5.351302357833785e-06,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11881700158119202,
"step": 3025,
"valid_targets_mean": 3752.2,
"valid_targets_min": 1901
},
{
"epoch": 5.509554140127388,
"grad_norm": 0.6632847021155858,
"learning_rate": 5.289724006643529e-06,
"loss": 0.1845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08095594495534897,
"step": 3030,
"valid_targets_mean": 3555.4,
"valid_targets_min": 282
},
{
"epoch": 5.518653321201092,
"grad_norm": 0.7147244658894554,
"learning_rate": 5.2284479660380906e-06,
"loss": 0.1991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1063327044248581,
"step": 3035,
"valid_targets_mean": 3433.1,
"valid_targets_min": 863
},
{
"epoch": 5.5277525022747955,
"grad_norm": 0.6674123109790042,
"learning_rate": 5.167475495300134e-06,
"loss": 0.1872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08822742849588394,
"step": 3040,
"valid_targets_mean": 3217.4,
"valid_targets_min": 184
},
{
"epoch": 5.536851683348498,
"grad_norm": 0.7927516257807617,
"learning_rate": 5.1068078474736695e-06,
"loss": 0.1934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08748479187488556,
"step": 3045,
"valid_targets_mean": 2495.0,
"valid_targets_min": 341
},
{
"epoch": 5.545950864422202,
"grad_norm": 0.6092514194762859,
"learning_rate": 5.046446269338314e-06,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07830236107110977,
"step": 3050,
"valid_targets_mean": 3540.8,
"valid_targets_min": 1729
},
{
"epoch": 5.555050045495905,
"grad_norm": 0.6198263788192565,
"learning_rate": 4.986392001383633e-06,
"loss": 0.2015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08909077942371368,
"step": 3055,
"valid_targets_mean": 3665.4,
"valid_targets_min": 2018
},
{
"epoch": 5.564149226569609,
"grad_norm": 0.6063356340051946,
"learning_rate": 4.926646277783675e-06,
"loss": 0.2002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11191258579492569,
"step": 3060,
"valid_targets_mean": 4533.5,
"valid_targets_min": 2212
},
{
"epoch": 5.573248407643312,
"grad_norm": 0.6174222418189697,
"learning_rate": 4.867210326371596e-06,
"loss": 0.1987,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10383233428001404,
"step": 3065,
"valid_targets_mean": 3871.8,
"valid_targets_min": 934
},
{
"epoch": 5.582347588717015,
"grad_norm": 0.6672351852695292,
"learning_rate": 4.808085368614441e-06,
"loss": 0.1917,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08448068797588348,
"step": 3070,
"valid_targets_mean": 3447.0,
"valid_targets_min": 2571
},
{
"epoch": 5.591446769790719,
"grad_norm": 0.6342439680320546,
"learning_rate": 4.74927261958801e-06,
"loss": 0.1853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09464578330516815,
"step": 3075,
"valid_targets_mean": 4008.8,
"valid_targets_min": 2600
},
{
"epoch": 5.600545950864422,
"grad_norm": 0.5561239465486564,
"learning_rate": 4.690773287951942e-06,
"loss": 0.1875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10652168095111847,
"step": 3080,
"valid_targets_mean": 6017.8,
"valid_targets_min": 617
},
{
"epoch": 5.609645131938126,
"grad_norm": 0.6579389422471904,
"learning_rate": 4.632588575924795e-06,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07432182878255844,
"step": 3085,
"valid_targets_mean": 3037.5,
"valid_targets_min": 830
},
{
"epoch": 5.618744313011829,
"grad_norm": 0.6928933643318304,
"learning_rate": 4.574719679259425e-06,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0847567692399025,
"step": 3090,
"valid_targets_mean": 2883.1,
"valid_targets_min": 1811
},
{
"epoch": 5.627843494085532,
"grad_norm": 0.6665338076859805,
"learning_rate": 4.5171677872183506e-06,
"loss": 0.182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11493894457817078,
"step": 3095,
"valid_targets_mean": 4355.8,
"valid_targets_min": 2402
},
{
"epoch": 5.6369426751592355,
"grad_norm": 0.6558712450079212,
"learning_rate": 4.459934082549353e-06,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07048974186182022,
"step": 3100,
"valid_targets_mean": 2948.5,
"valid_targets_min": 303
},
{
"epoch": 5.646041856232939,
"grad_norm": 0.7512626734457848,
"learning_rate": 4.4030197414611344e-06,
"loss": 0.1861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08836065977811813,
"step": 3105,
"valid_targets_mean": 2718.9,
"valid_targets_min": 328
},
{
"epoch": 5.655141037306643,
"grad_norm": 0.584447343787106,
"learning_rate": 4.346425933599165e-06,
"loss": 0.1932,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09327764809131622,
"step": 3110,
"valid_targets_mean": 4604.0,
"valid_targets_min": 2483
},
{
"epoch": 5.664240218380346,
"grad_norm": 0.7012629818494418,
"learning_rate": 4.2901538220216565e-06,
"loss": 0.1861,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1240246444940567,
"step": 3115,
"valid_targets_mean": 3864.8,
"valid_targets_min": 1696
},
{
"epoch": 5.673339399454049,
"grad_norm": 0.6818751320160401,
"learning_rate": 4.234204563175625e-06,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11969830095767975,
"step": 3120,
"valid_targets_mean": 4422.2,
"valid_targets_min": 1399
},
{
"epoch": 5.682438580527752,
"grad_norm": 0.6243267919910356,
"learning_rate": 4.17857930687318e-06,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0908406525850296,
"step": 3125,
"valid_targets_mean": 3557.4,
"valid_targets_min": 1688
},
{
"epoch": 5.691537761601456,
"grad_norm": 0.6263500654494952,
"learning_rate": 4.123279196267815e-06,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10891071707010269,
"step": 3130,
"valid_targets_mean": 4622.1,
"valid_targets_min": 2885
},
{
"epoch": 5.7006369426751595,
"grad_norm": 0.5071756770136553,
"learning_rate": 4.068305367831002e-06,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08039593696594238,
"step": 3135,
"valid_targets_mean": 6038.0,
"valid_targets_min": 2348
},
{
"epoch": 5.709736123748863,
"grad_norm": 0.4614868119067622,
"learning_rate": 4.013658951328769e-06,
"loss": 0.1804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0638853907585144,
"step": 3140,
"valid_targets_mean": 4969.6,
"valid_targets_min": 1838
},
{
"epoch": 5.718835304822566,
"grad_norm": 0.6146918657528648,
"learning_rate": 3.95934106979853e-06,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08923767507076263,
"step": 3145,
"valid_targets_mean": 3871.9,
"valid_targets_min": 1397
},
{
"epoch": 5.727934485896269,
"grad_norm": 0.6962786938805647,
"learning_rate": 3.905352839525962e-06,
"loss": 0.1822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10900229960680008,
"step": 3150,
"valid_targets_mean": 3616.6,
"valid_targets_min": 2038
},
{
"epoch": 5.737033666969973,
"grad_norm": 0.8242667170719575,
"learning_rate": 3.851695370022093e-06,
"loss": 0.2048,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11732503771781921,
"step": 3155,
"valid_targets_mean": 2471.9,
"valid_targets_min": 981
},
{
"epoch": 5.746132848043676,
"grad_norm": 0.514853122363082,
"learning_rate": 3.7983697640005048e-06,
"loss": 0.1789,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06776493042707443,
"step": 3160,
"valid_targets_mean": 5999.6,
"valid_targets_min": 1698
},
{
"epoch": 5.755232029117379,
"grad_norm": 0.6973901617447613,
"learning_rate": 3.7453771173546426e-06,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10990776866674423,
"step": 3165,
"valid_targets_mean": 3826.5,
"valid_targets_min": 1536
},
{
"epoch": 5.764331210191083,
"grad_norm": 0.7899673614884827,
"learning_rate": 3.6927185191353188e-06,
"loss": 0.1889,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10077675431966782,
"step": 3170,
"valid_targets_mean": 2454.1,
"valid_targets_min": 296
},
{
"epoch": 5.773430391264786,
"grad_norm": 0.7435936878316338,
"learning_rate": 3.640395051528316e-06,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10760288685560226,
"step": 3175,
"valid_targets_mean": 3099.8,
"valid_targets_min": 479
},
{
"epoch": 5.78252957233849,
"grad_norm": 0.5855128837104117,
"learning_rate": 3.5884077898321713e-06,
"loss": 0.1808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08257067948579788,
"step": 3180,
"valid_targets_mean": 4963.6,
"valid_targets_min": 1282
},
{
"epoch": 5.791628753412192,
"grad_norm": 0.73223681822564,
"learning_rate": 3.536757802436039e-06,
"loss": 0.1711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10566624999046326,
"step": 3185,
"valid_targets_mean": 4045.1,
"valid_targets_min": 2082
},
{
"epoch": 5.800727934485896,
"grad_norm": 0.8342270549063188,
"learning_rate": 3.4854461507977776e-06,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1105557456612587,
"step": 3190,
"valid_targets_mean": 3795.4,
"valid_targets_min": 1844
},
{
"epoch": 5.8098271155595995,
"grad_norm": 0.7488071230149675,
"learning_rate": 3.4344738894220964e-06,
"loss": 0.1927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09993422031402588,
"step": 3195,
"valid_targets_mean": 2751.0,
"valid_targets_min": 304
},
{
"epoch": 5.818926296633303,
"grad_norm": 0.6527632692808096,
"learning_rate": 3.383842065838907e-06,
"loss": 0.1952,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08624714612960815,
"step": 3200,
"valid_targets_mean": 4010.1,
"valid_targets_min": 656
},
{
"epoch": 5.828025477707007,
"grad_norm": 0.7057227913605232,
"learning_rate": 3.3335517205818e-06,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1098092719912529,
"step": 3205,
"valid_targets_mean": 3173.8,
"valid_targets_min": 306
},
{
"epoch": 5.837124658780709,
"grad_norm": 0.7498429878517248,
"learning_rate": 3.2836038871666444e-06,
"loss": 0.1941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09733176231384277,
"step": 3210,
"valid_targets_mean": 2920.4,
"valid_targets_min": 323
},
{
"epoch": 5.846223839854413,
"grad_norm": 0.7678861288920167,
"learning_rate": 3.2339995920703517e-06,
"loss": 0.1943,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09264662861824036,
"step": 3215,
"valid_targets_mean": 2972.4,
"valid_targets_min": 432
},
{
"epoch": 5.855323020928116,
"grad_norm": 0.7126042337111156,
"learning_rate": 3.184739854709784e-06,
"loss": 0.1908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09754851460456848,
"step": 3220,
"valid_targets_mean": 2903.9,
"valid_targets_min": 378
},
{
"epoch": 5.86442220200182,
"grad_norm": 0.5870517895385682,
"learning_rate": 3.1358256874208214e-06,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07877151668071747,
"step": 3225,
"valid_targets_mean": 4363.0,
"valid_targets_min": 2095
},
{
"epoch": 5.8735213830755235,
"grad_norm": 0.41510201360538945,
"learning_rate": 3.0872580954375177e-06,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06783401966094971,
"step": 3230,
"valid_targets_mean": 6266.4,
"valid_targets_min": 220
},
{
"epoch": 5.882620564149226,
"grad_norm": 0.81215723384434,
"learning_rate": 3.039038076871481e-06,
"loss": 0.2001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10604351758956909,
"step": 3235,
"valid_targets_mean": 2252.6,
"valid_targets_min": 330
},
{
"epoch": 5.89171974522293,
"grad_norm": 0.6607354187702422,
"learning_rate": 2.9911666226913374e-06,
"loss": 0.184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10948610305786133,
"step": 3240,
"valid_targets_mean": 3968.1,
"valid_targets_min": 2753
},
{
"epoch": 5.900818926296633,
"grad_norm": 0.7603934954380941,
"learning_rate": 2.9436447167023674e-06,
"loss": 0.1972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0869530588388443,
"step": 3245,
"valid_targets_mean": 2893.4,
"valid_targets_min": 1586
},
{
"epoch": 5.909918107370337,
"grad_norm": 0.688654887024806,
"learning_rate": 2.896473335526313e-06,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10053776204586029,
"step": 3250,
"valid_targets_mean": 3450.5,
"valid_targets_min": 1140
},
{
"epoch": 5.91901728844404,
"grad_norm": 0.5557339400861658,
"learning_rate": 2.849653448581271e-06,
"loss": 0.2019,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09264858812093735,
"step": 3255,
"valid_targets_mean": 5173.5,
"valid_targets_min": 3253
},
{
"epoch": 5.928116469517743,
"grad_norm": 0.7416951109335438,
"learning_rate": 2.8031860180617898e-06,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08064906299114227,
"step": 3260,
"valid_targets_mean": 2143.0,
"valid_targets_min": 321
},
{
"epoch": 5.937215650591447,
"grad_norm": 0.6806462407891796,
"learning_rate": 2.757071998919094e-06,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08997666835784912,
"step": 3265,
"valid_targets_mean": 3098.5,
"valid_targets_min": 1426
},
{
"epoch": 5.94631483166515,
"grad_norm": 0.9457363421014185,
"learning_rate": 2.7113123388414674e-06,
"loss": 0.1798,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10374726355075836,
"step": 3270,
"valid_targets_mean": 3998.0,
"valid_targets_min": 1284
},
{
"epoch": 5.955414012738854,
"grad_norm": 0.6333595915046111,
"learning_rate": 2.665907978234754e-06,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0839000940322876,
"step": 3275,
"valid_targets_mean": 3718.5,
"valid_targets_min": 1549
},
{
"epoch": 5.964513193812557,
"grad_norm": 0.6317391914040702,
"learning_rate": 2.6208598502030546e-06,
"loss": 0.2124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07819197326898575,
"step": 3280,
"valid_targets_mean": 3617.8,
"valid_targets_min": 324
},
{
"epoch": 5.97361237488626,
"grad_norm": 0.7013649236653172,
"learning_rate": 2.5761688805295305e-06,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08413440734148026,
"step": 3285,
"valid_targets_mean": 4389.9,
"valid_targets_min": 1822
},
{
"epoch": 5.9827115559599635,
"grad_norm": 0.6373036325583057,
"learning_rate": 2.531835987657407e-06,
"loss": 0.1948,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08172917366027832,
"step": 3290,
"valid_targets_mean": 3622.1,
"valid_targets_min": 1142
},
{
"epoch": 5.991810737033667,
"grad_norm": 0.6456213843152628,
"learning_rate": 2.487862082671064e-06,
"loss": 0.1954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10779787600040436,
"step": 3295,
"valid_targets_mean": 4613.9,
"valid_targets_min": 2582
},
{
"epoch": 6.0,
"grad_norm": 0.9311049045037445,
"learning_rate": 2.4442480692773398e-06,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20936749875545502,
"step": 3300,
"valid_targets_mean": 4251.6,
"valid_targets_min": 1194
},
{
"epoch": 6.0090991810737036,
"grad_norm": 0.6630710786735985,
"learning_rate": 2.400994843786939e-06,
"loss": 0.1874,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10251843929290771,
"step": 3305,
"valid_targets_mean": 3764.8,
"valid_targets_min": 2661
},
{
"epoch": 6.018198362147407,
"grad_norm": 0.7119618968014333,
"learning_rate": 2.3581032950960215e-06,
"loss": 0.1806,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10553539544343948,
"step": 3310,
"valid_targets_mean": 3514.8,
"valid_targets_min": 284
},
{
"epoch": 6.02729754322111,
"grad_norm": 0.6316945505068378,
"learning_rate": 2.3155743046679468e-06,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07232202589511871,
"step": 3315,
"valid_targets_mean": 2813.9,
"valid_targets_min": 450
},
{
"epoch": 6.036396724294813,
"grad_norm": 0.7284470744983149,
"learning_rate": 2.273408746515133e-06,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10341562330722809,
"step": 3320,
"valid_targets_mean": 3263.8,
"valid_targets_min": 1226
},
{
"epoch": 6.045495905368517,
"grad_norm": 0.6753238887882468,
"learning_rate": 2.2316074871811157e-06,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11383339017629623,
"step": 3325,
"valid_targets_mean": 4718.8,
"valid_targets_min": 1925
},
{
"epoch": 6.05459508644222,
"grad_norm": 0.79171407891943,
"learning_rate": 2.190171385722726e-06,
"loss": 0.1837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.120953768491745,
"step": 3330,
"valid_targets_mean": 3292.0,
"valid_targets_min": 1226
},
{
"epoch": 6.063694267515924,
"grad_norm": 0.7571964417090677,
"learning_rate": 2.1491012936924548e-06,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10194280743598938,
"step": 3335,
"valid_targets_mean": 3252.8,
"valid_targets_min": 1129
},
{
"epoch": 6.072793448589627,
"grad_norm": 0.6462489524858733,
"learning_rate": 2.108398055120926e-06,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09468749165534973,
"step": 3340,
"valid_targets_mean": 4044.8,
"valid_targets_min": 2258
},
{
"epoch": 6.08189262966333,
"grad_norm": 0.6329963807730029,
"learning_rate": 2.068062506499584e-06,
"loss": 0.1938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09946207702159882,
"step": 3345,
"valid_targets_mean": 4238.4,
"valid_targets_min": 3247
},
{
"epoch": 6.090991810737034,
"grad_norm": 0.6534737467236128,
"learning_rate": 2.0280954767634674e-06,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1006544977426529,
"step": 3350,
"valid_targets_mean": 4195.1,
"valid_targets_min": 3324
},
{
"epoch": 6.100090991810737,
"grad_norm": 0.6084808914799551,
"learning_rate": 1.988497787274195e-06,
"loss": 0.1726,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08862239122390747,
"step": 3355,
"valid_targets_mean": 4239.9,
"valid_targets_min": 1722
},
{
"epoch": 6.10919017288444,
"grad_norm": 0.589702916474223,
"learning_rate": 1.9492702518030905e-06,
"loss": 0.1739,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07204552739858627,
"step": 3360,
"valid_targets_mean": 4596.2,
"valid_targets_min": 370
},
{
"epoch": 6.1182893539581436,
"grad_norm": 0.6606144333508663,
"learning_rate": 1.910413676514438e-06,
"loss": 0.1872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07720930874347687,
"step": 3365,
"valid_targets_mean": 2887.5,
"valid_targets_min": 1416
},
{
"epoch": 6.127388535031847,
"grad_norm": 0.7498116580413373,
"learning_rate": 1.8719288599489304e-06,
"loss": 0.1849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10034845769405365,
"step": 3370,
"valid_targets_mean": 2805.8,
"valid_targets_min": 366
},
{
"epoch": 6.136487716105551,
"grad_norm": 0.7087123237706273,
"learning_rate": 1.833816593007256e-06,
"loss": 0.1876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06755095720291138,
"step": 3375,
"valid_targets_mean": 2808.6,
"valid_targets_min": 241
},
{
"epoch": 6.145586897179254,
"grad_norm": 0.7335482831720123,
"learning_rate": 1.796077658933848e-06,
"loss": 0.1799,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08181584626436234,
"step": 3380,
"valid_targets_mean": 2851.8,
"valid_targets_min": 388
},
{
"epoch": 6.154686078252957,
"grad_norm": 0.6343581720941749,
"learning_rate": 1.7587128333007709e-06,
"loss": 0.1756,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06355266273021698,
"step": 3385,
"valid_targets_mean": 2750.6,
"valid_targets_min": 466
},
{
"epoch": 6.16378525932666,
"grad_norm": 0.7485197111003649,
"learning_rate": 1.7217228839918098e-06,
"loss": 0.1882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12135298550128937,
"step": 3390,
"valid_targets_mean": 3754.4,
"valid_targets_min": 1390
},
{
"epoch": 6.172884440400364,
"grad_norm": 0.6326523371386163,
"learning_rate": 1.6851085711866598e-06,
"loss": 0.1896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0887572169303894,
"step": 3395,
"valid_targets_mean": 3659.1,
"valid_targets_min": 439
},
{
"epoch": 6.1819836214740675,
"grad_norm": 0.6855263364388163,
"learning_rate": 1.648870647345322e-06,
"loss": 0.179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09419068694114685,
"step": 3400,
"valid_targets_mean": 3603.6,
"valid_targets_min": 1045
},
{
"epoch": 6.191082802547771,
"grad_norm": 0.7052701277624316,
"learning_rate": 1.6130098571926468e-06,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08835876733064651,
"step": 3405,
"valid_targets_mean": 3416.0,
"valid_targets_min": 1820
},
{
"epoch": 6.200181983621474,
"grad_norm": 0.805871081345842,
"learning_rate": 1.577526937703e-06,
"loss": 0.1728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08823437243700027,
"step": 3410,
"valid_targets_mean": 3513.1,
"valid_targets_min": 850
},
{
"epoch": 6.209281164695177,
"grad_norm": 0.6952014427915162,
"learning_rate": 1.5424226180851443e-06,
"loss": 0.1849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09718883037567139,
"step": 3415,
"valid_targets_mean": 2961.5,
"valid_targets_min": 1589
},
{
"epoch": 6.218380345768881,
"grad_norm": 0.7522478675724774,
"learning_rate": 1.5076976197672432e-06,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09957942366600037,
"step": 3420,
"valid_targets_mean": 2994.0,
"valid_targets_min": 261
},
{
"epoch": 6.227479526842584,
"grad_norm": 0.5843906150152982,
"learning_rate": 1.473352656382039e-06,
"loss": 0.1796,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08296208083629608,
"step": 3425,
"valid_targets_mean": 4887.5,
"valid_targets_min": 1391
},
{
"epoch": 6.236578707916287,
"grad_norm": 0.5837216159683262,
"learning_rate": 1.439388433752178e-06,
"loss": 0.1831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07392477989196777,
"step": 3430,
"valid_targets_mean": 3705.4,
"valid_targets_min": 1438
},
{
"epoch": 6.245677888989991,
"grad_norm": 0.832232290805666,
"learning_rate": 1.4058056498757112e-06,
"loss": 0.1891,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08831807225942612,
"step": 3435,
"valid_targets_mean": 2949.4,
"valid_targets_min": 2220
},
{
"epoch": 6.254777070063694,
"grad_norm": 0.6668489366701206,
"learning_rate": 1.372604994911757e-06,
"loss": 0.1905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.098930224776268,
"step": 3440,
"valid_targets_mean": 3662.5,
"valid_targets_min": 1352
},
{
"epoch": 6.263876251137398,
"grad_norm": 0.7886986156617598,
"learning_rate": 1.3397871511662986e-06,
"loss": 0.1815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07638974487781525,
"step": 3445,
"valid_targets_mean": 2858.8,
"valid_targets_min": 300
},
{
"epoch": 6.272975432211101,
"grad_norm": 0.6775710838871868,
"learning_rate": 1.307352793078187e-06,
"loss": 0.1896,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06637515127658844,
"step": 3450,
"valid_targets_mean": 2564.6,
"valid_targets_min": 340
},
{
"epoch": 6.282074613284804,
"grad_norm": 0.674208803714708,
"learning_rate": 1.275302587205256e-06,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09290862083435059,
"step": 3455,
"valid_targets_mean": 3960.8,
"valid_targets_min": 1941
},
{
"epoch": 6.2911737943585075,
"grad_norm": 0.5635004473154176,
"learning_rate": 1.2436371922106404e-06,
"loss": 0.1843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08775106072425842,
"step": 3460,
"valid_targets_mean": 5250.9,
"valid_targets_min": 1717
},
{
"epoch": 6.300272975432211,
"grad_norm": 0.7520104883929547,
"learning_rate": 1.2123572588492306e-06,
"loss": 0.1759,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10040166974067688,
"step": 3465,
"valid_targets_mean": 2924.0,
"valid_targets_min": 152
},
{
"epoch": 6.309372156505915,
"grad_norm": 0.5052669919871685,
"learning_rate": 1.1814634299543103e-06,
"loss": 0.1835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05836692452430725,
"step": 3470,
"valid_targets_mean": 3446.1,
"valid_targets_min": 274
},
{
"epoch": 6.318471337579618,
"grad_norm": 0.6764453024690077,
"learning_rate": 1.1509563404243274e-06,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0781787857413292,
"step": 3475,
"valid_targets_mean": 2825.0,
"valid_targets_min": 1768
},
{
"epoch": 6.327570518653321,
"grad_norm": 0.6467509750256821,
"learning_rate": 1.1208366172098684e-06,
"loss": 0.1752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08091972023248672,
"step": 3480,
"valid_targets_mean": 4351.2,
"valid_targets_min": 2307
},
{
"epoch": 6.336669699727024,
"grad_norm": 0.6973506532346149,
"learning_rate": 1.0911048793007484e-06,
"loss": 0.1813,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10063889622688293,
"step": 3485,
"valid_targets_mean": 3283.0,
"valid_targets_min": 1507
},
{
"epoch": 6.345768880800728,
"grad_norm": 0.7884690054718912,
"learning_rate": 1.0617617377133205e-06,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09718523919582367,
"step": 3490,
"valid_targets_mean": 2890.5,
"valid_targets_min": 1782
},
{
"epoch": 6.3548680618744315,
"grad_norm": 0.6032301705318348,
"learning_rate": 1.0328077954778904e-06,
"loss": 0.182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10235874354839325,
"step": 3495,
"valid_targets_mean": 4765.8,
"valid_targets_min": 274
},
{
"epoch": 6.363967242948135,
"grad_norm": 0.6690252665633033,
"learning_rate": 1.004243647626344e-06,
"loss": 0.1784,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09461713582277298,
"step": 3500,
"valid_targets_mean": 3810.2,
"valid_targets_min": 2408
},
{
"epoch": 6.373066424021838,
"grad_norm": 0.6384555467290254,
"learning_rate": 9.760698811799064e-07,
"loss": 0.1872,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08460795879364014,
"step": 3505,
"valid_targets_mean": 3914.2,
"valid_targets_min": 424
},
{
"epoch": 6.382165605095541,
"grad_norm": 0.6491331565328212,
"learning_rate": 9.482870751370755e-07,
"loss": 0.1805,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09265074133872986,
"step": 3510,
"valid_targets_mean": 3294.6,
"valid_targets_min": 2030
},
{
"epoch": 6.391264786169245,
"grad_norm": 0.6514066852280065,
"learning_rate": 9.208958004617475e-07,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08725515007972717,
"step": 3515,
"valid_targets_mean": 3477.8,
"valid_targets_min": 2131
},
{
"epoch": 6.400363967242948,
"grad_norm": 0.5939503819831969,
"learning_rate": 8.938966200714482e-07,
"loss": 0.1768,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0967637449502945,
"step": 3520,
"valid_targets_mean": 6093.5,
"valid_targets_min": 3168
},
{
"epoch": 6.409463148316651,
"grad_norm": 0.6196766279683386,
"learning_rate": 8.672900888257918e-07,
"loss": 0.1808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10511632263660431,
"step": 3525,
"valid_targets_mean": 5057.6,
"valid_targets_min": 2994
},
{
"epoch": 6.418562329390355,
"grad_norm": 0.4824895138585985,
"learning_rate": 8.410767535150599e-07,
"loss": 0.1723,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.05214907228946686,
"step": 3530,
"valid_targets_mean": 2645.6,
"valid_targets_min": 1427
},
{
"epoch": 6.427661510464058,
"grad_norm": 0.6827325735386334,
"learning_rate": 8.152571528489828e-07,
"loss": 0.1863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09623458236455917,
"step": 3535,
"valid_targets_mean": 3689.5,
"valid_targets_min": 169
},
{
"epoch": 6.436760691537762,
"grad_norm": 0.663892399984698,
"learning_rate": 7.898318174456498e-07,
"loss": 0.1864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0786326676607132,
"step": 3540,
"valid_targets_mean": 3200.2,
"valid_targets_min": 191
},
{
"epoch": 6.445859872611465,
"grad_norm": 0.6940887008237617,
"learning_rate": 7.64801269820612e-07,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0850784108042717,
"step": 3545,
"valid_targets_mean": 3372.0,
"valid_targets_min": 340
},
{
"epoch": 6.454959053685168,
"grad_norm": 0.6899041090836107,
"learning_rate": 7.401660243761543e-07,
"loss": 0.1771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08928936719894409,
"step": 3550,
"valid_targets_mean": 3396.8,
"valid_targets_min": 384
},
{
"epoch": 6.4640582347588715,
"grad_norm": 0.6908252432631689,
"learning_rate": 7.159265873907006e-07,
"loss": 0.193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11242173612117767,
"step": 3555,
"valid_targets_mean": 4323.0,
"valid_targets_min": 3470
},
{
"epoch": 6.473157415832575,
"grad_norm": 0.8113352916097301,
"learning_rate": 6.920834570084389e-07,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.12070198357105255,
"step": 3560,
"valid_targets_mean": 3102.1,
"valid_targets_min": 433
},
{
"epoch": 6.482256596906279,
"grad_norm": 0.7063405925347518,
"learning_rate": 6.686371232290567e-07,
"loss": 0.1982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0846632719039917,
"step": 3565,
"valid_targets_mean": 3217.4,
"valid_targets_min": 1225
},
{
"epoch": 6.491355777979982,
"grad_norm": 0.6875590318727268,
"learning_rate": 6.455880678976845e-07,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07678349316120148,
"step": 3570,
"valid_targets_mean": 2996.9,
"valid_targets_min": 293
},
{
"epoch": 6.500454959053685,
"grad_norm": 0.6775291716880106,
"learning_rate": 6.229367646949924e-07,
"loss": 0.1711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1015455350279808,
"step": 3575,
"valid_targets_mean": 3940.4,
"valid_targets_min": 1506
},
{
"epoch": 6.509554140127388,
"grad_norm": 0.8193290349914585,
"learning_rate": 6.006836791274606e-07,
"loss": 0.1795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11495477706193924,
"step": 3580,
"valid_targets_mean": 3150.9,
"valid_targets_min": 321
},
{
"epoch": 6.518653321201092,
"grad_norm": 0.5890978652371885,
"learning_rate": 5.788292685177954e-07,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10000624507665634,
"step": 3585,
"valid_targets_mean": 4716.1,
"valid_targets_min": 2782
},
{
"epoch": 6.5277525022747955,
"grad_norm": 0.6121071180946909,
"learning_rate": 5.573739819955459e-07,
"loss": 0.1727,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07249385118484497,
"step": 3590,
"valid_targets_mean": 3096.5,
"valid_targets_min": 458
},
{
"epoch": 6.536851683348498,
"grad_norm": 0.6411275060644541,
"learning_rate": 5.363182604878803e-07,
"loss": 0.1855,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0972464308142662,
"step": 3595,
"valid_targets_mean": 4242.2,
"valid_targets_min": 3201
},
{
"epoch": 6.545950864422202,
"grad_norm": 0.592828910076141,
"learning_rate": 5.156625367104973e-07,
"loss": 0.1914,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07627043128013611,
"step": 3600,
"valid_targets_mean": 3982.1,
"valid_targets_min": 308
},
{
"epoch": 6.555050045495905,
"grad_norm": 0.7052782207800322,
"learning_rate": 4.954072351587646e-07,
"loss": 0.1788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0874359980225563,
"step": 3605,
"valid_targets_mean": 3140.6,
"valid_targets_min": 1511
},
{
"epoch": 6.564149226569609,
"grad_norm": 0.6894516190804516,
"learning_rate": 4.75552772098975e-07,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09235049039125443,
"step": 3610,
"valid_targets_mean": 3940.2,
"valid_targets_min": 311
},
{
"epoch": 6.573248407643312,
"grad_norm": 0.6215785808807689,
"learning_rate": 4.560995555597969e-07,
"loss": 0.1814,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0887666791677475,
"step": 3615,
"valid_targets_mean": 3609.2,
"valid_targets_min": 1385
},
{
"epoch": 6.582347588717015,
"grad_norm": 0.6192208581963837,
"learning_rate": 4.3704798532388624e-07,
"loss": 0.1846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10467948019504547,
"step": 3620,
"valid_targets_mean": 4307.4,
"valid_targets_min": 2053
},
{
"epoch": 6.591446769790719,
"grad_norm": 0.6338893728376359,
"learning_rate": 4.1839845291968607e-07,
"loss": 0.1878,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10062219947576523,
"step": 3625,
"valid_targets_mean": 4577.0,
"valid_targets_min": 2230
},
{
"epoch": 6.600545950864422,
"grad_norm": 0.6990330295376892,
"learning_rate": 4.001513416133551e-07,
"loss": 0.177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08158162236213684,
"step": 3630,
"valid_targets_mean": 3457.1,
"valid_targets_min": 336
},
{
"epoch": 6.609645131938126,
"grad_norm": 0.506941996196486,
"learning_rate": 3.823070264009099e-07,
"loss": 0.1786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07667286694049835,
"step": 3635,
"valid_targets_mean": 4367.6,
"valid_targets_min": 278
},
{
"epoch": 6.618744313011829,
"grad_norm": 0.6337734569018411,
"learning_rate": 3.648658740005107e-07,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07626718282699585,
"step": 3640,
"valid_targets_mean": 3231.2,
"valid_targets_min": 2235
},
{
"epoch": 6.627843494085532,
"grad_norm": 0.5875375339866471,
"learning_rate": 3.4782824284492975e-07,
"loss": 0.1802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10731066018342972,
"step": 3645,
"valid_targets_mean": 5920.9,
"valid_targets_min": 3895
},
{
"epoch": 6.6369426751592355,
"grad_norm": 0.67413263385624,
"learning_rate": 3.31194483074182e-07,
"loss": 0.1736,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09552273899316788,
"step": 3650,
"valid_targets_mean": 4226.9,
"valid_targets_min": 261
},
{
"epoch": 6.646041856232939,
"grad_norm": 0.6521249448828749,
"learning_rate": 3.149649365283258e-07,
"loss": 0.1821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.06236450746655464,
"step": 3655,
"valid_targets_mean": 2752.9,
"valid_targets_min": 288
},
{
"epoch": 6.655141037306643,
"grad_norm": 0.6212796752617139,
"learning_rate": 2.9913993674044904e-07,
"loss": 0.1848,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09087605029344559,
"step": 3660,
"valid_targets_mean": 4887.8,
"valid_targets_min": 1841
},
{
"epoch": 6.664240218380346,
"grad_norm": 0.7027944694981803,
"learning_rate": 2.8371980892979436e-07,
"loss": 0.1859,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1104184091091156,
"step": 3665,
"valid_targets_mean": 3617.5,
"valid_targets_min": 1831
},
{
"epoch": 6.673339399454049,
"grad_norm": 0.6087584684328681,
"learning_rate": 2.687048699951067e-07,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07848186790943146,
"step": 3670,
"valid_targets_mean": 3574.5,
"valid_targets_min": 1333
},
{
"epoch": 6.682438580527752,
"grad_norm": 0.6580904025427522,
"learning_rate": 2.5409542850808765e-07,
"loss": 0.1877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10046820342540741,
"step": 3675,
"valid_targets_mean": 3933.9,
"valid_targets_min": 260
},
{
"epoch": 6.691537761601456,
"grad_norm": 0.6087191196250359,
"learning_rate": 2.3989178470707364e-07,
"loss": 0.18,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08826770633459091,
"step": 3680,
"valid_targets_mean": 4082.4,
"valid_targets_min": 1308
},
{
"epoch": 6.7006369426751595,
"grad_norm": 0.8153778673745999,
"learning_rate": 2.260942304908609e-07,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11358342319726944,
"step": 3685,
"valid_targets_mean": 3213.5,
"valid_targets_min": 588
},
{
"epoch": 6.709736123748863,
"grad_norm": 0.7140363348627277,
"learning_rate": 2.1270304941271025e-07,
"loss": 0.2003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11204315721988678,
"step": 3690,
"valid_targets_mean": 4244.4,
"valid_targets_min": 2250
},
{
"epoch": 6.718835304822566,
"grad_norm": 0.7549599688622531,
"learning_rate": 1.9971851667451413e-07,
"loss": 0.193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1169305294752121,
"step": 3695,
"valid_targets_mean": 3374.1,
"valid_targets_min": 1968
},
{
"epoch": 6.727934485896269,
"grad_norm": 0.6941835790300109,
"learning_rate": 1.8714089912113876e-07,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1251552700996399,
"step": 3700,
"valid_targets_mean": 4214.8,
"valid_targets_min": 2772
},
{
"epoch": 6.737033666969973,
"grad_norm": 0.8007989348447613,
"learning_rate": 1.749704552349507e-07,
"loss": 0.1944,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10345979034900665,
"step": 3705,
"valid_targets_mean": 2992.9,
"valid_targets_min": 263
},
{
"epoch": 6.746132848043676,
"grad_norm": 0.719702971321928,
"learning_rate": 1.6320743513049686e-07,
"loss": 0.1774,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10299459844827652,
"step": 3710,
"valid_targets_mean": 2893.6,
"valid_targets_min": 313
},
{
"epoch": 6.755232029117379,
"grad_norm": 0.7087967586285943,
"learning_rate": 1.5185208054936394e-07,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1190565824508667,
"step": 3715,
"valid_targets_mean": 4597.0,
"valid_targets_min": 1703
},
{
"epoch": 6.764331210191083,
"grad_norm": 0.5318051425992069,
"learning_rate": 1.4090462485521816e-07,
"loss": 0.1892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07275549322366714,
"step": 3720,
"valid_targets_mean": 3686.5,
"valid_targets_min": 355
},
{
"epoch": 6.773430391264786,
"grad_norm": 0.7887933323438483,
"learning_rate": 1.303652930289956e-07,
"loss": 0.1857,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0893682911992073,
"step": 3725,
"valid_targets_mean": 2508.0,
"valid_targets_min": 894
},
{
"epoch": 6.78252957233849,
"grad_norm": 0.6939538297031341,
"learning_rate": 1.2023430166429485e-07,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09880831837654114,
"step": 3730,
"valid_targets_mean": 3593.8,
"valid_targets_min": 235
},
{
"epoch": 6.791628753412192,
"grad_norm": 0.7431914466111932,
"learning_rate": 1.1051185896291616e-07,
"loss": 0.182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07245789468288422,
"step": 3735,
"valid_targets_mean": 2910.5,
"valid_targets_min": 164
},
{
"epoch": 6.800727934485896,
"grad_norm": 0.6531446016749648,
"learning_rate": 1.011981647305782e-07,
"loss": 0.1607,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07852613925933838,
"step": 3740,
"valid_targets_mean": 3377.0,
"valid_targets_min": 1521
},
{
"epoch": 6.8098271155595995,
"grad_norm": 0.7324557362184932,
"learning_rate": 9.22934103728279e-08,
"loss": 0.1792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07569163292646408,
"step": 3745,
"valid_targets_mean": 2686.8,
"valid_targets_min": 339
},
{
"epoch": 6.818926296633303,
"grad_norm": 0.6590389864988105,
"learning_rate": 8.37977788910882e-08,
"loss": 0.17,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07628272473812103,
"step": 3750,
"valid_targets_mean": 2587.9,
"valid_targets_min": 686
},
{
"epoch": 6.828025477707007,
"grad_norm": 0.7436442598809084,
"learning_rate": 7.571144487891202e-08,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09393531084060669,
"step": 3755,
"valid_targets_mean": 2498.8,
"valid_targets_min": 581
},
{
"epoch": 6.837124658780709,
"grad_norm": 0.7374402989833732,
"learning_rate": 6.803457451838746e-08,
"loss": 0.1849,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1075291633605957,
"step": 3760,
"valid_targets_mean": 3226.6,
"valid_targets_min": 734
},
{
"epoch": 6.846223839854413,
"grad_norm": 0.4604358460897986,
"learning_rate": 6.076732557672272e-08,
"loss": 0.1717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07132543623447418,
"step": 3765,
"valid_targets_mean": 7595.2,
"valid_targets_min": 360
},
{
"epoch": 6.855323020928116,
"grad_norm": 0.7017036176712402,
"learning_rate": 5.390984740299976e-08,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09402775019407272,
"step": 3770,
"valid_targets_mean": 3475.1,
"valid_targets_min": 1721
},
{
"epoch": 6.86442220200182,
"grad_norm": 0.7041095060978012,
"learning_rate": 4.7462280925116847e-08,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09718748927116394,
"step": 3775,
"valid_targets_mean": 4057.4,
"valid_targets_min": 334
},
{
"epoch": 6.8735213830755235,
"grad_norm": 0.7879474477338477,
"learning_rate": 4.142475864688411e-08,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09216184914112091,
"step": 3780,
"valid_targets_mean": 2256.6,
"valid_targets_min": 263
},
{
"epoch": 6.882620564149226,
"grad_norm": 0.7052882526108005,
"learning_rate": 3.5797404645296906e-08,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0836934745311737,
"step": 3785,
"valid_targets_mean": 3189.5,
"valid_targets_min": 302
},
{
"epoch": 6.89171974522293,
"grad_norm": 0.6415834858261883,
"learning_rate": 3.0580334567995585e-08,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10515318065881729,
"step": 3790,
"valid_targets_mean": 4577.0,
"valid_targets_min": 2504
},
{
"epoch": 6.900818926296633,
"grad_norm": 0.7167619855564329,
"learning_rate": 2.5773655630880746e-08,
"loss": 0.1956,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1195126473903656,
"step": 3795,
"valid_targets_mean": 4239.6,
"valid_targets_min": 2600
},
{
"epoch": 6.909918107370337,
"grad_norm": 0.5847738389354258,
"learning_rate": 2.1377466615912778e-08,
"loss": 0.1808,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.07136321067810059,
"step": 3800,
"valid_targets_mean": 4093.9,
"valid_targets_min": 1204
},
{
"epoch": 6.91901728844404,
"grad_norm": 0.6674740866579093,
"learning_rate": 1.7391857869086815e-08,
"loss": 0.1794,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09090028703212738,
"step": 3805,
"valid_targets_mean": 3187.9,
"valid_targets_min": 1087
},
{
"epoch": 6.928116469517743,
"grad_norm": 0.6940020851233624,
"learning_rate": 1.3816911298565327e-08,
"loss": 0.1821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08191139996051788,
"step": 3810,
"valid_targets_mean": 3583.0,
"valid_targets_min": 2403
},
{
"epoch": 6.937215650591447,
"grad_norm": 0.6521002518067545,
"learning_rate": 1.0652700373006142e-08,
"loss": 0.1841,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0826297402381897,
"step": 3815,
"valid_targets_mean": 3706.0,
"valid_targets_min": 1384
},
{
"epoch": 6.94631483166515,
"grad_norm": 0.6871719319654492,
"learning_rate": 7.899290120039205e-09,
"loss": 0.1694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.0961792916059494,
"step": 3820,
"valid_targets_mean": 3572.2,
"valid_targets_min": 986
},
{
"epoch": 6.955414012738854,
"grad_norm": 0.7108375386012565,
"learning_rate": 5.556737124945422e-09,
"loss": 0.1964,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.10159586369991302,
"step": 3825,
"valid_targets_mean": 3412.9,
"valid_targets_min": 633
},
{
"epoch": 6.964513193812557,
"grad_norm": 0.7344106634967527,
"learning_rate": 3.6250895294842605e-09,
"loss": 0.1839,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08290895074605942,
"step": 3830,
"valid_targets_mean": 2692.9,
"valid_targets_min": 301
},
{
"epoch": 6.97361237488626,
"grad_norm": 0.6078419999211205,
"learning_rate": 2.1043870309078727e-09,
"loss": 0.1842,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.08749958872795105,
"step": 3835,
"valid_targets_mean": 4106.5,
"valid_targets_min": 1108
},
{
"epoch": 6.9827115559599635,
"grad_norm": 0.6441846884391178,
"learning_rate": 9.946608811395308e-10,
"loss": 0.1778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09097015857696533,
"step": 3840,
"valid_targets_mean": 3864.9,
"valid_targets_min": 1595
},
{
"epoch": 6.991810737033667,
"grad_norm": 0.6584217092501846,
"learning_rate": 2.959338861407979e-10,
"loss": 0.1885,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.09941902756690979,
"step": 3845,
"valid_targets_mean": 3675.5,
"valid_targets_min": 2043
},
{
"epoch": 7.0,
"grad_norm": 0.8102798117849903,
"learning_rate": 8.220405436354384e-12,
"loss": 0.1758,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1581478863954544,
"step": 3850,
"valid_targets_mean": 4096.2,
"valid_targets_min": 1169
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1581478863954544,
"step": 3850,
"total_flos": 1.0887953365472379e+18,
"train_loss": 0.25177762028458833,
"train_runtime": 92981.7064,
"train_samples_per_second": 0.662,
"train_steps_per_second": 0.041,
"valid_targets_mean": 4096.2,
"valid_targets_min": 1169
}
],
"logging_steps": 5,
"max_steps": 3850,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 200,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1.0887953365472379e+18,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}