a1-stack_bash_withtests / trainer_state.json
EtashGuha's picture
Upload folder using huggingface_hub
907faae verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.0,
"eval_steps": 500,
"global_step": 4662,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.0075075075075075074,
"grad_norm": 11.018023139973177,
"learning_rate": 3.426124197002142e-07,
"loss": 0.6962,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.666359007358551,
"step": 5,
"valid_targets_mean": 3406.2,
"valid_targets_min": 590
},
{
"epoch": 0.015015015015015015,
"grad_norm": 14.300498234778246,
"learning_rate": 7.708779443254819e-07,
"loss": 0.6812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7260710597038269,
"step": 10,
"valid_targets_mean": 2929.3,
"valid_targets_min": 540
},
{
"epoch": 0.02252252252252252,
"grad_norm": 10.308334513580103,
"learning_rate": 1.1991434689507496e-06,
"loss": 0.694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.7622815370559692,
"step": 15,
"valid_targets_mean": 4942.4,
"valid_targets_min": 474
},
{
"epoch": 0.03003003003003003,
"grad_norm": 9.480467405179247,
"learning_rate": 1.6274089935760173e-06,
"loss": 0.63,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5915040969848633,
"step": 20,
"valid_targets_mean": 4988.7,
"valid_targets_min": 506
},
{
"epoch": 0.03753753753753754,
"grad_norm": 6.98322327787682,
"learning_rate": 2.055674518201285e-06,
"loss": 0.634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6035254001617432,
"step": 25,
"valid_targets_mean": 4144.8,
"valid_targets_min": 406
},
{
"epoch": 0.04504504504504504,
"grad_norm": 4.519545202299929,
"learning_rate": 2.4839400428265524e-06,
"loss": 0.6108,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6693063974380493,
"step": 30,
"valid_targets_mean": 2645.9,
"valid_targets_min": 811
},
{
"epoch": 0.052552552552552555,
"grad_norm": 2.254075439509915,
"learning_rate": 2.9122055674518203e-06,
"loss": 0.583,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.6287423968315125,
"step": 35,
"valid_targets_mean": 5337.9,
"valid_targets_min": 424
},
{
"epoch": 0.06006006006006006,
"grad_norm": 1.5869006029617074,
"learning_rate": 3.3404710920770882e-06,
"loss": 0.4981,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5136668682098389,
"step": 40,
"valid_targets_mean": 4675.1,
"valid_targets_min": 683
},
{
"epoch": 0.06756756756756757,
"grad_norm": 1.2871585570908246,
"learning_rate": 3.7687366167023558e-06,
"loss": 0.498,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4761298894882202,
"step": 45,
"valid_targets_mean": 4580.2,
"valid_targets_min": 695
},
{
"epoch": 0.07507507507507508,
"grad_norm": 1.1073292407135484,
"learning_rate": 4.197002141327624e-06,
"loss": 0.4618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4800295829772949,
"step": 50,
"valid_targets_mean": 3829.7,
"valid_targets_min": 408
},
{
"epoch": 0.08258258258258258,
"grad_norm": 0.8919504665868666,
"learning_rate": 4.625267665952891e-06,
"loss": 0.5237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.525561511516571,
"step": 55,
"valid_targets_mean": 5515.5,
"valid_targets_min": 571
},
{
"epoch": 0.09009009009009009,
"grad_norm": 0.865780829661676,
"learning_rate": 5.05353319057816e-06,
"loss": 0.5163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.5415364503860474,
"step": 60,
"valid_targets_mean": 3433.2,
"valid_targets_min": 511
},
{
"epoch": 0.09759759759759759,
"grad_norm": 0.5872913252913201,
"learning_rate": 5.481798715203427e-06,
"loss": 0.4707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3888802230358124,
"step": 65,
"valid_targets_mean": 5232.6,
"valid_targets_min": 664
},
{
"epoch": 0.10510510510510511,
"grad_norm": 0.5994653626627001,
"learning_rate": 5.910064239828695e-06,
"loss": 0.4821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43450668454170227,
"step": 70,
"valid_targets_mean": 5187.1,
"valid_targets_min": 460
},
{
"epoch": 0.11261261261261261,
"grad_norm": 0.6662883071321841,
"learning_rate": 6.338329764453962e-06,
"loss": 0.4331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3964645564556122,
"step": 75,
"valid_targets_mean": 3182.0,
"valid_targets_min": 880
},
{
"epoch": 0.12012012012012012,
"grad_norm": 0.6301518751447736,
"learning_rate": 6.76659528907923e-06,
"loss": 0.4374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37995022535324097,
"step": 80,
"valid_targets_mean": 3907.1,
"valid_targets_min": 773
},
{
"epoch": 0.12762762762762764,
"grad_norm": 0.6479909629866574,
"learning_rate": 7.194860813704497e-06,
"loss": 0.4749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.43532025814056396,
"step": 85,
"valid_targets_mean": 3381.8,
"valid_targets_min": 727
},
{
"epoch": 0.13513513513513514,
"grad_norm": 0.601954910384077,
"learning_rate": 7.623126338329765e-06,
"loss": 0.449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37232670187950134,
"step": 90,
"valid_targets_mean": 3859.4,
"valid_targets_min": 681
},
{
"epoch": 0.14264264264264265,
"grad_norm": 0.6010699211352588,
"learning_rate": 8.051391862955033e-06,
"loss": 0.4036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3912065625190735,
"step": 95,
"valid_targets_mean": 4532.2,
"valid_targets_min": 525
},
{
"epoch": 0.15015015015015015,
"grad_norm": 0.6776934870921543,
"learning_rate": 8.4796573875803e-06,
"loss": 0.4009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3918367922306061,
"step": 100,
"valid_targets_mean": 3923.7,
"valid_targets_min": 631
},
{
"epoch": 0.15765765765765766,
"grad_norm": 0.5815397148408697,
"learning_rate": 8.907922912205568e-06,
"loss": 0.422,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40705981850624084,
"step": 105,
"valid_targets_mean": 4907.4,
"valid_targets_min": 624
},
{
"epoch": 0.16516516516516516,
"grad_norm": 0.6207231229898003,
"learning_rate": 9.336188436830836e-06,
"loss": 0.4197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35407790541648865,
"step": 110,
"valid_targets_mean": 4749.1,
"valid_targets_min": 357
},
{
"epoch": 0.17267267267267267,
"grad_norm": 0.7161182478604338,
"learning_rate": 9.764453961456105e-06,
"loss": 0.4271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3748543858528137,
"step": 115,
"valid_targets_mean": 2599.0,
"valid_targets_min": 495
},
{
"epoch": 0.18018018018018017,
"grad_norm": 0.6433782885571062,
"learning_rate": 1.019271948608137e-05,
"loss": 0.4129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.44952958822250366,
"step": 120,
"valid_targets_mean": 3456.8,
"valid_targets_min": 521
},
{
"epoch": 0.18768768768768768,
"grad_norm": 0.608760987576289,
"learning_rate": 1.062098501070664e-05,
"loss": 0.396,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4421440064907074,
"step": 125,
"valid_targets_mean": 4304.8,
"valid_targets_min": 676
},
{
"epoch": 0.19519519519519518,
"grad_norm": 0.6056247540086898,
"learning_rate": 1.1049250535331907e-05,
"loss": 0.356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3524633049964905,
"step": 130,
"valid_targets_mean": 4378.4,
"valid_targets_min": 699
},
{
"epoch": 0.20270270270270271,
"grad_norm": 0.7470542876873747,
"learning_rate": 1.1477516059957175e-05,
"loss": 0.3928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3509212136268616,
"step": 135,
"valid_targets_mean": 3348.1,
"valid_targets_min": 580
},
{
"epoch": 0.21021021021021022,
"grad_norm": 0.5297517332166896,
"learning_rate": 1.1905781584582443e-05,
"loss": 0.3971,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3493044376373291,
"step": 140,
"valid_targets_mean": 4820.6,
"valid_targets_min": 588
},
{
"epoch": 0.21771771771771772,
"grad_norm": 0.8236972811131019,
"learning_rate": 1.233404710920771e-05,
"loss": 0.4229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4382990002632141,
"step": 145,
"valid_targets_mean": 4910.1,
"valid_targets_min": 704
},
{
"epoch": 0.22522522522522523,
"grad_norm": 0.5641188867988419,
"learning_rate": 1.2762312633832978e-05,
"loss": 0.4053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4189315438270569,
"step": 150,
"valid_targets_mean": 4847.2,
"valid_targets_min": 479
},
{
"epoch": 0.23273273273273273,
"grad_norm": 0.759436996305121,
"learning_rate": 1.3190578158458245e-05,
"loss": 0.3995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4512358009815216,
"step": 155,
"valid_targets_mean": 3609.1,
"valid_targets_min": 660
},
{
"epoch": 0.24024024024024024,
"grad_norm": 0.5776616654260357,
"learning_rate": 1.3618843683083513e-05,
"loss": 0.3982,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.366862416267395,
"step": 160,
"valid_targets_mean": 4489.5,
"valid_targets_min": 709
},
{
"epoch": 0.24774774774774774,
"grad_norm": 0.5621030834623711,
"learning_rate": 1.404710920770878e-05,
"loss": 0.3562,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3245847225189209,
"step": 165,
"valid_targets_mean": 3611.0,
"valid_targets_min": 857
},
{
"epoch": 0.2552552552552553,
"grad_norm": 0.6383475705856398,
"learning_rate": 1.4475374732334048e-05,
"loss": 0.3633,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3641152083873749,
"step": 170,
"valid_targets_mean": 3776.7,
"valid_targets_min": 273
},
{
"epoch": 0.2627627627627628,
"grad_norm": 0.6387883870614447,
"learning_rate": 1.4903640256959315e-05,
"loss": 0.3892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4122806787490845,
"step": 175,
"valid_targets_mean": 4106.8,
"valid_targets_min": 367
},
{
"epoch": 0.2702702702702703,
"grad_norm": 0.5859730062305724,
"learning_rate": 1.5331905781584583e-05,
"loss": 0.4145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4545392692089081,
"step": 180,
"valid_targets_mean": 5412.8,
"valid_targets_min": 485
},
{
"epoch": 0.2777777777777778,
"grad_norm": 0.6291566957212851,
"learning_rate": 1.576017130620985e-05,
"loss": 0.3586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34801965951919556,
"step": 185,
"valid_targets_mean": 3683.8,
"valid_targets_min": 388
},
{
"epoch": 0.2852852852852853,
"grad_norm": 0.7714952807971188,
"learning_rate": 1.618843683083512e-05,
"loss": 0.4031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33357149362564087,
"step": 190,
"valid_targets_mean": 3992.8,
"valid_targets_min": 645
},
{
"epoch": 0.2927927927927928,
"grad_norm": 0.6022688124054402,
"learning_rate": 1.6616702355460387e-05,
"loss": 0.3632,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32963526248931885,
"step": 195,
"valid_targets_mean": 4479.6,
"valid_targets_min": 376
},
{
"epoch": 0.3003003003003003,
"grad_norm": 0.5461125797479052,
"learning_rate": 1.7044967880085653e-05,
"loss": 0.3609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3471255898475647,
"step": 200,
"valid_targets_mean": 5124.2,
"valid_targets_min": 2440
},
{
"epoch": 0.3078078078078078,
"grad_norm": 0.6479231652954496,
"learning_rate": 1.7473233404710924e-05,
"loss": 0.3709,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36097437143325806,
"step": 205,
"valid_targets_mean": 3874.2,
"valid_targets_min": 536
},
{
"epoch": 0.3153153153153153,
"grad_norm": 0.6307321400936947,
"learning_rate": 1.790149892933619e-05,
"loss": 0.356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32168492674827576,
"step": 210,
"valid_targets_mean": 4215.9,
"valid_targets_min": 750
},
{
"epoch": 0.3228228228228228,
"grad_norm": 0.7342733098843338,
"learning_rate": 1.8329764453961457e-05,
"loss": 0.3716,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3192724585533142,
"step": 215,
"valid_targets_mean": 3300.5,
"valid_targets_min": 465
},
{
"epoch": 0.3303303303303303,
"grad_norm": 0.6269217295173055,
"learning_rate": 1.8758029978586724e-05,
"loss": 0.382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.393771767616272,
"step": 220,
"valid_targets_mean": 3780.5,
"valid_targets_min": 520
},
{
"epoch": 0.33783783783783783,
"grad_norm": 0.6699586606597604,
"learning_rate": 1.9186295503211994e-05,
"loss": 0.3367,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3441130518913269,
"step": 225,
"valid_targets_mean": 3570.4,
"valid_targets_min": 367
},
{
"epoch": 0.34534534534534533,
"grad_norm": 0.6212030440388314,
"learning_rate": 1.961456102783726e-05,
"loss": 0.3249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28860020637512207,
"step": 230,
"valid_targets_mean": 4043.8,
"valid_targets_min": 797
},
{
"epoch": 0.35285285285285284,
"grad_norm": 0.5933247879185318,
"learning_rate": 2.004282655246253e-05,
"loss": 0.3663,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2963605523109436,
"step": 235,
"valid_targets_mean": 4519.4,
"valid_targets_min": 679
},
{
"epoch": 0.36036036036036034,
"grad_norm": 0.5915857140141431,
"learning_rate": 2.0471092077087794e-05,
"loss": 0.3707,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3590105175971985,
"step": 240,
"valid_targets_mean": 4801.9,
"valid_targets_min": 786
},
{
"epoch": 0.36786786786786785,
"grad_norm": 0.6926624493340766,
"learning_rate": 2.089935760171306e-05,
"loss": 0.3699,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3375079035758972,
"step": 245,
"valid_targets_mean": 3064.8,
"valid_targets_min": 636
},
{
"epoch": 0.37537537537537535,
"grad_norm": 0.5625060900455121,
"learning_rate": 2.1327623126338334e-05,
"loss": 0.3717,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2878052592277527,
"step": 250,
"valid_targets_mean": 4984.9,
"valid_targets_min": 389
},
{
"epoch": 0.38288288288288286,
"grad_norm": 0.4895346484151352,
"learning_rate": 2.17558886509636e-05,
"loss": 0.3319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3224838972091675,
"step": 255,
"valid_targets_mean": 5919.2,
"valid_targets_min": 631
},
{
"epoch": 0.39039039039039036,
"grad_norm": 0.6186907667129198,
"learning_rate": 2.2184154175588867e-05,
"loss": 0.3133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3299029767513275,
"step": 260,
"valid_targets_mean": 4151.9,
"valid_targets_min": 694
},
{
"epoch": 0.3978978978978979,
"grad_norm": 0.637540257330486,
"learning_rate": 2.2612419700214137e-05,
"loss": 0.3034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31127655506134033,
"step": 265,
"valid_targets_mean": 4565.4,
"valid_targets_min": 667
},
{
"epoch": 0.40540540540540543,
"grad_norm": 0.6482997719326944,
"learning_rate": 2.3040685224839404e-05,
"loss": 0.371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3371477723121643,
"step": 270,
"valid_targets_mean": 4799.7,
"valid_targets_min": 565
},
{
"epoch": 0.41291291291291293,
"grad_norm": 0.630240697831865,
"learning_rate": 2.346895074946467e-05,
"loss": 0.4042,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3549198508262634,
"step": 275,
"valid_targets_mean": 3973.2,
"valid_targets_min": 571
},
{
"epoch": 0.42042042042042044,
"grad_norm": 0.5378005948550142,
"learning_rate": 2.3897216274089937e-05,
"loss": 0.3568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3140275776386261,
"step": 280,
"valid_targets_mean": 4524.4,
"valid_targets_min": 466
},
{
"epoch": 0.42792792792792794,
"grad_norm": 0.5496707584360776,
"learning_rate": 2.4325481798715207e-05,
"loss": 0.3439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27984702587127686,
"step": 285,
"valid_targets_mean": 5251.4,
"valid_targets_min": 871
},
{
"epoch": 0.43543543543543545,
"grad_norm": 0.6054529261217243,
"learning_rate": 2.4753747323340474e-05,
"loss": 0.3399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2717384994029999,
"step": 290,
"valid_targets_mean": 5978.3,
"valid_targets_min": 665
},
{
"epoch": 0.44294294294294295,
"grad_norm": 0.60946853866193,
"learning_rate": 2.518201284796574e-05,
"loss": 0.3324,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31978553533554077,
"step": 295,
"valid_targets_mean": 3610.3,
"valid_targets_min": 729
},
{
"epoch": 0.45045045045045046,
"grad_norm": 0.7112237553385803,
"learning_rate": 2.5610278372591007e-05,
"loss": 0.365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36318349838256836,
"step": 300,
"valid_targets_mean": 2997.6,
"valid_targets_min": 398
},
{
"epoch": 0.45795795795795796,
"grad_norm": 0.5754561363093669,
"learning_rate": 2.6038543897216277e-05,
"loss": 0.3475,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3775876760482788,
"step": 305,
"valid_targets_mean": 5485.2,
"valid_targets_min": 291
},
{
"epoch": 0.46546546546546547,
"grad_norm": 0.5225836627231101,
"learning_rate": 2.6466809421841544e-05,
"loss": 0.3327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2630726099014282,
"step": 310,
"valid_targets_mean": 5477.4,
"valid_targets_min": 1953
},
{
"epoch": 0.47297297297297297,
"grad_norm": 0.6631066150226813,
"learning_rate": 2.689507494646681e-05,
"loss": 0.3341,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4078267812728882,
"step": 315,
"valid_targets_mean": 4227.4,
"valid_targets_min": 691
},
{
"epoch": 0.4804804804804805,
"grad_norm": 0.5625056894327084,
"learning_rate": 2.732334047109208e-05,
"loss": 0.3307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34400713443756104,
"step": 320,
"valid_targets_mean": 6082.6,
"valid_targets_min": 756
},
{
"epoch": 0.487987987987988,
"grad_norm": 0.5720940827291631,
"learning_rate": 2.7751605995717347e-05,
"loss": 0.3544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.364154189825058,
"step": 325,
"valid_targets_mean": 5058.0,
"valid_targets_min": 1324
},
{
"epoch": 0.4954954954954955,
"grad_norm": 0.6142764560167397,
"learning_rate": 2.8179871520342614e-05,
"loss": 0.3567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3340011239051819,
"step": 330,
"valid_targets_mean": 3809.8,
"valid_targets_min": 606
},
{
"epoch": 0.503003003003003,
"grad_norm": 0.6862489554890606,
"learning_rate": 2.860813704496788e-05,
"loss": 0.3377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.347086638212204,
"step": 335,
"valid_targets_mean": 3381.4,
"valid_targets_min": 529
},
{
"epoch": 0.5105105105105106,
"grad_norm": 0.5884162448896875,
"learning_rate": 2.903640256959315e-05,
"loss": 0.3156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3551441431045532,
"step": 340,
"valid_targets_mean": 4280.0,
"valid_targets_min": 656
},
{
"epoch": 0.5180180180180181,
"grad_norm": 0.5985519809481195,
"learning_rate": 2.9464668094218417e-05,
"loss": 0.3718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3538270592689514,
"step": 345,
"valid_targets_mean": 4933.6,
"valid_targets_min": 679
},
{
"epoch": 0.5255255255255256,
"grad_norm": 0.6608489868770677,
"learning_rate": 2.9892933618843684e-05,
"loss": 0.3821,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3977230191230774,
"step": 350,
"valid_targets_mean": 4619.8,
"valid_targets_min": 617
},
{
"epoch": 0.5330330330330331,
"grad_norm": 0.6666435654761541,
"learning_rate": 3.032119914346895e-05,
"loss": 0.3205,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3276807963848114,
"step": 355,
"valid_targets_mean": 3228.0,
"valid_targets_min": 396
},
{
"epoch": 0.5405405405405406,
"grad_norm": 0.5700169845584041,
"learning_rate": 3.0749464668094224e-05,
"loss": 0.3373,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.252112478017807,
"step": 360,
"valid_targets_mean": 4043.2,
"valid_targets_min": 470
},
{
"epoch": 0.5480480480480481,
"grad_norm": 0.5969317196396643,
"learning_rate": 3.117773019271949e-05,
"loss": 0.3344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.257426917552948,
"step": 365,
"valid_targets_mean": 3501.2,
"valid_targets_min": 637
},
{
"epoch": 0.5555555555555556,
"grad_norm": 0.5338582932799799,
"learning_rate": 3.160599571734476e-05,
"loss": 0.3469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4118390679359436,
"step": 370,
"valid_targets_mean": 6022.6,
"valid_targets_min": 668
},
{
"epoch": 0.5630630630630631,
"grad_norm": 0.7156868770693144,
"learning_rate": 3.2034261241970024e-05,
"loss": 0.342,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33580997586250305,
"step": 375,
"valid_targets_mean": 3146.6,
"valid_targets_min": 580
},
{
"epoch": 0.5705705705705706,
"grad_norm": 0.6105442252909425,
"learning_rate": 3.246252676659529e-05,
"loss": 0.3246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29976391792297363,
"step": 380,
"valid_targets_mean": 4423.6,
"valid_targets_min": 579
},
{
"epoch": 0.5780780780780781,
"grad_norm": 0.48535869781119606,
"learning_rate": 3.289079229122056e-05,
"loss": 0.3211,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2958953380584717,
"step": 385,
"valid_targets_mean": 5096.5,
"valid_targets_min": 1111
},
{
"epoch": 0.5855855855855856,
"grad_norm": 0.5293285996606892,
"learning_rate": 3.3319057815845824e-05,
"loss": 0.3012,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29280033707618713,
"step": 390,
"valid_targets_mean": 4133.6,
"valid_targets_min": 664
},
{
"epoch": 0.5930930930930931,
"grad_norm": 0.6364074446274751,
"learning_rate": 3.37473233404711e-05,
"loss": 0.3546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3336215019226074,
"step": 395,
"valid_targets_mean": 3474.1,
"valid_targets_min": 277
},
{
"epoch": 0.6006006006006006,
"grad_norm": 0.7064277061832516,
"learning_rate": 3.4175588865096364e-05,
"loss": 0.3238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38183677196502686,
"step": 400,
"valid_targets_mean": 4343.8,
"valid_targets_min": 831
},
{
"epoch": 0.6081081081081081,
"grad_norm": 0.5234255969114723,
"learning_rate": 3.460385438972163e-05,
"loss": 0.3259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3263946771621704,
"step": 405,
"valid_targets_mean": 5912.4,
"valid_targets_min": 525
},
{
"epoch": 0.6156156156156156,
"grad_norm": 0.6859056535544392,
"learning_rate": 3.50321199143469e-05,
"loss": 0.3613,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4518062472343445,
"step": 410,
"valid_targets_mean": 4294.0,
"valid_targets_min": 672
},
{
"epoch": 0.6231231231231231,
"grad_norm": 0.593812126409495,
"learning_rate": 3.5460385438972164e-05,
"loss": 0.3236,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.284976601600647,
"step": 415,
"valid_targets_mean": 4542.8,
"valid_targets_min": 732
},
{
"epoch": 0.6306306306306306,
"grad_norm": 0.5542761631226861,
"learning_rate": 3.588865096359743e-05,
"loss": 0.3575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3369911313056946,
"step": 420,
"valid_targets_mean": 4173.8,
"valid_targets_min": 623
},
{
"epoch": 0.6381381381381381,
"grad_norm": 0.694482077890855,
"learning_rate": 3.63169164882227e-05,
"loss": 0.331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35457199811935425,
"step": 425,
"valid_targets_mean": 3347.3,
"valid_targets_min": 323
},
{
"epoch": 0.6456456456456456,
"grad_norm": 0.5087776401105766,
"learning_rate": 3.674518201284797e-05,
"loss": 0.3077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2870054244995117,
"step": 430,
"valid_targets_mean": 5496.8,
"valid_targets_min": 995
},
{
"epoch": 0.6531531531531531,
"grad_norm": 0.5710934865190025,
"learning_rate": 3.717344753747324e-05,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3406960964202881,
"step": 435,
"valid_targets_mean": 4272.1,
"valid_targets_min": 578
},
{
"epoch": 0.6606606606606606,
"grad_norm": 0.6532417856194169,
"learning_rate": 3.7601713062098504e-05,
"loss": 0.3358,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3105970621109009,
"step": 440,
"valid_targets_mean": 4052.7,
"valid_targets_min": 469
},
{
"epoch": 0.6681681681681682,
"grad_norm": 0.5810179731496691,
"learning_rate": 3.802997858672377e-05,
"loss": 0.3534,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2967357933521271,
"step": 445,
"valid_targets_mean": 5399.5,
"valid_targets_min": 481
},
{
"epoch": 0.6756756756756757,
"grad_norm": 0.4933051723343659,
"learning_rate": 3.8458244111349045e-05,
"loss": 0.307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2656002640724182,
"step": 450,
"valid_targets_mean": 5050.2,
"valid_targets_min": 536
},
{
"epoch": 0.6831831831831832,
"grad_norm": 0.5117823141215931,
"learning_rate": 3.8886509635974305e-05,
"loss": 0.3345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3394744396209717,
"step": 455,
"valid_targets_mean": 4780.2,
"valid_targets_min": 698
},
{
"epoch": 0.6906906906906907,
"grad_norm": 0.5513150421712305,
"learning_rate": 3.931477516059957e-05,
"loss": 0.3344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38678789138793945,
"step": 460,
"valid_targets_mean": 4995.6,
"valid_targets_min": 787
},
{
"epoch": 0.6981981981981982,
"grad_norm": 0.5223578821175074,
"learning_rate": 3.974304068522484e-05,
"loss": 0.3301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3217771053314209,
"step": 465,
"valid_targets_mean": 5331.4,
"valid_targets_min": 1007
},
{
"epoch": 0.7057057057057057,
"grad_norm": 0.5938737922502441,
"learning_rate": 3.999997756656772e-05,
"loss": 0.3306,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31824183464050293,
"step": 470,
"valid_targets_mean": 4223.0,
"valid_targets_min": 452
},
{
"epoch": 0.7132132132132132,
"grad_norm": 0.49626310595338613,
"learning_rate": 3.9999725191032436e-05,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26925772428512573,
"step": 475,
"valid_targets_mean": 5763.9,
"valid_targets_min": 761
},
{
"epoch": 0.7207207207207207,
"grad_norm": 0.6276161448251935,
"learning_rate": 3.999919240172184e-05,
"loss": 0.3228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.325122594833374,
"step": 480,
"valid_targets_mean": 4395.4,
"valid_targets_min": 662
},
{
"epoch": 0.7282282282282282,
"grad_norm": 0.598897987227093,
"learning_rate": 3.9998379206106104e-05,
"loss": 0.2941,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2764396369457245,
"step": 485,
"valid_targets_mean": 5031.5,
"valid_targets_min": 836
},
{
"epoch": 0.7357357357357357,
"grad_norm": 0.5920738798268582,
"learning_rate": 3.9997285615586944e-05,
"loss": 0.3449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33547401428222656,
"step": 490,
"valid_targets_mean": 4218.7,
"valid_targets_min": 416
},
{
"epoch": 0.7432432432432432,
"grad_norm": 0.5388292737396405,
"learning_rate": 3.999591164549747e-05,
"loss": 0.3216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30026373267173767,
"step": 495,
"valid_targets_mean": 5046.2,
"valid_targets_min": 885
},
{
"epoch": 0.7507507507507507,
"grad_norm": 0.7138413019632255,
"learning_rate": 3.999425731510195e-05,
"loss": 0.3161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3095625340938568,
"step": 500,
"valid_targets_mean": 3115.5,
"valid_targets_min": 696
},
{
"epoch": 0.7582582582582582,
"grad_norm": 0.5065067605354636,
"learning_rate": 3.9992322647595543e-05,
"loss": 0.3132,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2668853998184204,
"step": 505,
"valid_targets_mean": 4890.2,
"valid_targets_min": 583
},
{
"epoch": 0.7657657657657657,
"grad_norm": 0.48772270569522996,
"learning_rate": 3.999010767010401e-05,
"loss": 0.2792,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21127644181251526,
"step": 510,
"valid_targets_mean": 4030.5,
"valid_targets_min": 620
},
{
"epoch": 0.7732732732732732,
"grad_norm": 0.688910852981923,
"learning_rate": 3.998761241368328e-05,
"loss": 0.3356,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31102752685546875,
"step": 515,
"valid_targets_mean": 2963.6,
"valid_targets_min": 662
},
{
"epoch": 0.7807807807807807,
"grad_norm": 0.590399156229966,
"learning_rate": 3.9984836913319044e-05,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.295174777507782,
"step": 520,
"valid_targets_mean": 3820.8,
"valid_targets_min": 547
},
{
"epoch": 0.7882882882882883,
"grad_norm": 0.7498553089205983,
"learning_rate": 3.998178120792627e-05,
"loss": 0.3289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29107627272605896,
"step": 525,
"valid_targets_mean": 4623.9,
"valid_targets_min": 463
},
{
"epoch": 0.7957957957957958,
"grad_norm": 0.541430521248251,
"learning_rate": 3.9978445340348646e-05,
"loss": 0.3114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.35057809948921204,
"step": 530,
"valid_targets_mean": 4895.9,
"valid_targets_min": 810
},
{
"epoch": 0.8033033033033034,
"grad_norm": 0.6145616694631061,
"learning_rate": 3.997482935735796e-05,
"loss": 0.2989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2825467586517334,
"step": 535,
"valid_targets_mean": 4079.4,
"valid_targets_min": 593
},
{
"epoch": 0.8108108108108109,
"grad_norm": 0.6457216047110463,
"learning_rate": 3.997093330965349e-05,
"loss": 0.3289,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37978658080101013,
"step": 540,
"valid_targets_mean": 3493.6,
"valid_targets_min": 513
},
{
"epoch": 0.8183183183183184,
"grad_norm": 0.5512024613609153,
"learning_rate": 3.9966757251861256e-05,
"loss": 0.3083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30473941564559937,
"step": 545,
"valid_targets_mean": 4363.6,
"valid_targets_min": 798
},
{
"epoch": 0.8258258258258259,
"grad_norm": 0.5404758251655593,
"learning_rate": 3.996230124253328e-05,
"loss": 0.2928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2958792746067047,
"step": 550,
"valid_targets_mean": 4708.9,
"valid_targets_min": 480
},
{
"epoch": 0.8333333333333334,
"grad_norm": 0.5409326702314928,
"learning_rate": 3.995756534414672e-05,
"loss": 0.3015,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3055042028427124,
"step": 555,
"valid_targets_mean": 4889.0,
"valid_targets_min": 634
},
{
"epoch": 0.8408408408408409,
"grad_norm": 0.877523092977663,
"learning_rate": 3.9952549623103065e-05,
"loss": 0.3031,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27620965242385864,
"step": 560,
"valid_targets_mean": 3901.4,
"valid_targets_min": 782
},
{
"epoch": 0.8483483483483484,
"grad_norm": 0.5593566066914221,
"learning_rate": 3.994725414972713e-05,
"loss": 0.331,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33034461736679077,
"step": 565,
"valid_targets_mean": 4464.5,
"valid_targets_min": 847
},
{
"epoch": 0.8558558558558559,
"grad_norm": 0.6652170124791761,
"learning_rate": 3.994167899826614e-05,
"loss": 0.2967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.258162260055542,
"step": 570,
"valid_targets_mean": 3842.9,
"valid_targets_min": 410
},
{
"epoch": 0.8633633633633634,
"grad_norm": 0.5319260103081287,
"learning_rate": 3.993582424688861e-05,
"loss": 0.2819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2436560094356537,
"step": 575,
"valid_targets_mean": 4503.2,
"valid_targets_min": 810
},
{
"epoch": 0.8708708708708709,
"grad_norm": 0.5435805707257723,
"learning_rate": 3.9929689977683315e-05,
"loss": 0.3088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2837572991847992,
"step": 580,
"valid_targets_mean": 4475.9,
"valid_targets_min": 697
},
{
"epoch": 0.8783783783783784,
"grad_norm": 0.6279074659022925,
"learning_rate": 3.992327627665814e-05,
"loss": 0.3233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3020919859409332,
"step": 585,
"valid_targets_mean": 3179.3,
"valid_targets_min": 602
},
{
"epoch": 0.8858858858858859,
"grad_norm": 0.6751035596060991,
"learning_rate": 3.99165832337388e-05,
"loss": 0.3098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2893165349960327,
"step": 590,
"valid_targets_mean": 3005.4,
"valid_targets_min": 504
},
{
"epoch": 0.8933933933933934,
"grad_norm": 0.9253018906213728,
"learning_rate": 3.990961094276767e-05,
"loss": 0.3072,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3459416627883911,
"step": 595,
"valid_targets_mean": 2077.6,
"valid_targets_min": 485
},
{
"epoch": 0.9009009009009009,
"grad_norm": 0.6687225112938137,
"learning_rate": 3.990235950150242e-05,
"loss": 0.3079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36818212270736694,
"step": 600,
"valid_targets_mean": 3371.7,
"valid_targets_min": 715
},
{
"epoch": 0.9084084084084084,
"grad_norm": 0.5328749806757945,
"learning_rate": 3.9894829011614627e-05,
"loss": 0.3135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25350844860076904,
"step": 605,
"valid_targets_mean": 3857.8,
"valid_targets_min": 521
},
{
"epoch": 0.9159159159159159,
"grad_norm": 0.675741595187441,
"learning_rate": 3.988701957868842e-05,
"loss": 0.3172,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3360707759857178,
"step": 610,
"valid_targets_mean": 2917.3,
"valid_targets_min": 605
},
{
"epoch": 0.9234234234234234,
"grad_norm": 0.6571910621752247,
"learning_rate": 3.987893131221892e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2482086569070816,
"step": 615,
"valid_targets_mean": 3313.1,
"valid_targets_min": 510
},
{
"epoch": 0.9309309309309309,
"grad_norm": 0.6979768745974733,
"learning_rate": 3.987056432561075e-05,
"loss": 0.3034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3537478744983673,
"step": 620,
"valid_targets_mean": 3899.6,
"valid_targets_min": 471
},
{
"epoch": 0.9384384384384384,
"grad_norm": 0.46982739010374835,
"learning_rate": 3.986191873617645e-05,
"loss": 0.318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27537375688552856,
"step": 625,
"valid_targets_mean": 5885.1,
"valid_targets_min": 593
},
{
"epoch": 0.9459459459459459,
"grad_norm": 0.5400448261626185,
"learning_rate": 3.985299466513479e-05,
"loss": 0.3106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3220127820968628,
"step": 630,
"valid_targets_mean": 4269.6,
"valid_targets_min": 558
},
{
"epoch": 0.9534534534534534,
"grad_norm": 0.5242379048874888,
"learning_rate": 3.984379223760912e-05,
"loss": 0.3102,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.36460551619529724,
"step": 635,
"valid_targets_mean": 4742.2,
"valid_targets_min": 670
},
{
"epoch": 0.960960960960961,
"grad_norm": 0.5056910710384006,
"learning_rate": 3.983431158262558e-05,
"loss": 0.2783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2684648334980011,
"step": 640,
"valid_targets_mean": 4608.9,
"valid_targets_min": 805
},
{
"epoch": 0.9684684684684685,
"grad_norm": 0.5297540154671703,
"learning_rate": 3.982455283311131e-05,
"loss": 0.325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25975459814071655,
"step": 645,
"valid_targets_mean": 4382.8,
"valid_targets_min": 772
},
{
"epoch": 0.975975975975976,
"grad_norm": 0.555629136176801,
"learning_rate": 3.981451612589259e-05,
"loss": 0.28,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26162397861480713,
"step": 650,
"valid_targets_mean": 4827.0,
"valid_targets_min": 611
},
{
"epoch": 0.9834834834834835,
"grad_norm": 0.7355128171152777,
"learning_rate": 3.980420160169289e-05,
"loss": 0.2788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28353631496429443,
"step": 655,
"valid_targets_mean": 4060.4,
"valid_targets_min": 766
},
{
"epoch": 0.990990990990991,
"grad_norm": 0.6098329219635357,
"learning_rate": 3.979360940513092e-05,
"loss": 0.3267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2917211651802063,
"step": 660,
"valid_targets_mean": 3110.2,
"valid_targets_min": 536
},
{
"epoch": 0.9984984984984985,
"grad_norm": 0.6602685528415261,
"learning_rate": 3.978273968471865e-05,
"loss": 0.3291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37517815828323364,
"step": 665,
"valid_targets_mean": 3097.9,
"valid_targets_min": 623
},
{
"epoch": 1.006006006006006,
"grad_norm": 0.5990905965495634,
"learning_rate": 3.97715925928591e-05,
"loss": 0.3701,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31573376059532166,
"step": 670,
"valid_targets_mean": 5335.8,
"valid_targets_min": 657
},
{
"epoch": 1.0135135135135136,
"grad_norm": 0.5051572310687712,
"learning_rate": 3.9760168285844345e-05,
"loss": 0.2747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2896278500556946,
"step": 675,
"valid_targets_mean": 4987.1,
"valid_targets_min": 724
},
{
"epoch": 1.021021021021021,
"grad_norm": 0.5358689615840903,
"learning_rate": 3.974846692385323e-05,
"loss": 0.2765,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29317814111709595,
"step": 680,
"valid_targets_mean": 5053.4,
"valid_targets_min": 723
},
{
"epoch": 1.0285285285285286,
"grad_norm": 0.7789287894144826,
"learning_rate": 3.973648867094917e-05,
"loss": 0.3181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3238382935523987,
"step": 685,
"valid_targets_mean": 3482.4,
"valid_targets_min": 492
},
{
"epoch": 1.0360360360360361,
"grad_norm": 0.5563018194673951,
"learning_rate": 3.972423369507783e-05,
"loss": 0.3166,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3259349465370178,
"step": 690,
"valid_targets_mean": 5252.0,
"valid_targets_min": 850
},
{
"epoch": 1.0435435435435436,
"grad_norm": 0.7250068591194968,
"learning_rate": 3.971170216806477e-05,
"loss": 0.3198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3443298935890198,
"step": 695,
"valid_targets_mean": 2799.4,
"valid_targets_min": 588
},
{
"epoch": 1.0510510510510511,
"grad_norm": 0.7089445149146085,
"learning_rate": 3.969889426561304e-05,
"loss": 0.3328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31399601697921753,
"step": 700,
"valid_targets_mean": 3693.1,
"valid_targets_min": 606
},
{
"epoch": 1.0585585585585586,
"grad_norm": 0.4834579345868247,
"learning_rate": 3.968581016730073e-05,
"loss": 0.2893,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28393715620040894,
"step": 705,
"valid_targets_mean": 5210.3,
"valid_targets_min": 1146
},
{
"epoch": 1.0660660660660661,
"grad_norm": 0.580488043726015,
"learning_rate": 3.9672450056578426e-05,
"loss": 0.3114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3525095582008362,
"step": 710,
"valid_targets_mean": 4987.9,
"valid_targets_min": 872
},
{
"epoch": 1.0735735735735736,
"grad_norm": 0.5830757190666622,
"learning_rate": 3.965881412076665e-05,
"loss": 0.2927,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2518344223499298,
"step": 715,
"valid_targets_mean": 3772.8,
"valid_targets_min": 301
},
{
"epoch": 1.0810810810810811,
"grad_norm": 0.603911299798853,
"learning_rate": 3.964490255105325e-05,
"loss": 0.2897,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2885856330394745,
"step": 720,
"valid_targets_mean": 3888.7,
"valid_targets_min": 610
},
{
"epoch": 1.0885885885885886,
"grad_norm": 0.721271255619491,
"learning_rate": 3.96307155424907e-05,
"loss": 0.3009,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33753496408462524,
"step": 725,
"valid_targets_mean": 3255.9,
"valid_targets_min": 323
},
{
"epoch": 1.0960960960960962,
"grad_norm": 0.5688287102135644,
"learning_rate": 3.961625329399335e-05,
"loss": 0.288,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24445214867591858,
"step": 730,
"valid_targets_mean": 4295.9,
"valid_targets_min": 322
},
{
"epoch": 1.1036036036036037,
"grad_norm": 0.5822780762193985,
"learning_rate": 3.960151600833469e-05,
"loss": 0.303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3242020606994629,
"step": 735,
"valid_targets_mean": 4509.4,
"valid_targets_min": 749
},
{
"epoch": 1.1111111111111112,
"grad_norm": 0.6988383396255673,
"learning_rate": 3.958650389214444e-05,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2766273021697998,
"step": 740,
"valid_targets_mean": 3003.1,
"valid_targets_min": 528
},
{
"epoch": 1.1186186186186187,
"grad_norm": 0.5530037303674098,
"learning_rate": 3.95712171559057e-05,
"loss": 0.2862,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2562218904495239,
"step": 745,
"valid_targets_mean": 4301.1,
"valid_targets_min": 761
},
{
"epoch": 1.1261261261261262,
"grad_norm": 0.5917466496490228,
"learning_rate": 3.955565601395199e-05,
"loss": 0.2995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27801835536956787,
"step": 750,
"valid_targets_mean": 4016.3,
"valid_targets_min": 611
},
{
"epoch": 1.1336336336336337,
"grad_norm": 0.5314431651828969,
"learning_rate": 3.953982068446424e-05,
"loss": 0.274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2895042896270752,
"step": 755,
"valid_targets_mean": 4829.9,
"valid_targets_min": 689
},
{
"epoch": 1.1411411411411412,
"grad_norm": 0.5403700692721292,
"learning_rate": 3.952371138946773e-05,
"loss": 0.311,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2900671660900116,
"step": 760,
"valid_targets_mean": 5102.2,
"valid_targets_min": 811
},
{
"epoch": 1.1486486486486487,
"grad_norm": 0.4466270912829498,
"learning_rate": 3.950732835482896e-05,
"loss": 0.2634,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23144987225532532,
"step": 765,
"valid_targets_mean": 4800.4,
"valid_targets_min": 566
},
{
"epoch": 1.1561561561561562,
"grad_norm": 0.5126441976083996,
"learning_rate": 3.9490671810252525e-05,
"loss": 0.2738,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2398991733789444,
"step": 770,
"valid_targets_mean": 3322.2,
"valid_targets_min": 260
},
{
"epoch": 1.1636636636636637,
"grad_norm": 0.6835376056729422,
"learning_rate": 3.947374198927787e-05,
"loss": 0.2818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2788790464401245,
"step": 775,
"valid_targets_mean": 2824.4,
"valid_targets_min": 481
},
{
"epoch": 1.1711711711711712,
"grad_norm": 0.7480255450833108,
"learning_rate": 3.945653912927599e-05,
"loss": 0.3116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.41352379322052,
"step": 780,
"valid_targets_mean": 3108.0,
"valid_targets_min": 525
},
{
"epoch": 1.1786786786786787,
"grad_norm": 0.7012989879636262,
"learning_rate": 3.943906347144615e-05,
"loss": 0.2908,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2697921395301819,
"step": 785,
"valid_targets_mean": 2765.4,
"valid_targets_min": 559
},
{
"epoch": 1.1861861861861862,
"grad_norm": 0.6294134200242447,
"learning_rate": 3.942131526081249e-05,
"loss": 0.2965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28815174102783203,
"step": 790,
"valid_targets_mean": 5498.2,
"valid_targets_min": 760
},
{
"epoch": 1.1936936936936937,
"grad_norm": 0.5405122434808368,
"learning_rate": 3.940329474622055e-05,
"loss": 0.3025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26721876859664917,
"step": 795,
"valid_targets_mean": 4779.1,
"valid_targets_min": 657
},
{
"epoch": 1.2012012012012012,
"grad_norm": 0.6027467491848216,
"learning_rate": 3.938500218033384e-05,
"loss": 0.2749,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28523164987564087,
"step": 800,
"valid_targets_mean": 3985.0,
"valid_targets_min": 673
},
{
"epoch": 1.2087087087087087,
"grad_norm": 0.49337094306984625,
"learning_rate": 3.936643781963024e-05,
"loss": 0.3508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3622555136680603,
"step": 805,
"valid_targets_mean": 6322.6,
"valid_targets_min": 390
},
{
"epoch": 1.2162162162162162,
"grad_norm": 0.5183504295911457,
"learning_rate": 3.9347601924398475e-05,
"loss": 0.2833,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2589194178581238,
"step": 810,
"valid_targets_mean": 4678.0,
"valid_targets_min": 899
},
{
"epoch": 1.2237237237237237,
"grad_norm": 0.5342990678808706,
"learning_rate": 3.932849475873438e-05,
"loss": 0.3152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2209431231021881,
"step": 815,
"valid_targets_mean": 4677.4,
"valid_targets_min": 815
},
{
"epoch": 1.2312312312312312,
"grad_norm": 0.4783352437662895,
"learning_rate": 3.9309116590537266e-05,
"loss": 0.2653,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2841101884841919,
"step": 820,
"valid_targets_mean": 4398.6,
"valid_targets_min": 874
},
{
"epoch": 1.2387387387387387,
"grad_norm": 0.5066260881718098,
"learning_rate": 3.9289467691506125e-05,
"loss": 0.3159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2934754490852356,
"step": 825,
"valid_targets_mean": 4760.6,
"valid_targets_min": 670
},
{
"epoch": 1.2462462462462462,
"grad_norm": 0.6920092254384417,
"learning_rate": 3.926954833713585e-05,
"loss": 0.3049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3148398697376251,
"step": 830,
"valid_targets_mean": 2882.6,
"valid_targets_min": 635
},
{
"epoch": 1.2537537537537538,
"grad_norm": 0.49074537646024496,
"learning_rate": 3.924935880671334e-05,
"loss": 0.3005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2520464062690735,
"step": 835,
"valid_targets_mean": 5137.5,
"valid_targets_min": 1027
},
{
"epoch": 1.2612612612612613,
"grad_norm": 0.6626501857332863,
"learning_rate": 3.922889938331361e-05,
"loss": 0.3003,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.38677817583084106,
"step": 840,
"valid_targets_mean": 3420.8,
"valid_targets_min": 627
},
{
"epoch": 1.2687687687687688,
"grad_norm": 0.5332552957049799,
"learning_rate": 3.920817035379581e-05,
"loss": 0.2804,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30235785245895386,
"step": 845,
"valid_targets_mean": 4300.7,
"valid_targets_min": 645
},
{
"epoch": 1.2762762762762763,
"grad_norm": 0.5542167310126439,
"learning_rate": 3.9187172008799195e-05,
"loss": 0.3007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3331342339515686,
"step": 850,
"valid_targets_mean": 4431.8,
"valid_targets_min": 382
},
{
"epoch": 1.2837837837837838,
"grad_norm": 0.47602297520673265,
"learning_rate": 3.9165904642739085e-05,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24128374457359314,
"step": 855,
"valid_targets_mean": 5224.0,
"valid_targets_min": 565
},
{
"epoch": 1.2912912912912913,
"grad_norm": 0.4907394738004159,
"learning_rate": 3.914436855380269e-05,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2902330458164215,
"step": 860,
"valid_targets_mean": 4872.4,
"valid_targets_min": 469
},
{
"epoch": 1.2987987987987988,
"grad_norm": 0.5780103792011559,
"learning_rate": 3.9122564043944956e-05,
"loss": 0.3022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.324124276638031,
"step": 865,
"valid_targets_mean": 4095.2,
"valid_targets_min": 836
},
{
"epoch": 1.3063063063063063,
"grad_norm": 1.4238637814086352,
"learning_rate": 3.910049141888433e-05,
"loss": 0.3061,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3050238788127899,
"step": 870,
"valid_targets_mean": 5166.2,
"valid_targets_min": 716
},
{
"epoch": 1.3138138138138138,
"grad_norm": 0.49302688153022367,
"learning_rate": 3.907815098809849e-05,
"loss": 0.268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2744116187095642,
"step": 875,
"valid_targets_mean": 5715.9,
"valid_targets_min": 491
},
{
"epoch": 1.3213213213213213,
"grad_norm": 0.6362296442287568,
"learning_rate": 3.9055543064819945e-05,
"loss": 0.3095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28804486989974976,
"step": 880,
"valid_targets_mean": 3622.8,
"valid_targets_min": 642
},
{
"epoch": 1.3288288288288288,
"grad_norm": 0.627623374325793,
"learning_rate": 3.9032667966031704e-05,
"loss": 0.2754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3453376293182373,
"step": 885,
"valid_targets_mean": 3533.0,
"valid_targets_min": 600
},
{
"epoch": 1.3363363363363363,
"grad_norm": 0.6493174026676456,
"learning_rate": 3.9009526012462834e-05,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3329022228717804,
"step": 890,
"valid_targets_mean": 4443.5,
"valid_targets_min": 699
},
{
"epoch": 1.3438438438438438,
"grad_norm": 0.5328791757099103,
"learning_rate": 3.89861175285839e-05,
"loss": 0.2754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2938082218170166,
"step": 895,
"valid_targets_mean": 4643.6,
"valid_targets_min": 674
},
{
"epoch": 1.3513513513513513,
"grad_norm": 0.5404971152718483,
"learning_rate": 3.89624428426025e-05,
"loss": 0.3149,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3295516073703766,
"step": 900,
"valid_targets_mean": 5400.6,
"valid_targets_min": 431
},
{
"epoch": 1.3588588588588588,
"grad_norm": 0.5148482135727713,
"learning_rate": 3.8938502286458586e-05,
"loss": 0.2965,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2672591209411621,
"step": 905,
"valid_targets_mean": 4434.6,
"valid_targets_min": 414
},
{
"epoch": 1.3663663663663663,
"grad_norm": 0.46940700753823117,
"learning_rate": 3.891429619581986e-05,
"loss": 0.2612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25686946511268616,
"step": 910,
"valid_targets_mean": 5001.9,
"valid_targets_min": 750
},
{
"epoch": 1.3738738738738738,
"grad_norm": 0.5588622944159107,
"learning_rate": 3.888982491007705e-05,
"loss": 0.3063,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.37934252619743347,
"step": 915,
"valid_targets_mean": 4426.3,
"valid_targets_min": 480
},
{
"epoch": 1.3813813813813813,
"grad_norm": 0.5032151155279457,
"learning_rate": 3.886508877233914e-05,
"loss": 0.3002,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24294015765190125,
"step": 920,
"valid_targets_mean": 4203.2,
"valid_targets_min": 537
},
{
"epoch": 1.3888888888888888,
"grad_norm": 0.6375386060346272,
"learning_rate": 3.8840088129428594e-05,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2843095660209656,
"step": 925,
"valid_targets_mean": 2762.1,
"valid_targets_min": 628
},
{
"epoch": 1.3963963963963963,
"grad_norm": 0.42954687639507877,
"learning_rate": 3.881482333187647e-05,
"loss": 0.2934,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24300193786621094,
"step": 930,
"valid_targets_mean": 6139.7,
"valid_targets_min": 1420
},
{
"epoch": 1.4039039039039038,
"grad_norm": 0.5288152668995841,
"learning_rate": 3.8789294733917486e-05,
"loss": 0.2809,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27250343561172485,
"step": 935,
"valid_targets_mean": 5227.9,
"valid_targets_min": 601
},
{
"epoch": 1.4114114114114114,
"grad_norm": 0.4018203487416013,
"learning_rate": 3.876350269348509e-05,
"loss": 0.2843,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2769063115119934,
"step": 940,
"valid_targets_mean": 7001.6,
"valid_targets_min": 791
},
{
"epoch": 1.4189189189189189,
"grad_norm": 0.4733738366398111,
"learning_rate": 3.873744757220642e-05,
"loss": 0.3156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2413673847913742,
"step": 945,
"valid_targets_mean": 5955.6,
"valid_targets_min": 723
},
{
"epoch": 1.4264264264264264,
"grad_norm": 0.40178048986196624,
"learning_rate": 3.871112973539725e-05,
"loss": 0.2818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22361788153648376,
"step": 950,
"valid_targets_mean": 5932.0,
"valid_targets_min": 684
},
{
"epoch": 1.4339339339339339,
"grad_norm": 0.5858661329948348,
"learning_rate": 3.868454955205685e-05,
"loss": 0.2967,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26762083172798157,
"step": 955,
"valid_targets_mean": 4612.1,
"valid_targets_min": 638
},
{
"epoch": 1.4414414414414414,
"grad_norm": 0.59370232296713,
"learning_rate": 3.86577073948628e-05,
"loss": 0.3087,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.245170459151268,
"step": 960,
"valid_targets_mean": 4544.8,
"valid_targets_min": 700
},
{
"epoch": 1.4489489489489489,
"grad_norm": 0.5776834809155071,
"learning_rate": 3.8630603640165815e-05,
"loss": 0.2795,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3211957812309265,
"step": 965,
"valid_targets_mean": 3560.0,
"valid_targets_min": 462
},
{
"epoch": 1.4564564564564564,
"grad_norm": 0.5619424459014478,
"learning_rate": 3.860323866798443e-05,
"loss": 0.2582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21985271573066711,
"step": 970,
"valid_targets_mean": 4147.0,
"valid_targets_min": 964
},
{
"epoch": 1.4639639639639639,
"grad_norm": 0.5783533174246083,
"learning_rate": 3.857561286199968e-05,
"loss": 0.2969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29089707136154175,
"step": 975,
"valid_targets_mean": 3580.6,
"valid_targets_min": 489
},
{
"epoch": 1.4714714714714714,
"grad_norm": 0.4955776875207588,
"learning_rate": 3.85477266095497e-05,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2684110999107361,
"step": 980,
"valid_targets_mean": 4121.5,
"valid_targets_min": 565
},
{
"epoch": 1.478978978978979,
"grad_norm": 0.5707278559095864,
"learning_rate": 3.851958030162433e-05,
"loss": 0.274,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3071454167366028,
"step": 985,
"valid_targets_mean": 4583.5,
"valid_targets_min": 711
},
{
"epoch": 1.4864864864864864,
"grad_norm": 0.5349960494922307,
"learning_rate": 3.8491174332859625e-05,
"loss": 0.2644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2876233160495758,
"step": 990,
"valid_targets_mean": 3913.2,
"valid_targets_min": 652
},
{
"epoch": 1.493993993993994,
"grad_norm": 0.7242433186973595,
"learning_rate": 3.84625091015323e-05,
"loss": 0.2832,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2717621624469757,
"step": 995,
"valid_targets_mean": 3196.1,
"valid_targets_min": 613
},
{
"epoch": 1.5015015015015014,
"grad_norm": 0.559821205756259,
"learning_rate": 3.843358500955416e-05,
"loss": 0.277,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27973076701164246,
"step": 1000,
"valid_targets_mean": 3837.9,
"valid_targets_min": 875
},
{
"epoch": 1.509009009009009,
"grad_norm": 0.5377924424199211,
"learning_rate": 3.840440246246648e-05,
"loss": 0.2818,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2526509165763855,
"step": 1005,
"valid_targets_mean": 3364.9,
"valid_targets_min": 732
},
{
"epoch": 1.5165165165165164,
"grad_norm": 0.6037241854694765,
"learning_rate": 3.837496186943428e-05,
"loss": 0.2838,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3358380198478699,
"step": 1010,
"valid_targets_mean": 4278.9,
"valid_targets_min": 638
},
{
"epoch": 1.524024024024024,
"grad_norm": 0.4711675437570829,
"learning_rate": 3.8345263643240634e-05,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26968130469322205,
"step": 1015,
"valid_targets_mean": 5544.2,
"valid_targets_min": 648
},
{
"epoch": 1.5315315315315314,
"grad_norm": 0.5958428128963504,
"learning_rate": 3.831530820028084e-05,
"loss": 0.3192,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32176512479782104,
"step": 1020,
"valid_targets_mean": 3855.1,
"valid_targets_min": 674
},
{
"epoch": 1.539039039039039,
"grad_norm": 0.4865056298850766,
"learning_rate": 3.828509596055662e-05,
"loss": 0.2712,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2525503635406494,
"step": 1025,
"valid_targets_mean": 6991.5,
"valid_targets_min": 567
},
{
"epoch": 1.5465465465465464,
"grad_norm": 0.5566299314673824,
"learning_rate": 3.82546273476702e-05,
"loss": 0.3577,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2959470748901367,
"step": 1030,
"valid_targets_mean": 4056.7,
"valid_targets_min": 528
},
{
"epoch": 1.554054054054054,
"grad_norm": 0.6266122143638768,
"learning_rate": 3.822390278881839e-05,
"loss": 0.2924,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31994956731796265,
"step": 1035,
"valid_targets_mean": 3313.5,
"valid_targets_min": 870
},
{
"epoch": 1.5615615615615615,
"grad_norm": 0.5379754675133966,
"learning_rate": 3.819292271478659e-05,
"loss": 0.2853,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26793667674064636,
"step": 1040,
"valid_targets_mean": 3280.4,
"valid_targets_min": 540
},
{
"epoch": 1.569069069069069,
"grad_norm": 0.42701565978810035,
"learning_rate": 3.816168755994274e-05,
"loss": 0.2752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21840263903141022,
"step": 1045,
"valid_targets_mean": 4529.6,
"valid_targets_min": 904
},
{
"epoch": 1.5765765765765765,
"grad_norm": 0.5000336725002723,
"learning_rate": 3.813019776223124e-05,
"loss": 0.286,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2662447690963745,
"step": 1050,
"valid_targets_mean": 4867.2,
"valid_targets_min": 988
},
{
"epoch": 1.584084084084084,
"grad_norm": 0.5648658240320987,
"learning_rate": 3.809845376316681e-05,
"loss": 0.3156,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29331260919570923,
"step": 1055,
"valid_targets_mean": 4341.2,
"valid_targets_min": 328
},
{
"epoch": 1.5915915915915915,
"grad_norm": 0.5284383529439995,
"learning_rate": 3.8066456007828304e-05,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23197105526924133,
"step": 1060,
"valid_targets_mean": 3968.8,
"valid_targets_min": 389
},
{
"epoch": 1.599099099099099,
"grad_norm": 0.5216262376393843,
"learning_rate": 3.803420494485244e-05,
"loss": 0.273,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2597469687461853,
"step": 1065,
"valid_targets_mean": 4115.9,
"valid_targets_min": 579
},
{
"epoch": 1.6066066066066065,
"grad_norm": 0.4939695307516829,
"learning_rate": 3.800170102642757e-05,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23144802451133728,
"step": 1070,
"valid_targets_mean": 3866.6,
"valid_targets_min": 486
},
{
"epoch": 1.614114114114114,
"grad_norm": 0.5829421644769698,
"learning_rate": 3.796894470828726e-05,
"loss": 0.267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.222642183303833,
"step": 1075,
"valid_targets_mean": 4570.8,
"valid_targets_min": 844
},
{
"epoch": 1.6216216216216215,
"grad_norm": 0.5335734411442947,
"learning_rate": 3.793593644970397e-05,
"loss": 0.2881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2972537577152252,
"step": 1080,
"valid_targets_mean": 4192.4,
"valid_targets_min": 648
},
{
"epoch": 1.629129129129129,
"grad_norm": 0.7509523435082093,
"learning_rate": 3.7902676713482584e-05,
"loss": 0.2991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3354663848876953,
"step": 1085,
"valid_targets_mean": 3534.2,
"valid_targets_min": 875
},
{
"epoch": 1.6366366366366365,
"grad_norm": 0.45680598867761874,
"learning_rate": 3.786916596595391e-05,
"loss": 0.2835,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2275020182132721,
"step": 1090,
"valid_targets_mean": 4664.6,
"valid_targets_min": 768
},
{
"epoch": 1.644144144144144,
"grad_norm": 0.614422278972368,
"learning_rate": 3.783540467696817e-05,
"loss": 0.2845,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28407660126686096,
"step": 1095,
"valid_targets_mean": 3863.8,
"valid_targets_min": 409
},
{
"epoch": 1.6516516516516515,
"grad_norm": 0.5074836388259119,
"learning_rate": 3.78013933198884e-05,
"loss": 0.2611,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23754659295082092,
"step": 1100,
"valid_targets_mean": 3914.6,
"valid_targets_min": 1027
},
{
"epoch": 1.659159159159159,
"grad_norm": 0.45212979425084815,
"learning_rate": 3.776713237158379e-05,
"loss": 0.2728,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2909110188484192,
"step": 1105,
"valid_targets_mean": 5534.1,
"valid_targets_min": 655
},
{
"epoch": 1.6666666666666665,
"grad_norm": 0.6316240705989837,
"learning_rate": 3.773262231242305e-05,
"loss": 0.3053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2717238664627075,
"step": 1110,
"valid_targets_mean": 3312.1,
"valid_targets_min": 367
},
{
"epoch": 1.674174174174174,
"grad_norm": 0.5332254751800973,
"learning_rate": 3.7697863626267615e-05,
"loss": 0.3138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2853066623210907,
"step": 1115,
"valid_targets_mean": 3955.4,
"valid_targets_min": 731
},
{
"epoch": 1.6816816816816815,
"grad_norm": 0.6436721167931566,
"learning_rate": 3.7662856800464907e-05,
"loss": 0.2876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33219900727272034,
"step": 1120,
"valid_targets_mean": 4150.2,
"valid_targets_min": 402
},
{
"epoch": 1.689189189189189,
"grad_norm": 0.41517090061996553,
"learning_rate": 3.762760232584148e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2333643138408661,
"step": 1125,
"valid_targets_mean": 5115.1,
"valid_targets_min": 841
},
{
"epoch": 1.6966966966966965,
"grad_norm": 0.5176992190887993,
"learning_rate": 3.7592100696696134e-05,
"loss": 0.2732,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2570965886116028,
"step": 1130,
"valid_targets_mean": 3668.6,
"valid_targets_min": 656
},
{
"epoch": 1.704204204204204,
"grad_norm": 0.511279913702578,
"learning_rate": 3.755635241079301e-05,
"loss": 0.2719,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22817838191986084,
"step": 1135,
"valid_targets_mean": 3872.6,
"valid_targets_min": 475
},
{
"epoch": 1.7117117117117115,
"grad_norm": 0.6164706177166612,
"learning_rate": 3.7520357969354584e-05,
"loss": 0.2907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3176250457763672,
"step": 1140,
"valid_targets_mean": 3526.4,
"valid_targets_min": 693
},
{
"epoch": 1.7192192192192193,
"grad_norm": 0.4109077325218178,
"learning_rate": 3.748411787705466e-05,
"loss": 0.3218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2506415843963623,
"step": 1145,
"valid_targets_mean": 5783.5,
"valid_targets_min": 524
},
{
"epoch": 1.7267267267267268,
"grad_norm": 0.47340788265525957,
"learning_rate": 3.744763264201125e-05,
"loss": 0.259,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28487300872802734,
"step": 1150,
"valid_targets_mean": 5147.9,
"valid_targets_min": 311
},
{
"epoch": 1.7342342342342343,
"grad_norm": 0.6361764376110007,
"learning_rate": 3.741090277577953e-05,
"loss": 0.2747,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33571434020996094,
"step": 1155,
"valid_targets_mean": 3613.9,
"valid_targets_min": 633
},
{
"epoch": 1.7417417417417418,
"grad_norm": 0.7263029802880552,
"learning_rate": 3.73739287933446e-05,
"loss": 0.3013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30988189578056335,
"step": 1160,
"valid_targets_mean": 2780.0,
"valid_targets_min": 388
},
{
"epoch": 1.7492492492492493,
"grad_norm": 0.5312249305901402,
"learning_rate": 3.733671121311426e-05,
"loss": 0.2691,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25757136940956116,
"step": 1165,
"valid_targets_mean": 4026.9,
"valid_targets_min": 605
},
{
"epoch": 1.7567567567567568,
"grad_norm": 0.5476708426420898,
"learning_rate": 3.729925055691182e-05,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30963361263275146,
"step": 1170,
"valid_targets_mean": 4677.7,
"valid_targets_min": 434
},
{
"epoch": 1.7642642642642643,
"grad_norm": 0.613322007834183,
"learning_rate": 3.7261547349968675e-05,
"loss": 0.2902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34018972516059875,
"step": 1175,
"valid_targets_mean": 3271.2,
"valid_targets_min": 407
},
{
"epoch": 1.7717717717717718,
"grad_norm": 0.6162258596946204,
"learning_rate": 3.722360212091703e-05,
"loss": 0.3093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32241833209991455,
"step": 1180,
"valid_targets_mean": 3718.6,
"valid_targets_min": 466
},
{
"epoch": 1.7792792792792793,
"grad_norm": 0.664703409023323,
"learning_rate": 3.7185415401782434e-05,
"loss": 0.2791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33108675479888916,
"step": 1185,
"valid_targets_mean": 5692.8,
"valid_targets_min": 702
},
{
"epoch": 1.7867867867867868,
"grad_norm": 0.5138638922358946,
"learning_rate": 3.7146987727976354e-05,
"loss": 0.2819,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30338913202285767,
"step": 1190,
"valid_targets_mean": 5333.4,
"valid_targets_min": 752
},
{
"epoch": 1.7942942942942943,
"grad_norm": 0.4986654846084407,
"learning_rate": 3.7108319638288654e-05,
"loss": 0.2899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2863334119319916,
"step": 1195,
"valid_targets_mean": 4185.2,
"valid_targets_min": 683
},
{
"epoch": 1.8018018018018018,
"grad_norm": 0.514824462976426,
"learning_rate": 3.706941167488002e-05,
"loss": 0.305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3966107666492462,
"step": 1200,
"valid_targets_mean": 4997.3,
"valid_targets_min": 583
},
{
"epoch": 1.8093093093093093,
"grad_norm": 0.5002026479937768,
"learning_rate": 3.70302643832744e-05,
"loss": 0.3046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3028540015220642,
"step": 1205,
"valid_targets_mean": 4384.4,
"valid_targets_min": 646
},
{
"epoch": 1.8168168168168168,
"grad_norm": 0.5733662063497278,
"learning_rate": 3.699087831235133e-05,
"loss": 0.271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28234004974365234,
"step": 1210,
"valid_targets_mean": 3882.9,
"valid_targets_min": 781
},
{
"epoch": 1.8243243243243243,
"grad_norm": 0.49934816295444895,
"learning_rate": 3.6951254014338236e-05,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27083009481430054,
"step": 1215,
"valid_targets_mean": 4725.4,
"valid_targets_min": 497
},
{
"epoch": 1.8318318318318318,
"grad_norm": 0.732103811366184,
"learning_rate": 3.69113920448027e-05,
"loss": 0.2718,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3054293394088745,
"step": 1220,
"valid_targets_mean": 2746.9,
"valid_targets_min": 478
},
{
"epoch": 1.8393393393393394,
"grad_norm": 0.6337417424539031,
"learning_rate": 3.687129296264468e-05,
"loss": 0.2591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26185324788093567,
"step": 1225,
"valid_targets_mean": 4788.4,
"valid_targets_min": 695
},
{
"epoch": 1.8468468468468469,
"grad_norm": 0.5621683788362308,
"learning_rate": 3.683095733008864e-05,
"loss": 0.2693,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2606724202632904,
"step": 1230,
"valid_targets_mean": 3237.6,
"valid_targets_min": 534
},
{
"epoch": 1.8543543543543544,
"grad_norm": 0.5288214426455534,
"learning_rate": 3.6790385712675705e-05,
"loss": 0.2837,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3149155378341675,
"step": 1235,
"valid_targets_mean": 3973.2,
"valid_targets_min": 572
},
{
"epoch": 1.8618618618618619,
"grad_norm": 0.4813442560130786,
"learning_rate": 3.6749578679255715e-05,
"loss": 0.2996,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2811282277107239,
"step": 1240,
"valid_targets_mean": 5313.8,
"valid_targets_min": 420
},
{
"epoch": 1.8693693693693694,
"grad_norm": 0.6170835431330234,
"learning_rate": 3.6708536801979246e-05,
"loss": 0.2905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32795318961143494,
"step": 1245,
"valid_targets_mean": 3692.1,
"valid_targets_min": 724
},
{
"epoch": 1.8768768768768769,
"grad_norm": 0.5375710532679772,
"learning_rate": 3.666726065628959e-05,
"loss": 0.2688,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23410853743553162,
"step": 1250,
"valid_targets_mean": 3626.6,
"valid_targets_min": 663
},
{
"epoch": 1.8843843843843844,
"grad_norm": 0.5400535513286914,
"learning_rate": 3.6625750820914694e-05,
"loss": 0.2569,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3105897903442383,
"step": 1255,
"valid_targets_mean": 3530.0,
"valid_targets_min": 400
},
{
"epoch": 1.8918918918918919,
"grad_norm": 0.7192704328062035,
"learning_rate": 3.658400787785903e-05,
"loss": 0.2711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31259477138519287,
"step": 1260,
"valid_targets_mean": 2492.8,
"valid_targets_min": 367
},
{
"epoch": 1.8993993993993994,
"grad_norm": 0.5689420833987145,
"learning_rate": 3.654203241239546e-05,
"loss": 0.2752,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2669737935066223,
"step": 1265,
"valid_targets_mean": 5125.1,
"valid_targets_min": 766
},
{
"epoch": 1.906906906906907,
"grad_norm": 0.6991606704570577,
"learning_rate": 3.649982501305701e-05,
"loss": 0.2681,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3605828285217285,
"step": 1270,
"valid_targets_mean": 2681.3,
"valid_targets_min": 603
},
{
"epoch": 1.9144144144144144,
"grad_norm": 0.5136360235806671,
"learning_rate": 3.6457386271628615e-05,
"loss": 0.2815,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2559846043586731,
"step": 1275,
"valid_targets_mean": 4230.4,
"valid_targets_min": 467
},
{
"epoch": 1.921921921921922,
"grad_norm": 0.5755425636039267,
"learning_rate": 3.641471678313883e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32143378257751465,
"step": 1280,
"valid_targets_mean": 4531.5,
"valid_targets_min": 723
},
{
"epoch": 1.9294294294294294,
"grad_norm": 0.5172980766220905,
"learning_rate": 3.6371817145851514e-05,
"loss": 0.2902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3124349117279053,
"step": 1285,
"valid_targets_mean": 5154.6,
"valid_targets_min": 690
},
{
"epoch": 1.936936936936937,
"grad_norm": 0.5579160547269432,
"learning_rate": 3.6328687961257374e-05,
"loss": 0.2863,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23261310160160065,
"step": 1290,
"valid_targets_mean": 3315.2,
"valid_targets_min": 432
},
{
"epoch": 1.9444444444444444,
"grad_norm": 0.471485760499144,
"learning_rate": 3.62853298340656e-05,
"loss": 0.2875,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23489312827587128,
"step": 1295,
"valid_targets_mean": 4736.7,
"valid_targets_min": 689
},
{
"epoch": 1.951951951951952,
"grad_norm": 0.45892772148849675,
"learning_rate": 3.624174337219536e-05,
"loss": 0.2919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23488348722457886,
"step": 1300,
"valid_targets_mean": 4925.0,
"valid_targets_min": 602
},
{
"epoch": 1.9594594594594594,
"grad_norm": 0.6569352257148999,
"learning_rate": 3.6197929186767255e-05,
"loss": 0.2827,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26401716470718384,
"step": 1305,
"valid_targets_mean": 3648.6,
"valid_targets_min": 358
},
{
"epoch": 1.966966966966967,
"grad_norm": 0.47233655136122743,
"learning_rate": 3.6153887892094786e-05,
"loss": 0.292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2689140737056732,
"step": 1310,
"valid_targets_mean": 4251.4,
"valid_targets_min": 521
},
{
"epoch": 1.9744744744744744,
"grad_norm": 0.4937344312534394,
"learning_rate": 3.6109620105675734e-05,
"loss": 0.2502,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2564142346382141,
"step": 1315,
"valid_targets_mean": 4050.1,
"valid_targets_min": 846
},
{
"epoch": 1.981981981981982,
"grad_norm": 0.5040985465764987,
"learning_rate": 3.606512644818347e-05,
"loss": 0.2959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27598607540130615,
"step": 1320,
"valid_targets_mean": 5606.7,
"valid_targets_min": 561
},
{
"epoch": 1.9894894894894894,
"grad_norm": 0.503656514625708,
"learning_rate": 3.6020407543458295e-05,
"loss": 0.2656,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24646782875061035,
"step": 1325,
"valid_targets_mean": 4084.1,
"valid_targets_min": 542
},
{
"epoch": 1.996996996996997,
"grad_norm": 0.48663621599509704,
"learning_rate": 3.597546401849866e-05,
"loss": 0.2877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3501949608325958,
"step": 1330,
"valid_targets_mean": 6161.8,
"valid_targets_min": 829
},
{
"epoch": 2.0045045045045047,
"grad_norm": 0.4886145150612323,
"learning_rate": 3.593029650345242e-05,
"loss": 0.248,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2267410159111023,
"step": 1335,
"valid_targets_mean": 4201.8,
"valid_targets_min": 585
},
{
"epoch": 2.012012012012012,
"grad_norm": 0.918223183885553,
"learning_rate": 3.588490563160793e-05,
"loss": 0.263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20230059325695038,
"step": 1340,
"valid_targets_mean": 3759.8,
"valid_targets_min": 668
},
{
"epoch": 2.0195195195195197,
"grad_norm": 0.41635246230968925,
"learning_rate": 3.583929203938523e-05,
"loss": 0.2647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20971567928791046,
"step": 1345,
"valid_targets_mean": 6513.2,
"valid_targets_min": 506
},
{
"epoch": 2.027027027027027,
"grad_norm": 0.5324224076323132,
"learning_rate": 3.5793456366327074e-05,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2577601969242096,
"step": 1350,
"valid_targets_mean": 4199.0,
"valid_targets_min": 611
},
{
"epoch": 2.0345345345345347,
"grad_norm": 0.666399334701293,
"learning_rate": 3.5747399255090016e-05,
"loss": 0.2532,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25944650173187256,
"step": 1355,
"valid_targets_mean": 3050.4,
"valid_targets_min": 513
},
{
"epoch": 2.042042042042042,
"grad_norm": 0.5560230204936001,
"learning_rate": 3.5701121351435346e-05,
"loss": 0.2565,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30907580256462097,
"step": 1360,
"valid_targets_mean": 4342.1,
"valid_targets_min": 483
},
{
"epoch": 2.0495495495495497,
"grad_norm": 0.5093455715924559,
"learning_rate": 3.565462330422006e-05,
"loss": 0.2366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23613181710243225,
"step": 1365,
"valid_targets_mean": 4160.1,
"valid_targets_min": 624
},
{
"epoch": 2.057057057057057,
"grad_norm": 0.5143252526017971,
"learning_rate": 3.560790576538777e-05,
"loss": 0.2441,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28200429677963257,
"step": 1370,
"valid_targets_mean": 5243.5,
"valid_targets_min": 529
},
{
"epoch": 2.0645645645645647,
"grad_norm": 0.6420496487933931,
"learning_rate": 3.556096938995953e-05,
"loss": 0.2644,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3083629906177521,
"step": 1375,
"valid_targets_mean": 3444.8,
"valid_targets_min": 474
},
{
"epoch": 2.0720720720720722,
"grad_norm": 0.6041025909633767,
"learning_rate": 3.551381483602472e-05,
"loss": 0.3043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34277862310409546,
"step": 1380,
"valid_targets_mean": 5168.2,
"valid_targets_min": 656
},
{
"epoch": 2.0795795795795797,
"grad_norm": 0.5065151180208464,
"learning_rate": 3.546644276473174e-05,
"loss": 0.2703,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22405189275741577,
"step": 1385,
"valid_targets_mean": 4451.1,
"valid_targets_min": 653
},
{
"epoch": 2.0870870870870872,
"grad_norm": 0.4653600091882295,
"learning_rate": 3.541885384027877e-05,
"loss": 0.2867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23494037985801697,
"step": 1390,
"valid_targets_mean": 4773.1,
"valid_targets_min": 515
},
{
"epoch": 2.0945945945945947,
"grad_norm": 0.4737552542155004,
"learning_rate": 3.53710487299045e-05,
"loss": 0.2301,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20185862481594086,
"step": 1395,
"valid_targets_mean": 4372.3,
"valid_targets_min": 656
},
{
"epoch": 2.1021021021021022,
"grad_norm": 0.618244462622168,
"learning_rate": 3.5323028103878695e-05,
"loss": 0.2647,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28137439489364624,
"step": 1400,
"valid_targets_mean": 3066.6,
"valid_targets_min": 558
},
{
"epoch": 2.1096096096096097,
"grad_norm": 0.6276854706539091,
"learning_rate": 3.527479263549287e-05,
"loss": 0.2567,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24222517013549805,
"step": 1405,
"valid_targets_mean": 3623.4,
"valid_targets_min": 562
},
{
"epoch": 2.1171171171171173,
"grad_norm": 0.5119888962756797,
"learning_rate": 3.52263430010508e-05,
"loss": 0.2456,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24120667576789856,
"step": 1410,
"valid_targets_mean": 4184.2,
"valid_targets_min": 571
},
{
"epoch": 2.1246246246246248,
"grad_norm": 0.40193152670779986,
"learning_rate": 3.517767987985906e-05,
"loss": 0.2543,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21013514697551727,
"step": 1415,
"valid_targets_mean": 7112.9,
"valid_targets_min": 958
},
{
"epoch": 2.1321321321321323,
"grad_norm": 0.6042469303834141,
"learning_rate": 3.5128803954217516e-05,
"loss": 0.245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24615558981895447,
"step": 1420,
"valid_targets_mean": 3546.8,
"valid_targets_min": 647
},
{
"epoch": 2.1396396396396398,
"grad_norm": 0.517598650535331,
"learning_rate": 3.507971590940972e-05,
"loss": 0.2361,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2518162727355957,
"step": 1425,
"valid_targets_mean": 4095.2,
"valid_targets_min": 700
},
{
"epoch": 2.1471471471471473,
"grad_norm": 0.5314103976572915,
"learning_rate": 3.503041643369332e-05,
"loss": 0.2657,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29391518235206604,
"step": 1430,
"valid_targets_mean": 4662.9,
"valid_targets_min": 673
},
{
"epoch": 2.1546546546546548,
"grad_norm": 0.7994874645886633,
"learning_rate": 3.4980906218290425e-05,
"loss": 0.2778,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24668291211128235,
"step": 1435,
"valid_targets_mean": 4393.5,
"valid_targets_min": 639
},
{
"epoch": 2.1621621621621623,
"grad_norm": 0.5508650913511237,
"learning_rate": 3.493118595737789e-05,
"loss": 0.2655,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26784124970436096,
"step": 1440,
"valid_targets_mean": 3928.2,
"valid_targets_min": 482
},
{
"epoch": 2.16966966966967,
"grad_norm": 0.48256368285307105,
"learning_rate": 3.4881256348077606e-05,
"loss": 0.2493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2078143209218979,
"step": 1445,
"valid_targets_mean": 4895.9,
"valid_targets_min": 605
},
{
"epoch": 2.1771771771771773,
"grad_norm": 0.5518092824723564,
"learning_rate": 3.4831118090446695e-05,
"loss": 0.2614,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27934592962265015,
"step": 1450,
"valid_targets_mean": 4175.9,
"valid_targets_min": 557
},
{
"epoch": 2.184684684684685,
"grad_norm": 0.6510442042007786,
"learning_rate": 3.478077188746774e-05,
"loss": 0.2825,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25130707025527954,
"step": 1455,
"valid_targets_mean": 2940.2,
"valid_targets_min": 746
},
{
"epoch": 2.1921921921921923,
"grad_norm": 0.6653821572090174,
"learning_rate": 3.473021844503885e-05,
"loss": 0.2915,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29144030809402466,
"step": 1460,
"valid_targets_mean": 3176.5,
"valid_targets_min": 466
},
{
"epoch": 2.1996996996997,
"grad_norm": 0.5835363387672817,
"learning_rate": 3.4679458471963876e-05,
"loss": 0.2609,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2668296694755554,
"step": 1465,
"valid_targets_mean": 3661.9,
"valid_targets_min": 657
},
{
"epoch": 2.2072072072072073,
"grad_norm": 0.473510630048058,
"learning_rate": 3.462849267994237e-05,
"loss": 0.2391,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2349366545677185,
"step": 1470,
"valid_targets_mean": 4610.1,
"valid_targets_min": 583
},
{
"epoch": 2.214714714714715,
"grad_norm": 0.5034796149297331,
"learning_rate": 3.457732178355966e-05,
"loss": 0.2786,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22843249142169952,
"step": 1475,
"valid_targets_mean": 4560.3,
"valid_targets_min": 870
},
{
"epoch": 2.2222222222222223,
"grad_norm": 0.6628701647407635,
"learning_rate": 3.4525946500276815e-05,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33600878715515137,
"step": 1480,
"valid_targets_mean": 4715.0,
"valid_targets_min": 409
},
{
"epoch": 2.22972972972973,
"grad_norm": 0.4438069409661387,
"learning_rate": 3.447436755042059e-05,
"loss": 0.2579,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23582454025745392,
"step": 1485,
"valid_targets_mean": 6454.2,
"valid_targets_min": 720
},
{
"epoch": 2.2372372372372373,
"grad_norm": 0.5589297614395898,
"learning_rate": 3.442258565717333e-05,
"loss": 0.2906,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3400152325630188,
"step": 1490,
"valid_targets_mean": 5422.4,
"valid_targets_min": 928
},
{
"epoch": 2.244744744744745,
"grad_norm": 0.5331121771902878,
"learning_rate": 3.437060154656281e-05,
"loss": 0.2911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31767523288726807,
"step": 1495,
"valid_targets_mean": 4458.2,
"valid_targets_min": 291
},
{
"epoch": 2.2522522522522523,
"grad_norm": 0.40712934057436334,
"learning_rate": 3.4318415947452085e-05,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28288692235946655,
"step": 1500,
"valid_targets_mean": 6532.0,
"valid_targets_min": 648
},
{
"epoch": 2.25975975975976,
"grad_norm": 0.45673386040732317,
"learning_rate": 3.4266029591529246e-05,
"loss": 0.2864,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2521343529224396,
"step": 1505,
"valid_targets_mean": 5607.8,
"valid_targets_min": 725
},
{
"epoch": 2.2672672672672673,
"grad_norm": 0.6013211253935284,
"learning_rate": 3.421344321329719e-05,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28024786710739136,
"step": 1510,
"valid_targets_mean": 3546.8,
"valid_targets_min": 515
},
{
"epoch": 2.274774774774775,
"grad_norm": 0.9210774515682121,
"learning_rate": 3.4160657550063286e-05,
"loss": 0.262,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2434246838092804,
"step": 1515,
"valid_targets_mean": 3957.6,
"valid_targets_min": 444
},
{
"epoch": 2.2822822822822824,
"grad_norm": 0.5034622925230656,
"learning_rate": 3.410767334192905e-05,
"loss": 0.2519,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2538553476333618,
"step": 1520,
"valid_targets_mean": 4692.2,
"valid_targets_min": 605
},
{
"epoch": 2.28978978978979,
"grad_norm": 0.6140827528489169,
"learning_rate": 3.40544913317798e-05,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2580946087837219,
"step": 1525,
"valid_targets_mean": 3429.3,
"valid_targets_min": 549
},
{
"epoch": 2.2972972972972974,
"grad_norm": 0.4522744249612033,
"learning_rate": 3.400111226527417e-05,
"loss": 0.2326,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22649413347244263,
"step": 1530,
"valid_targets_mean": 5068.2,
"valid_targets_min": 731
},
{
"epoch": 2.304804804804805,
"grad_norm": 0.49640935192095975,
"learning_rate": 3.3947536890833744e-05,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2515903115272522,
"step": 1535,
"valid_targets_mean": 4226.1,
"valid_targets_min": 726
},
{
"epoch": 2.3123123123123124,
"grad_norm": 1.016722378855143,
"learning_rate": 3.389376595963248e-05,
"loss": 0.2882,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.40263426303863525,
"step": 1540,
"valid_targets_mean": 3808.3,
"valid_targets_min": 756
},
{
"epoch": 2.31981981981982,
"grad_norm": 0.520047683970159,
"learning_rate": 3.3839800225586233e-05,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24709469079971313,
"step": 1545,
"valid_targets_mean": 4321.6,
"valid_targets_min": 663
},
{
"epoch": 2.3273273273273274,
"grad_norm": 0.4955591390887456,
"learning_rate": 3.378564044534216e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24357634782791138,
"step": 1550,
"valid_targets_mean": 4470.6,
"valid_targets_min": 670
},
{
"epoch": 2.334834834834835,
"grad_norm": 0.5304638752162832,
"learning_rate": 3.373128737826812e-05,
"loss": 0.2625,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27869170904159546,
"step": 1555,
"valid_targets_mean": 3793.8,
"valid_targets_min": 252
},
{
"epoch": 2.3423423423423424,
"grad_norm": 0.6052044405674071,
"learning_rate": 3.367674178644201e-05,
"loss": 0.2578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2955855429172516,
"step": 1560,
"valid_targets_mean": 3434.8,
"valid_targets_min": 662
},
{
"epoch": 2.34984984984985,
"grad_norm": 0.45641925043102494,
"learning_rate": 3.362200443464112e-05,
"loss": 0.2572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25648972392082214,
"step": 1565,
"valid_targets_mean": 5664.2,
"valid_targets_min": 487
},
{
"epoch": 2.3573573573573574,
"grad_norm": 0.4104470454624804,
"learning_rate": 3.356707609033136e-05,
"loss": 0.2382,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1871146857738495,
"step": 1570,
"valid_targets_mean": 5469.4,
"valid_targets_min": 650
},
{
"epoch": 2.364864864864865,
"grad_norm": 0.5305663319530391,
"learning_rate": 3.351195752365654e-05,
"loss": 0.2546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20778313279151917,
"step": 1575,
"valid_targets_mean": 3653.4,
"valid_targets_min": 548
},
{
"epoch": 2.3723723723723724,
"grad_norm": 0.952177731638365,
"learning_rate": 3.3456649507427537e-05,
"loss": 0.2785,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30603039264678955,
"step": 1580,
"valid_targets_mean": 3391.8,
"valid_targets_min": 541
},
{
"epoch": 2.37987987987988,
"grad_norm": 0.625558644174225,
"learning_rate": 3.340115281711149e-05,
"loss": 0.2578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2915250360965729,
"step": 1585,
"valid_targets_mean": 3354.9,
"valid_targets_min": 376
},
{
"epoch": 2.3873873873873874,
"grad_norm": 0.4383965531441897,
"learning_rate": 3.3345468230820924e-05,
"loss": 0.2545,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20519056916236877,
"step": 1590,
"valid_targets_mean": 5249.9,
"valid_targets_min": 576
},
{
"epoch": 2.394894894894895,
"grad_norm": 0.7263449171228276,
"learning_rate": 3.32895965293028e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24948550760746002,
"step": 1595,
"valid_targets_mean": 3813.8,
"valid_targets_min": 700
},
{
"epoch": 2.4024024024024024,
"grad_norm": 0.7704936140888641,
"learning_rate": 3.323353849592764e-05,
"loss": 0.27,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3838420808315277,
"step": 1600,
"valid_targets_mean": 4764.8,
"valid_targets_min": 930
},
{
"epoch": 2.40990990990991,
"grad_norm": 0.5262208670623167,
"learning_rate": 3.317729491667848e-05,
"loss": 0.2854,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26990848779678345,
"step": 1605,
"valid_targets_mean": 4314.4,
"valid_targets_min": 728
},
{
"epoch": 2.4174174174174174,
"grad_norm": 0.4905094743952616,
"learning_rate": 3.3120866580139856e-05,
"loss": 0.2678,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24697014689445496,
"step": 1610,
"valid_targets_mean": 5779.1,
"valid_targets_min": 863
},
{
"epoch": 2.424924924924925,
"grad_norm": 0.5795672522700869,
"learning_rate": 3.306425427748681e-05,
"loss": 0.2753,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3122454881668091,
"step": 1615,
"valid_targets_mean": 4678.4,
"valid_targets_min": 597
},
{
"epoch": 2.4324324324324325,
"grad_norm": 0.5127623781647497,
"learning_rate": 3.3007458802473705e-05,
"loss": 0.2418,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2780628502368927,
"step": 1620,
"valid_targets_mean": 5270.1,
"valid_targets_min": 408
},
{
"epoch": 2.43993993993994,
"grad_norm": 0.6000042814068866,
"learning_rate": 3.2950480951423166e-05,
"loss": 0.2492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26539573073387146,
"step": 1625,
"valid_targets_mean": 2969.9,
"valid_targets_min": 292
},
{
"epoch": 2.4474474474474475,
"grad_norm": 0.5601820602459276,
"learning_rate": 3.289332152321489e-05,
"loss": 0.2744,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34554967284202576,
"step": 1630,
"valid_targets_mean": 4328.4,
"valid_targets_min": 570
},
{
"epoch": 2.454954954954955,
"grad_norm": 0.5017335839364364,
"learning_rate": 3.2835981319274436e-05,
"loss": 0.3016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31424376368522644,
"step": 1635,
"valid_targets_mean": 4981.0,
"valid_targets_min": 513
},
{
"epoch": 2.4624624624624625,
"grad_norm": 0.5989444157971933,
"learning_rate": 3.277846114356201e-05,
"loss": 0.2812,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29167452454566956,
"step": 1640,
"valid_targets_mean": 4280.9,
"valid_targets_min": 583
},
{
"epoch": 2.46996996996997,
"grad_norm": 0.4818252524686284,
"learning_rate": 3.272076180256117e-05,
"loss": 0.2503,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2451312243938446,
"step": 1645,
"valid_targets_mean": 5266.5,
"valid_targets_min": 456
},
{
"epoch": 2.4774774774774775,
"grad_norm": 0.5474083922971454,
"learning_rate": 3.2662884105267545e-05,
"loss": 0.2802,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28529974818229675,
"step": 1650,
"valid_targets_mean": 4656.7,
"valid_targets_min": 323
},
{
"epoch": 2.484984984984985,
"grad_norm": 0.3927761927981878,
"learning_rate": 3.260482886317745e-05,
"loss": 0.2586,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2354969084262848,
"step": 1655,
"valid_targets_mean": 6819.5,
"valid_targets_min": 769
},
{
"epoch": 2.4924924924924925,
"grad_norm": 0.5095139881585496,
"learning_rate": 3.254659689027656e-05,
"loss": 0.2822,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25443506240844727,
"step": 1660,
"valid_targets_mean": 4691.8,
"valid_targets_min": 754
},
{
"epoch": 2.5,
"grad_norm": 0.48122470806496775,
"learning_rate": 3.2488189003028456e-05,
"loss": 0.2512,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25341033935546875,
"step": 1665,
"valid_targets_mean": 5473.4,
"valid_targets_min": 667
},
{
"epoch": 2.5075075075075075,
"grad_norm": 0.535101793490416,
"learning_rate": 3.24296060203632e-05,
"loss": 0.2725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29341810941696167,
"step": 1670,
"valid_targets_mean": 4545.0,
"valid_targets_min": 727
},
{
"epoch": 2.515015015015015,
"grad_norm": 0.5407510878775967,
"learning_rate": 3.2370848763665854e-05,
"loss": 0.2631,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.298563152551651,
"step": 1675,
"valid_targets_mean": 4343.1,
"valid_targets_min": 487
},
{
"epoch": 2.5225225225225225,
"grad_norm": 0.7328443730397846,
"learning_rate": 3.231191805676494e-05,
"loss": 0.2687,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24576136469841003,
"step": 1680,
"valid_targets_mean": 4246.7,
"valid_targets_min": 381
},
{
"epoch": 2.53003003003003,
"grad_norm": 0.4953608748768144,
"learning_rate": 3.22528147259209e-05,
"loss": 0.2894,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3240085542201996,
"step": 1685,
"valid_targets_mean": 5762.2,
"valid_targets_min": 734
},
{
"epoch": 2.5375375375375375,
"grad_norm": 0.6439990940182198,
"learning_rate": 3.2193539599814546e-05,
"loss": 0.2563,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2948322892189026,
"step": 1690,
"valid_targets_mean": 3211.7,
"valid_targets_min": 785
},
{
"epoch": 2.545045045045045,
"grad_norm": 0.5649997969615153,
"learning_rate": 3.213409350953539e-05,
"loss": 0.2763,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2883799374103546,
"step": 1695,
"valid_targets_mean": 3863.2,
"valid_targets_min": 655
},
{
"epoch": 2.5525525525525525,
"grad_norm": 0.6654178682497041,
"learning_rate": 3.207447728857e-05,
"loss": 0.2697,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2643584907054901,
"step": 1700,
"valid_targets_mean": 3119.7,
"valid_targets_min": 557
},
{
"epoch": 2.56006006006006,
"grad_norm": 0.6865303086852059,
"learning_rate": 3.201469177279036e-05,
"loss": 0.2489,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27196943759918213,
"step": 1705,
"valid_targets_mean": 2167.2,
"valid_targets_min": 570
},
{
"epoch": 2.5675675675675675,
"grad_norm": 0.5565838052443746,
"learning_rate": 3.195473780044208e-05,
"loss": 0.2622,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2557700276374817,
"step": 1710,
"valid_targets_mean": 3659.3,
"valid_targets_min": 446
},
{
"epoch": 2.575075075075075,
"grad_norm": 0.5197442676457078,
"learning_rate": 3.189461621213271e-05,
"loss": 0.2617,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2678113579750061,
"step": 1715,
"valid_targets_mean": 4663.4,
"valid_targets_min": 609
},
{
"epoch": 2.5825825825825826,
"grad_norm": 0.5166944613990696,
"learning_rate": 3.18343278508199e-05,
"loss": 0.2584,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24757936596870422,
"step": 1720,
"valid_targets_mean": 4511.7,
"valid_targets_min": 460
},
{
"epoch": 2.59009009009009,
"grad_norm": 0.4761985812024692,
"learning_rate": 3.177387356179962e-05,
"loss": 0.2292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20293045043945312,
"step": 1725,
"valid_targets_mean": 4317.4,
"valid_targets_min": 477
},
{
"epoch": 2.5975975975975976,
"grad_norm": 0.5529954148422914,
"learning_rate": 3.1713254192694284e-05,
"loss": 0.2407,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24401406943798065,
"step": 1730,
"valid_targets_mean": 3834.1,
"valid_targets_min": 610
},
{
"epoch": 2.605105105105105,
"grad_norm": 0.4955364019562657,
"learning_rate": 3.1652470593440885e-05,
"loss": 0.2746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22095078229904175,
"step": 1735,
"valid_targets_mean": 5501.8,
"valid_targets_min": 681
},
{
"epoch": 2.6126126126126126,
"grad_norm": 0.45641687982187235,
"learning_rate": 3.1591523616279055e-05,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20338258147239685,
"step": 1740,
"valid_targets_mean": 4772.7,
"valid_targets_min": 700
},
{
"epoch": 2.62012012012012,
"grad_norm": 0.6226280659286444,
"learning_rate": 3.153041411573914e-05,
"loss": 0.2552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3405519723892212,
"step": 1745,
"valid_targets_mean": 4217.1,
"valid_targets_min": 518
},
{
"epoch": 2.6276276276276276,
"grad_norm": 0.6357283334230661,
"learning_rate": 3.1469142948630194e-05,
"loss": 0.2552,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27663713693618774,
"step": 1750,
"valid_targets_mean": 3277.6,
"valid_targets_min": 416
},
{
"epoch": 2.635135135135135,
"grad_norm": 0.5459413685496709,
"learning_rate": 3.140771097402798e-05,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.257800430059433,
"step": 1755,
"valid_targets_mean": 4285.2,
"valid_targets_min": 485
},
{
"epoch": 2.6426426426426426,
"grad_norm": 0.5121436251283435,
"learning_rate": 3.134611905326295e-05,
"loss": 0.2374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2595219910144806,
"step": 1760,
"valid_targets_mean": 4998.1,
"valid_targets_min": 900
},
{
"epoch": 2.65015015015015,
"grad_norm": 0.5290785372037086,
"learning_rate": 3.12843680499081e-05,
"loss": 0.2823,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.380996972322464,
"step": 1765,
"valid_targets_mean": 5265.2,
"valid_targets_min": 668
},
{
"epoch": 2.6576576576576576,
"grad_norm": 0.7048181374115327,
"learning_rate": 3.122245882976693e-05,
"loss": 0.2989,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2908703684806824,
"step": 1770,
"valid_targets_mean": 2736.2,
"valid_targets_min": 909
},
{
"epoch": 2.665165165165165,
"grad_norm": 0.47236135012538977,
"learning_rate": 3.116039226086128e-05,
"loss": 0.2746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30878859758377075,
"step": 1775,
"valid_targets_mean": 5567.8,
"valid_targets_min": 635
},
{
"epoch": 2.6726726726726726,
"grad_norm": 0.5445102500932314,
"learning_rate": 3.1098169213419155e-05,
"loss": 0.2366,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2582714259624481,
"step": 1780,
"valid_targets_mean": 3773.7,
"valid_targets_min": 376
},
{
"epoch": 2.68018018018018,
"grad_norm": 0.4265129001988632,
"learning_rate": 3.103579055986251e-05,
"loss": 0.2629,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2143097072839737,
"step": 1785,
"valid_targets_mean": 5390.5,
"valid_targets_min": 704
},
{
"epoch": 2.6876876876876876,
"grad_norm": 0.5312743639290497,
"learning_rate": 3.0973257174795074e-05,
"loss": 0.2788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3563080430030823,
"step": 1790,
"valid_targets_mean": 4896.1,
"valid_targets_min": 666
},
{
"epoch": 2.695195195195195,
"grad_norm": 0.46913349560934214,
"learning_rate": 3.0910569934990004e-05,
"loss": 0.2995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22366014122962952,
"step": 1795,
"valid_targets_mean": 5595.9,
"valid_targets_min": 764
},
{
"epoch": 2.7027027027027026,
"grad_norm": 0.4542845059111592,
"learning_rate": 3.084772971937766e-05,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.238237202167511,
"step": 1800,
"valid_targets_mean": 4653.6,
"valid_targets_min": 745
},
{
"epoch": 2.71021021021021,
"grad_norm": 0.5378230783334604,
"learning_rate": 3.078473740903325e-05,
"loss": 0.2585,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30502867698669434,
"step": 1805,
"valid_targets_mean": 4299.5,
"valid_targets_min": 755
},
{
"epoch": 2.7177177177177176,
"grad_norm": 0.5591431243642122,
"learning_rate": 3.07215938871645e-05,
"loss": 0.2414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.232755646109581,
"step": 1810,
"valid_targets_mean": 3461.2,
"valid_targets_min": 744
},
{
"epoch": 2.725225225225225,
"grad_norm": 0.6091187770028943,
"learning_rate": 3.0658300039099235e-05,
"loss": 0.2612,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2591820955276489,
"step": 1815,
"valid_targets_mean": 3384.4,
"valid_targets_min": 685
},
{
"epoch": 2.7327327327327327,
"grad_norm": 0.6447111768897391,
"learning_rate": 3.0594856752272987e-05,
"loss": 0.2546,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25599902868270874,
"step": 1820,
"valid_targets_mean": 3581.4,
"valid_targets_min": 657
},
{
"epoch": 2.74024024024024,
"grad_norm": 0.44894238539094306,
"learning_rate": 3.053126491621657e-05,
"loss": 0.2745,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2371259331703186,
"step": 1825,
"valid_targets_mean": 4889.4,
"valid_targets_min": 511
},
{
"epoch": 2.7477477477477477,
"grad_norm": 0.5214275290965238,
"learning_rate": 3.046752542254357e-05,
"loss": 0.2397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22412139177322388,
"step": 1830,
"valid_targets_mean": 3863.1,
"valid_targets_min": 670
},
{
"epoch": 2.755255255255255,
"grad_norm": 0.5573497856924043,
"learning_rate": 3.0403639164937865e-05,
"loss": 0.2636,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24575021862983704,
"step": 1835,
"valid_targets_mean": 3198.3,
"valid_targets_min": 461
},
{
"epoch": 2.7627627627627627,
"grad_norm": 0.47880699639373114,
"learning_rate": 3.0339607039141107e-05,
"loss": 0.2303,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25173407793045044,
"step": 1840,
"valid_targets_mean": 4396.7,
"valid_targets_min": 277
},
{
"epoch": 2.77027027027027,
"grad_norm": 0.5293345660103224,
"learning_rate": 3.027542994294013e-05,
"loss": 0.2464,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24035535752773285,
"step": 1845,
"valid_targets_mean": 3506.6,
"valid_targets_min": 562
},
{
"epoch": 2.7777777777777777,
"grad_norm": 0.5030154656400301,
"learning_rate": 3.0211108776154394e-05,
"loss": 0.27,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24871063232421875,
"step": 1850,
"valid_targets_mean": 4511.1,
"valid_targets_min": 654
},
{
"epoch": 2.785285285285285,
"grad_norm": 0.4172382663816932,
"learning_rate": 3.0146644440623355e-05,
"loss": 0.2676,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22848474979400635,
"step": 1855,
"valid_targets_mean": 5617.8,
"valid_targets_min": 761
},
{
"epoch": 2.7927927927927927,
"grad_norm": 0.6045475468870822,
"learning_rate": 3.0082037840193812e-05,
"loss": 0.2434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26820242404937744,
"step": 1860,
"valid_targets_mean": 3179.9,
"valid_targets_min": 612
},
{
"epoch": 2.8003003003003,
"grad_norm": 0.5418178665003754,
"learning_rate": 3.001728988070724e-05,
"loss": 0.3025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3145066499710083,
"step": 1865,
"valid_targets_mean": 4837.1,
"valid_targets_min": 709
},
{
"epoch": 2.8078078078078077,
"grad_norm": 0.5134558903404736,
"learning_rate": 2.995240146998712e-05,
"loss": 0.2523,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21890783309936523,
"step": 1870,
"valid_targets_mean": 4246.1,
"valid_targets_min": 536
},
{
"epoch": 2.815315315315315,
"grad_norm": 0.583571397927643,
"learning_rate": 2.9887373517826153e-05,
"loss": 0.2692,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27330344915390015,
"step": 1875,
"valid_targets_mean": 3632.4,
"valid_targets_min": 630
},
{
"epoch": 2.8228228228228227,
"grad_norm": 0.47961940508462947,
"learning_rate": 2.9822206935973548e-05,
"loss": 0.2635,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2063194215297699,
"step": 1880,
"valid_targets_mean": 4621.7,
"valid_targets_min": 492
},
{
"epoch": 2.83033033033033,
"grad_norm": 0.5920736352732671,
"learning_rate": 2.9756902638122213e-05,
"loss": 0.2319,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23864233493804932,
"step": 1885,
"valid_targets_mean": 4123.9,
"valid_targets_min": 629
},
{
"epoch": 2.8378378378378377,
"grad_norm": 0.5565272788823533,
"learning_rate": 2.969146153989598e-05,
"loss": 0.2509,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22772765159606934,
"step": 1890,
"valid_targets_mean": 3277.6,
"valid_targets_min": 713
},
{
"epoch": 2.8453453453453452,
"grad_norm": 0.6239789579469722,
"learning_rate": 2.9625884558836716e-05,
"loss": 0.2457,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26187804341316223,
"step": 1895,
"valid_targets_mean": 2902.2,
"valid_targets_min": 503
},
{
"epoch": 2.8528528528528527,
"grad_norm": 0.5680461426104465,
"learning_rate": 2.95601726143915e-05,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3167528510093689,
"step": 1900,
"valid_targets_mean": 4054.1,
"valid_targets_min": 697
},
{
"epoch": 2.8603603603603602,
"grad_norm": 0.45456838507650504,
"learning_rate": 2.949432662789971e-05,
"loss": 0.2483,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29696983098983765,
"step": 1905,
"valid_targets_mean": 6072.6,
"valid_targets_min": 598
},
{
"epoch": 2.8678678678678677,
"grad_norm": 0.496183629571747,
"learning_rate": 2.942834752258012e-05,
"loss": 0.2392,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21913406252861023,
"step": 1910,
"valid_targets_mean": 4109.5,
"valid_targets_min": 879
},
{
"epoch": 2.8753753753753752,
"grad_norm": 0.5334630488557025,
"learning_rate": 2.936223622351794e-05,
"loss": 0.2325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31040453910827637,
"step": 1915,
"valid_targets_mean": 4864.2,
"valid_targets_min": 328
},
{
"epoch": 2.8828828828828827,
"grad_norm": 0.5005858977972606,
"learning_rate": 2.929599365765185e-05,
"loss": 0.2493,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.31291884183883667,
"step": 1920,
"valid_targets_mean": 5317.4,
"valid_targets_min": 547
},
{
"epoch": 2.8903903903903903,
"grad_norm": 0.4974443542961955,
"learning_rate": 2.9229620753761013e-05,
"loss": 0.2473,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.301303505897522,
"step": 1925,
"valid_targets_mean": 4499.8,
"valid_targets_min": 625
},
{
"epoch": 2.8978978978978978,
"grad_norm": 0.5691190427521686,
"learning_rate": 2.9163118442452046e-05,
"loss": 0.2449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27089810371398926,
"step": 1930,
"valid_targets_mean": 4097.7,
"valid_targets_min": 667
},
{
"epoch": 2.9054054054054053,
"grad_norm": 0.4198119186033015,
"learning_rate": 2.9096487656145968e-05,
"loss": 0.2596,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24759484827518463,
"step": 1935,
"valid_targets_mean": 6335.4,
"valid_targets_min": 564
},
{
"epoch": 2.9129129129129128,
"grad_norm": 0.5531720093912547,
"learning_rate": 2.9029729329065134e-05,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23836839199066162,
"step": 1940,
"valid_targets_mean": 3271.4,
"valid_targets_min": 510
},
{
"epoch": 2.9204204204204203,
"grad_norm": 0.4289864597777698,
"learning_rate": 2.896284439722013e-05,
"loss": 0.2767,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2916072607040405,
"step": 1945,
"valid_targets_mean": 6052.6,
"valid_targets_min": 466
},
{
"epoch": 2.9279279279279278,
"grad_norm": 0.47685929908340674,
"learning_rate": 2.8895833798396657e-05,
"loss": 0.2414,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22440025210380554,
"step": 1950,
"valid_targets_mean": 4654.8,
"valid_targets_min": 550
},
{
"epoch": 2.9354354354354353,
"grad_norm": 0.4511746235008368,
"learning_rate": 2.882869847214237e-05,
"loss": 0.2683,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2768084406852722,
"step": 1955,
"valid_targets_mean": 6411.6,
"valid_targets_min": 648
},
{
"epoch": 2.942942942942943,
"grad_norm": 0.3897834130570682,
"learning_rate": 2.876143935975373e-05,
"loss": 0.2327,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23787030577659607,
"step": 1960,
"valid_targets_mean": 6063.3,
"valid_targets_min": 668
},
{
"epoch": 2.9504504504504503,
"grad_norm": 0.5645744222530638,
"learning_rate": 2.8694057404262757e-05,
"loss": 0.2618,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26880699396133423,
"step": 1965,
"valid_targets_mean": 3741.8,
"valid_targets_min": 651
},
{
"epoch": 2.957957957957958,
"grad_norm": 0.48669690646418146,
"learning_rate": 2.862655355042387e-05,
"loss": 0.261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33517420291900635,
"step": 1970,
"valid_targets_mean": 5469.8,
"valid_targets_min": 723
},
{
"epoch": 2.9654654654654653,
"grad_norm": 0.4988811225771945,
"learning_rate": 2.85589287447006e-05,
"loss": 0.2573,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2532571256160736,
"step": 1975,
"valid_targets_mean": 4500.7,
"valid_targets_min": 824
},
{
"epoch": 2.972972972972973,
"grad_norm": 0.5067859361295777,
"learning_rate": 2.849118393525233e-05,
"loss": 0.2958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22295460104942322,
"step": 1980,
"valid_targets_mean": 4019.2,
"valid_targets_min": 439
},
{
"epoch": 2.9804804804804803,
"grad_norm": 0.5614437078904748,
"learning_rate": 2.8423320071920986e-05,
"loss": 0.2496,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25288334488868713,
"step": 1985,
"valid_targets_mean": 3232.5,
"valid_targets_min": 790
},
{
"epoch": 2.987987987987988,
"grad_norm": 0.4074367928471507,
"learning_rate": 2.835533810621777e-05,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22124746441841125,
"step": 1990,
"valid_targets_mean": 6511.8,
"valid_targets_min": 610
},
{
"epoch": 2.9954954954954953,
"grad_norm": 0.4746388334736856,
"learning_rate": 2.8287238991309746e-05,
"loss": 0.2591,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22991371154785156,
"step": 1995,
"valid_targets_mean": 4459.8,
"valid_targets_min": 742
},
{
"epoch": 3.003003003003003,
"grad_norm": 0.5433525185386173,
"learning_rate": 2.8219023682006533e-05,
"loss": 0.261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2538215219974518,
"step": 2000,
"valid_targets_mean": 3868.6,
"valid_targets_min": 593
},
{
"epoch": 3.0105105105105103,
"grad_norm": 0.6522092709294501,
"learning_rate": 2.8150693134746895e-05,
"loss": 0.2505,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25473958253860474,
"step": 2005,
"valid_targets_mean": 4023.8,
"valid_targets_min": 939
},
{
"epoch": 3.018018018018018,
"grad_norm": 0.4893307325525604,
"learning_rate": 2.8082248307585332e-05,
"loss": 0.2284,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20237843692302704,
"step": 2010,
"valid_targets_mean": 4555.2,
"valid_targets_min": 590
},
{
"epoch": 3.0255255255255253,
"grad_norm": 0.4667369885254396,
"learning_rate": 2.801369016017865e-05,
"loss": 0.2271,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18705838918685913,
"step": 2015,
"valid_targets_mean": 4288.2,
"valid_targets_min": 690
},
{
"epoch": 3.033033033033033,
"grad_norm": 0.49033218061993816,
"learning_rate": 2.7945019653772504e-05,
"loss": 0.2433,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2408279925584793,
"step": 2020,
"valid_targets_mean": 5262.1,
"valid_targets_min": 515
},
{
"epoch": 3.0405405405405403,
"grad_norm": 0.5391107334148109,
"learning_rate": 2.7876237751187917e-05,
"loss": 0.2436,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21394947171211243,
"step": 2025,
"valid_targets_mean": 3897.1,
"valid_targets_min": 1733
},
{
"epoch": 3.048048048048048,
"grad_norm": 0.6193116901994394,
"learning_rate": 2.7807345416807793e-05,
"loss": 0.2442,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23730601370334625,
"step": 2030,
"valid_targets_mean": 3262.4,
"valid_targets_min": 439
},
{
"epoch": 3.0555555555555554,
"grad_norm": 0.5319064047511843,
"learning_rate": 2.773834361656339e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2560746669769287,
"step": 2035,
"valid_targets_mean": 4626.2,
"valid_targets_min": 550
},
{
"epoch": 3.063063063063063,
"grad_norm": 0.7633521135620636,
"learning_rate": 2.766923331792075e-05,
"loss": 0.2507,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30914023518562317,
"step": 2040,
"valid_targets_mean": 3140.8,
"valid_targets_min": 595
},
{
"epoch": 3.0705705705705704,
"grad_norm": 1.0068010745411222,
"learning_rate": 2.7600015489867188e-05,
"loss": 0.2413,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2271232008934021,
"step": 2045,
"valid_targets_mean": 4060.6,
"valid_targets_min": 667
},
{
"epoch": 3.078078078078078,
"grad_norm": 0.5451000708994922,
"learning_rate": 2.753069110289766e-05,
"loss": 0.2459,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22742116451263428,
"step": 2050,
"valid_targets_mean": 3681.6,
"valid_targets_min": 668
},
{
"epoch": 3.0855855855855854,
"grad_norm": 0.5547733055241225,
"learning_rate": 2.7461261129001174e-05,
"loss": 0.2353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24244071543216705,
"step": 2055,
"valid_targets_mean": 3975.5,
"valid_targets_min": 495
},
{
"epoch": 3.093093093093093,
"grad_norm": 0.42158312641460743,
"learning_rate": 2.7391726541647163e-05,
"loss": 0.2154,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1724860966205597,
"step": 2060,
"valid_targets_mean": 5298.3,
"valid_targets_min": 423
},
{
"epoch": 3.1006006006006004,
"grad_norm": 0.5499035304566007,
"learning_rate": 2.7322088315771834e-05,
"loss": 0.2427,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24446254968643188,
"step": 2065,
"valid_targets_mean": 3607.4,
"valid_targets_min": 478
},
{
"epoch": 3.108108108108108,
"grad_norm": 0.5590055107325951,
"learning_rate": 2.725234742776448e-05,
"loss": 0.2278,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23849673569202423,
"step": 2070,
"valid_targets_mean": 5030.8,
"valid_targets_min": 659
},
{
"epoch": 3.1156156156156154,
"grad_norm": 0.478630517596832,
"learning_rate": 2.7182504855453834e-05,
"loss": 0.2499,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20381265878677368,
"step": 2075,
"valid_targets_mean": 4702.2,
"valid_targets_min": 865
},
{
"epoch": 3.123123123123123,
"grad_norm": 0.5451665017950299,
"learning_rate": 2.7112561578094327e-05,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2420223355293274,
"step": 2080,
"valid_targets_mean": 5865.1,
"valid_targets_min": 611
},
{
"epoch": 3.1306306306306304,
"grad_norm": 0.5244203768707708,
"learning_rate": 2.704251857635234e-05,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20124025642871857,
"step": 2085,
"valid_targets_mean": 3856.1,
"valid_targets_min": 622
},
{
"epoch": 3.138138138138138,
"grad_norm": 0.553596247360053,
"learning_rate": 2.69723768322925e-05,
"loss": 0.2429,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2544230818748474,
"step": 2090,
"valid_targets_mean": 3771.1,
"valid_targets_min": 479
},
{
"epoch": 3.1456456456456454,
"grad_norm": 0.5826774718951724,
"learning_rate": 2.6902137329363892e-05,
"loss": 0.2476,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27420639991760254,
"step": 2095,
"valid_targets_mean": 3996.2,
"valid_targets_min": 703
},
{
"epoch": 3.153153153153153,
"grad_norm": 0.6143348318690984,
"learning_rate": 2.683180105238625e-05,
"loss": 0.2307,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2823088765144348,
"step": 2100,
"valid_targets_mean": 3603.2,
"valid_targets_min": 664
},
{
"epoch": 3.1606606606606604,
"grad_norm": 0.5590576178147459,
"learning_rate": 2.676136898753617e-05,
"loss": 0.2448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25955310463905334,
"step": 2105,
"valid_targets_mean": 3985.4,
"valid_targets_min": 773
},
{
"epoch": 3.1681681681681684,
"grad_norm": 0.596190398717275,
"learning_rate": 2.6690842122333286e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24386368691921234,
"step": 2110,
"valid_targets_mean": 3912.7,
"valid_targets_min": 728
},
{
"epoch": 3.175675675675676,
"grad_norm": 0.6071315295064825,
"learning_rate": 2.6620221445626416e-05,
"loss": 0.2096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23695698380470276,
"step": 2115,
"valid_targets_mean": 3008.4,
"valid_targets_min": 656
},
{
"epoch": 3.1831831831831834,
"grad_norm": 0.6533097039267628,
"learning_rate": 2.6549507947579685e-05,
"loss": 0.2575,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2619466185569763,
"step": 2120,
"valid_targets_mean": 5412.9,
"valid_targets_min": 491
},
{
"epoch": 3.190690690690691,
"grad_norm": 0.49336937759151656,
"learning_rate": 2.6478702619658672e-05,
"loss": 0.2538,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23457828164100647,
"step": 2125,
"valid_targets_mean": 4639.4,
"valid_targets_min": 456
},
{
"epoch": 3.1981981981981984,
"grad_norm": 0.48643384497808734,
"learning_rate": 2.6407806454616472e-05,
"loss": 0.2368,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18629509210586548,
"step": 2130,
"valid_targets_mean": 3978.7,
"valid_targets_min": 815
},
{
"epoch": 3.205705705705706,
"grad_norm": 0.7137473060732604,
"learning_rate": 2.633682044647982e-05,
"loss": 0.2492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34111836552619934,
"step": 2135,
"valid_targets_mean": 2986.7,
"valid_targets_min": 211
},
{
"epoch": 3.2132132132132134,
"grad_norm": 0.4960650096175783,
"learning_rate": 2.626574559053512e-05,
"loss": 0.254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2693920433521271,
"step": 2140,
"valid_targets_mean": 6290.2,
"valid_targets_min": 728
},
{
"epoch": 3.220720720720721,
"grad_norm": 0.543711754415262,
"learning_rate": 2.619458288331449e-05,
"loss": 0.2648,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.34854060411453247,
"step": 2145,
"valid_targets_mean": 4955.6,
"valid_targets_min": 273
},
{
"epoch": 3.2282282282282284,
"grad_norm": 0.4118913840003615,
"learning_rate": 2.6123333322581806e-05,
"loss": 0.2272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22846825420856476,
"step": 2150,
"valid_targets_mean": 6945.4,
"valid_targets_min": 620
},
{
"epoch": 3.235735735735736,
"grad_norm": 0.6226838119580127,
"learning_rate": 2.6051997907318724e-05,
"loss": 0.2492,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2525981664657593,
"step": 2155,
"valid_targets_mean": 3692.9,
"valid_targets_min": 649
},
{
"epoch": 3.2432432432432434,
"grad_norm": 0.4814778903119386,
"learning_rate": 2.5980577637710632e-05,
"loss": 0.2397,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21874025464057922,
"step": 2160,
"valid_targets_mean": 5269.8,
"valid_targets_min": 814
},
{
"epoch": 3.250750750750751,
"grad_norm": 0.48643926272296106,
"learning_rate": 2.5909073515132667e-05,
"loss": 0.2508,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23266538977622986,
"step": 2165,
"valid_targets_mean": 4732.6,
"valid_targets_min": 898
},
{
"epoch": 3.2582582582582584,
"grad_norm": 0.5108891449221944,
"learning_rate": 2.5837486542135648e-05,
"loss": 0.2329,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2183685451745987,
"step": 2170,
"valid_targets_mean": 4184.6,
"valid_targets_min": 659
},
{
"epoch": 3.265765765765766,
"grad_norm": 0.5625875087588166,
"learning_rate": 2.576581772243204e-05,
"loss": 0.2766,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21907004714012146,
"step": 2175,
"valid_targets_mean": 5702.3,
"valid_targets_min": 447
},
{
"epoch": 3.2732732732732734,
"grad_norm": 0.44524330986567173,
"learning_rate": 2.5694068060881856e-05,
"loss": 0.2347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2379521131515503,
"step": 2180,
"valid_targets_mean": 5613.1,
"valid_targets_min": 444
},
{
"epoch": 3.280780780780781,
"grad_norm": 0.41557044227218803,
"learning_rate": 2.5622238563478603e-05,
"loss": 0.2161,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1911526620388031,
"step": 2185,
"valid_targets_mean": 6414.1,
"valid_targets_min": 926
},
{
"epoch": 3.2882882882882885,
"grad_norm": 0.6461866697440014,
"learning_rate": 2.555033023733514e-05,
"loss": 0.2227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2639209032058716,
"step": 2190,
"valid_targets_mean": 3629.4,
"valid_targets_min": 580
},
{
"epoch": 3.295795795795796,
"grad_norm": 0.5159050633898964,
"learning_rate": 2.547834409066958e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27777135372161865,
"step": 2195,
"valid_targets_mean": 5053.3,
"valid_targets_min": 906
},
{
"epoch": 3.3033033033033035,
"grad_norm": 0.477902570867691,
"learning_rate": 2.540628113279116e-05,
"loss": 0.2412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3054026961326599,
"step": 2200,
"valid_targets_mean": 6047.9,
"valid_targets_min": 806
},
{
"epoch": 3.310810810810811,
"grad_norm": 0.45215264311766057,
"learning_rate": 2.5334142374086053e-05,
"loss": 0.2229,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22195221483707428,
"step": 2205,
"valid_targets_mean": 5648.2,
"valid_targets_min": 742
},
{
"epoch": 3.3183183183183185,
"grad_norm": 0.8158948988984059,
"learning_rate": 2.5261928826003246e-05,
"loss": 0.2694,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3665313720703125,
"step": 2210,
"valid_targets_mean": 4771.2,
"valid_targets_min": 663
},
{
"epoch": 3.325825825825826,
"grad_norm": 0.6202523003371706,
"learning_rate": 2.518964150104034e-05,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22199711203575134,
"step": 2215,
"valid_targets_mean": 2897.6,
"valid_targets_min": 698
},
{
"epoch": 3.3333333333333335,
"grad_norm": 0.6530333048449412,
"learning_rate": 2.511728141272934e-05,
"loss": 0.2304,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24529844522476196,
"step": 2220,
"valid_targets_mean": 3370.7,
"valid_targets_min": 503
},
{
"epoch": 3.340840840840841,
"grad_norm": 0.5905198582269967,
"learning_rate": 2.5044849575622458e-05,
"loss": 0.2272,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2153581976890564,
"step": 2225,
"valid_targets_mean": 4749.2,
"valid_targets_min": 668
},
{
"epoch": 3.3483483483483485,
"grad_norm": 0.4868966063934165,
"learning_rate": 2.4972347005277903e-05,
"loss": 0.2831,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2968922257423401,
"step": 2230,
"valid_targets_mean": 5965.1,
"valid_targets_min": 498
},
{
"epoch": 3.355855855855856,
"grad_norm": 0.8961039788278082,
"learning_rate": 2.489977471824561e-05,
"loss": 0.2348,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23392842710018158,
"step": 2235,
"valid_targets_mean": 3846.9,
"valid_targets_min": 368
},
{
"epoch": 3.3633633633633635,
"grad_norm": 0.6752840687920286,
"learning_rate": 2.4827133732053014e-05,
"loss": 0.2576,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25479578971862793,
"step": 2240,
"valid_targets_mean": 3281.4,
"valid_targets_min": 291
},
{
"epoch": 3.370870870870871,
"grad_norm": 0.5573523830693498,
"learning_rate": 2.475442506519077e-05,
"loss": 0.2353,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20670834183692932,
"step": 2245,
"valid_targets_mean": 3441.7,
"valid_targets_min": 637
},
{
"epoch": 3.3783783783783785,
"grad_norm": 0.47716647459061995,
"learning_rate": 2.468164973709847e-05,
"loss": 0.2249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21283169090747833,
"step": 2250,
"valid_targets_mean": 4464.2,
"valid_targets_min": 910
},
{
"epoch": 3.385885885885886,
"grad_norm": 0.5064998483360107,
"learning_rate": 2.4608808768150357e-05,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19695068895816803,
"step": 2255,
"valid_targets_mean": 3949.1,
"valid_targets_min": 738
},
{
"epoch": 3.3933933933933935,
"grad_norm": 0.5175599454597674,
"learning_rate": 2.4535903179641026e-05,
"loss": 0.2265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2480076104402542,
"step": 2260,
"valid_targets_mean": 5609.1,
"valid_targets_min": 1410
},
{
"epoch": 3.400900900900901,
"grad_norm": 0.42240678217071037,
"learning_rate": 2.4462933993771088e-05,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26719754934310913,
"step": 2265,
"valid_targets_mean": 6515.5,
"valid_targets_min": 726
},
{
"epoch": 3.4084084084084085,
"grad_norm": 0.506514863267876,
"learning_rate": 2.438990223363284e-05,
"loss": 0.2589,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25513604283332825,
"step": 2270,
"valid_targets_mean": 4471.0,
"valid_targets_min": 732
},
{
"epoch": 3.415915915915916,
"grad_norm": 0.5367632072440157,
"learning_rate": 2.4316808923195926e-05,
"loss": 0.2387,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22310830652713776,
"step": 2275,
"valid_targets_mean": 4361.2,
"valid_targets_min": 700
},
{
"epoch": 3.4234234234234235,
"grad_norm": 0.44852402801221397,
"learning_rate": 2.4243655087293e-05,
"loss": 0.2582,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26332229375839233,
"step": 2280,
"valid_targets_mean": 6653.6,
"valid_targets_min": 583
},
{
"epoch": 3.430930930930931,
"grad_norm": 0.48402583907149443,
"learning_rate": 2.4170441751605308e-05,
"loss": 0.2328,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24115243554115295,
"step": 2285,
"valid_targets_mean": 4474.8,
"valid_targets_min": 723
},
{
"epoch": 3.4384384384384385,
"grad_norm": 0.58593699094807,
"learning_rate": 2.4097169942648356e-05,
"loss": 0.2145,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16966642439365387,
"step": 2290,
"valid_targets_mean": 5481.7,
"valid_targets_min": 1177
},
{
"epoch": 3.445945945945946,
"grad_norm": 0.4710415176014163,
"learning_rate": 2.4023840687757476e-05,
"loss": 0.2432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20201632380485535,
"step": 2295,
"valid_targets_mean": 5250.4,
"valid_targets_min": 717
},
{
"epoch": 3.4534534534534536,
"grad_norm": 0.5084005135734221,
"learning_rate": 2.395045501507347e-05,
"loss": 0.2254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20893435180187225,
"step": 2300,
"valid_targets_mean": 4357.3,
"valid_targets_min": 489
},
{
"epoch": 3.460960960960961,
"grad_norm": 0.619899875868498,
"learning_rate": 2.387701395352815e-05,
"loss": 0.227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21758192777633667,
"step": 2305,
"valid_targets_mean": 2881.0,
"valid_targets_min": 578
},
{
"epoch": 3.4684684684684686,
"grad_norm": 0.48471567383203296,
"learning_rate": 2.380351853282992e-05,
"loss": 0.2445,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24553707242012024,
"step": 2310,
"valid_targets_mean": 5598.6,
"valid_targets_min": 552
},
{
"epoch": 3.475975975975976,
"grad_norm": 0.6056696323887422,
"learning_rate": 2.372996978344937e-05,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26694750785827637,
"step": 2315,
"valid_targets_mean": 3924.4,
"valid_targets_min": 523
},
{
"epoch": 3.4834834834834836,
"grad_norm": 0.601885827026815,
"learning_rate": 2.3656368736604786e-05,
"loss": 0.2568,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28267890214920044,
"step": 2320,
"valid_targets_mean": 3601.5,
"valid_targets_min": 724
},
{
"epoch": 3.490990990990991,
"grad_norm": 0.6254412393703039,
"learning_rate": 2.3582716424247728e-05,
"loss": 0.2711,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2540096044540405,
"step": 2325,
"valid_targets_mean": 2951.5,
"valid_targets_min": 537
},
{
"epoch": 3.4984984984984986,
"grad_norm": 0.5798449489473179,
"learning_rate": 2.3509013879048526e-05,
"loss": 0.2484,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30426591634750366,
"step": 2330,
"valid_targets_mean": 4265.3,
"valid_targets_min": 712
},
{
"epoch": 3.506006006006006,
"grad_norm": 0.4923122631477329,
"learning_rate": 2.3435262134381823e-05,
"loss": 0.2068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1547277569770813,
"step": 2335,
"valid_targets_mean": 4490.8,
"valid_targets_min": 620
},
{
"epoch": 3.5135135135135136,
"grad_norm": 0.49204973031276056,
"learning_rate": 2.3361462224312094e-05,
"loss": 0.2224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1860155165195465,
"step": 2340,
"valid_targets_mean": 4172.9,
"valid_targets_min": 968
},
{
"epoch": 3.521021021021021,
"grad_norm": 0.5430832529381092,
"learning_rate": 2.3287615183579126e-05,
"loss": 0.2485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23752620816230774,
"step": 2345,
"valid_targets_mean": 3755.6,
"valid_targets_min": 762
},
{
"epoch": 3.5285285285285286,
"grad_norm": 0.47304505139451253,
"learning_rate": 2.3213722047583517e-05,
"loss": 0.2238,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21495875716209412,
"step": 2350,
"valid_targets_mean": 5194.9,
"valid_targets_min": 781
},
{
"epoch": 3.536036036036036,
"grad_norm": 0.5593072985053018,
"learning_rate": 2.3139783852372157e-05,
"loss": 0.2415,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.32621026039123535,
"step": 2355,
"valid_targets_mean": 5330.6,
"valid_targets_min": 483
},
{
"epoch": 3.5435435435435436,
"grad_norm": 0.5133771865366825,
"learning_rate": 2.306580163462373e-05,
"loss": 0.2152,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24318471550941467,
"step": 2360,
"valid_targets_mean": 5257.0,
"valid_targets_min": 850
},
{
"epoch": 3.551051051051051,
"grad_norm": 0.7096881143231963,
"learning_rate": 2.299177643163413e-05,
"loss": 0.2412,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24741387367248535,
"step": 2365,
"valid_targets_mean": 2511.2,
"valid_targets_min": 508
},
{
"epoch": 3.5585585585585586,
"grad_norm": 0.5184545440577579,
"learning_rate": 2.2917709281301946e-05,
"loss": 0.2377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28968262672424316,
"step": 2370,
"valid_targets_mean": 4808.0,
"valid_targets_min": 628
},
{
"epoch": 3.566066066066066,
"grad_norm": 0.5497412004652409,
"learning_rate": 2.2843601222113915e-05,
"loss": 0.2846,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24640163779258728,
"step": 2375,
"valid_targets_mean": 4700.1,
"valid_targets_min": 418
},
{
"epoch": 3.5735735735735736,
"grad_norm": 0.543092075993824,
"learning_rate": 2.2769453293130345e-05,
"loss": 0.2377,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2757692039012909,
"step": 2380,
"valid_targets_mean": 3818.9,
"valid_targets_min": 423
},
{
"epoch": 3.581081081081081,
"grad_norm": 0.4756311989207704,
"learning_rate": 2.2695266533970556e-05,
"loss": 0.242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2674590051174164,
"step": 2385,
"valid_targets_mean": 5847.6,
"valid_targets_min": 794
},
{
"epoch": 3.5885885885885886,
"grad_norm": 0.7040802634858209,
"learning_rate": 2.2621041984798304e-05,
"loss": 0.2401,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27846670150756836,
"step": 2390,
"valid_targets_mean": 2509.4,
"valid_targets_min": 686
},
{
"epoch": 3.596096096096096,
"grad_norm": 0.6323033311574447,
"learning_rate": 2.2546780686307183e-05,
"loss": 0.2495,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23559826612472534,
"step": 2395,
"valid_targets_mean": 4216.6,
"valid_targets_min": 608
},
{
"epoch": 3.6036036036036037,
"grad_norm": 0.5439419831820919,
"learning_rate": 2.2472483679706067e-05,
"loss": 0.2578,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.271353542804718,
"step": 2400,
"valid_targets_mean": 4691.6,
"valid_targets_min": 755
},
{
"epoch": 3.611111111111111,
"grad_norm": 0.657338134532918,
"learning_rate": 2.2398152006704463e-05,
"loss": 0.2602,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26753100752830505,
"step": 2405,
"valid_targets_mean": 3173.4,
"valid_targets_min": 404
},
{
"epoch": 3.6186186186186187,
"grad_norm": 0.45053072622125706,
"learning_rate": 2.232378670949795e-05,
"loss": 0.2137,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18780098855495453,
"step": 2410,
"valid_targets_mean": 5203.4,
"valid_targets_min": 1334
},
{
"epoch": 3.626126126126126,
"grad_norm": 0.4023749713359982,
"learning_rate": 2.2249388830753534e-05,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17731866240501404,
"step": 2415,
"valid_targets_mean": 5612.2,
"valid_targets_min": 480
},
{
"epoch": 3.6336336336336337,
"grad_norm": 0.5062285511706474,
"learning_rate": 2.217495941359506e-05,
"loss": 0.2514,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23712016642093658,
"step": 2420,
"valid_targets_mean": 4567.2,
"valid_targets_min": 567
},
{
"epoch": 3.641141141141141,
"grad_norm": 0.5407394227692897,
"learning_rate": 2.2100499501588558e-05,
"loss": 0.2402,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25140225887298584,
"step": 2425,
"valid_targets_mean": 4480.6,
"valid_targets_min": 801
},
{
"epoch": 3.6486486486486487,
"grad_norm": 0.5432137809783814,
"learning_rate": 2.2026010138727628e-05,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23100072145462036,
"step": 2430,
"valid_targets_mean": 4535.2,
"valid_targets_min": 696
},
{
"epoch": 3.656156156156156,
"grad_norm": 0.5702741738198654,
"learning_rate": 2.1951492369418786e-05,
"loss": 0.2448,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24533988535404205,
"step": 2435,
"valid_targets_mean": 4315.2,
"valid_targets_min": 571
},
{
"epoch": 3.6636636636636637,
"grad_norm": 0.6650337977127149,
"learning_rate": 2.1876947238466838e-05,
"loss": 0.256,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2869791090488434,
"step": 2440,
"valid_targets_mean": 3385.6,
"valid_targets_min": 557
},
{
"epoch": 3.671171171171171,
"grad_norm": 0.473867504379004,
"learning_rate": 2.1802375791060232e-05,
"loss": 0.2315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18947833776474,
"step": 2445,
"valid_targets_mean": 5216.6,
"valid_targets_min": 742
},
{
"epoch": 3.6786786786786787,
"grad_norm": 0.7199290550127364,
"learning_rate": 2.1727779072756388e-05,
"loss": 0.2197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.30827030539512634,
"step": 2450,
"valid_targets_mean": 4398.8,
"valid_targets_min": 696
},
{
"epoch": 3.686186186186186,
"grad_norm": 0.6169439986122458,
"learning_rate": 2.1653158129467048e-05,
"loss": 0.281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2743998169898987,
"step": 2455,
"valid_targets_mean": 3159.7,
"valid_targets_min": 683
},
{
"epoch": 3.6936936936936937,
"grad_norm": 0.630068337186312,
"learning_rate": 2.1578514007443602e-05,
"loss": 0.2446,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2756376266479492,
"step": 2460,
"valid_targets_mean": 3321.1,
"valid_targets_min": 663
},
{
"epoch": 3.701201201201201,
"grad_norm": 8.40963413100615,
"learning_rate": 2.1503847753262447e-05,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21705785393714905,
"step": 2465,
"valid_targets_mean": 5065.1,
"valid_targets_min": 1345
},
{
"epoch": 3.7087087087087087,
"grad_norm": 0.8840964089151675,
"learning_rate": 2.1429160413810268e-05,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2861403822898865,
"step": 2470,
"valid_targets_mean": 5522.8,
"valid_targets_min": 991
},
{
"epoch": 3.7162162162162162,
"grad_norm": 0.47904088821045393,
"learning_rate": 2.1354453036269397e-05,
"loss": 0.2283,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.182481050491333,
"step": 2475,
"valid_targets_mean": 3823.9,
"valid_targets_min": 657
},
{
"epoch": 3.7237237237237237,
"grad_norm": 0.6350177279756045,
"learning_rate": 2.1279726668103112e-05,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.289498507976532,
"step": 2480,
"valid_targets_mean": 3174.9,
"valid_targets_min": 597
},
{
"epoch": 3.7312312312312312,
"grad_norm": 0.5475085951271096,
"learning_rate": 2.1204982357040974e-05,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2232646644115448,
"step": 2485,
"valid_targets_mean": 3746.9,
"valid_targets_min": 684
},
{
"epoch": 3.7387387387387387,
"grad_norm": 0.5721638552098921,
"learning_rate": 2.1130221151064095e-05,
"loss": 0.2408,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2669849693775177,
"step": 2490,
"valid_targets_mean": 4861.1,
"valid_targets_min": 469
},
{
"epoch": 3.7462462462462462,
"grad_norm": 0.46167196232037994,
"learning_rate": 2.105544409839048e-05,
"loss": 0.2249,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1929030418395996,
"step": 2495,
"valid_targets_mean": 4768.8,
"valid_targets_min": 888
},
{
"epoch": 3.7537537537537538,
"grad_norm": 0.5709387953688929,
"learning_rate": 2.098065224746031e-05,
"loss": 0.2465,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26624026894569397,
"step": 2500,
"valid_targets_mean": 3260.7,
"valid_targets_min": 788
},
{
"epoch": 3.7612612612612613,
"grad_norm": 0.5636970256534266,
"learning_rate": 2.0905846646921266e-05,
"loss": 0.2595,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29653650522232056,
"step": 2505,
"valid_targets_mean": 3569.1,
"valid_targets_min": 856
},
{
"epoch": 3.7687687687687688,
"grad_norm": 0.4293486036135388,
"learning_rate": 2.0831028345613807e-05,
"loss": 0.2521,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22826270759105682,
"step": 2510,
"valid_targets_mean": 5393.5,
"valid_targets_min": 404
},
{
"epoch": 3.7762762762762763,
"grad_norm": 0.5914611642027671,
"learning_rate": 2.0756198392556458e-05,
"loss": 0.2313,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22963778674602509,
"step": 2515,
"valid_targets_mean": 2932.8,
"valid_targets_min": 513
},
{
"epoch": 3.7837837837837838,
"grad_norm": 0.5163134230928269,
"learning_rate": 2.0681357836931114e-05,
"loss": 0.224,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.207438126206398,
"step": 2520,
"valid_targets_mean": 4660.4,
"valid_targets_min": 750
},
{
"epoch": 3.7912912912912913,
"grad_norm": 0.7190308106564102,
"learning_rate": 2.0606507728068338e-05,
"loss": 0.2276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2699480652809143,
"step": 2525,
"valid_targets_mean": 2463.4,
"valid_targets_min": 475
},
{
"epoch": 3.798798798798799,
"grad_norm": 0.6346404271383566,
"learning_rate": 2.0531649115432626e-05,
"loss": 0.2426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26241040229797363,
"step": 2530,
"valid_targets_mean": 3470.4,
"valid_targets_min": 613
},
{
"epoch": 3.8063063063063063,
"grad_norm": 0.5405574803276272,
"learning_rate": 2.0456783048607708e-05,
"loss": 0.234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2565130591392517,
"step": 2535,
"valid_targets_mean": 4024.1,
"valid_targets_min": 669
},
{
"epoch": 3.813813813813814,
"grad_norm": 0.604890803793606,
"learning_rate": 2.038191057728183e-05,
"loss": 0.2225,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2380007952451706,
"step": 2540,
"valid_targets_mean": 3456.8,
"valid_targets_min": 662
},
{
"epoch": 3.8213213213213213,
"grad_norm": 0.6793469587756615,
"learning_rate": 2.0307032751233038e-05,
"loss": 0.2593,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2839970290660858,
"step": 2545,
"valid_targets_mean": 4329.7,
"valid_targets_min": 681
},
{
"epoch": 3.828828828828829,
"grad_norm": 0.5213037499939942,
"learning_rate": 2.023215062031445e-05,
"loss": 0.247,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2534673511981964,
"step": 2550,
"valid_targets_mean": 4234.5,
"valid_targets_min": 437
},
{
"epoch": 3.8363363363363363,
"grad_norm": 0.48716095297652656,
"learning_rate": 2.0157265234439545e-05,
"loss": 0.2399,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17926955223083496,
"step": 2555,
"valid_targets_mean": 4508.6,
"valid_targets_min": 404
},
{
"epoch": 3.843843843843844,
"grad_norm": 0.45658767125521904,
"learning_rate": 2.0082377643567427e-05,
"loss": 0.2135,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16734261810779572,
"step": 2560,
"valid_targets_mean": 4532.5,
"valid_targets_min": 484
},
{
"epoch": 3.8513513513513513,
"grad_norm": 0.5887721035383384,
"learning_rate": 2.0007488897688145e-05,
"loss": 0.2469,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2615935802459717,
"step": 2565,
"valid_targets_mean": 3602.4,
"valid_targets_min": 596
},
{
"epoch": 3.858858858858859,
"grad_norm": 0.5556930711337941,
"learning_rate": 1.9932600046807914e-05,
"loss": 0.2355,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1911911964416504,
"step": 2570,
"valid_targets_mean": 3493.8,
"valid_targets_min": 801
},
{
"epoch": 3.8663663663663663,
"grad_norm": 0.4918999956248638,
"learning_rate": 1.985771214093444e-05,
"loss": 0.2162,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19995930790901184,
"step": 2575,
"valid_targets_mean": 4204.2,
"valid_targets_min": 634
},
{
"epoch": 3.873873873873874,
"grad_norm": 0.52841578647817,
"learning_rate": 1.9782826230062155e-05,
"loss": 0.2705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28531813621520996,
"step": 2580,
"valid_targets_mean": 4070.0,
"valid_targets_min": 731
},
{
"epoch": 3.8813813813813813,
"grad_norm": 0.5040983553316225,
"learning_rate": 1.9707943364157552e-05,
"loss": 0.2039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18574920296669006,
"step": 2585,
"valid_targets_mean": 3998.8,
"valid_targets_min": 416
},
{
"epoch": 3.888888888888889,
"grad_norm": 0.49554889736984387,
"learning_rate": 1.9633064593144408e-05,
"loss": 0.217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20392203330993652,
"step": 2590,
"valid_targets_mean": 4092.8,
"valid_targets_min": 638
},
{
"epoch": 3.8963963963963963,
"grad_norm": 0.4727254866083527,
"learning_rate": 1.9558190966889093e-05,
"loss": 0.2598,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21000804007053375,
"step": 2595,
"valid_targets_mean": 5088.9,
"valid_targets_min": 615
},
{
"epoch": 3.903903903903904,
"grad_norm": 0.43824564462204646,
"learning_rate": 1.9483323535185838e-05,
"loss": 0.2129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1834757924079895,
"step": 2600,
"valid_targets_mean": 4795.2,
"valid_targets_min": 852
},
{
"epoch": 3.9114114114114114,
"grad_norm": 0.4414256886221553,
"learning_rate": 1.940846334774203e-05,
"loss": 0.2198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1729404479265213,
"step": 2605,
"valid_targets_mean": 4699.6,
"valid_targets_min": 635
},
{
"epoch": 3.918918918918919,
"grad_norm": 0.5060621091961622,
"learning_rate": 1.933361145416348e-05,
"loss": 0.2215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2322886735200882,
"step": 2610,
"valid_targets_mean": 6213.0,
"valid_targets_min": 639
},
{
"epoch": 3.9264264264264264,
"grad_norm": 0.593672866808795,
"learning_rate": 1.9258768903939706e-05,
"loss": 0.2432,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24251478910446167,
"step": 2615,
"valid_targets_mean": 3359.5,
"valid_targets_min": 591
},
{
"epoch": 3.933933933933934,
"grad_norm": 0.4404905443315122,
"learning_rate": 1.9183936746429234e-05,
"loss": 0.2666,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2132512629032135,
"step": 2620,
"valid_targets_mean": 5353.2,
"valid_targets_min": 322
},
{
"epoch": 3.9414414414414414,
"grad_norm": 0.5116438369388818,
"learning_rate": 1.9109116030844874e-05,
"loss": 0.2318,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27721619606018066,
"step": 2625,
"valid_targets_mean": 4330.2,
"valid_targets_min": 757
},
{
"epoch": 3.948948948948949,
"grad_norm": 0.5905044794050749,
"learning_rate": 1.9034307806239004e-05,
"loss": 0.2603,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.33162492513656616,
"step": 2630,
"valid_targets_mean": 4979.0,
"valid_targets_min": 434
},
{
"epoch": 3.9564564564564564,
"grad_norm": 0.5353633419703424,
"learning_rate": 1.8959513121488868e-05,
"loss": 0.2544,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23549598455429077,
"step": 2635,
"valid_targets_mean": 4418.6,
"valid_targets_min": 858
},
{
"epoch": 3.963963963963964,
"grad_norm": 0.47963900371966894,
"learning_rate": 1.8884733025281876e-05,
"loss": 0.244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1948413848876953,
"step": 2640,
"valid_targets_mean": 4141.8,
"valid_targets_min": 726
},
{
"epoch": 3.9714714714714714,
"grad_norm": 0.44606918683200836,
"learning_rate": 1.880996856610088e-05,
"loss": 0.2417,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21382328867912292,
"step": 2645,
"valid_targets_mean": 5472.8,
"valid_targets_min": 745
},
{
"epoch": 3.978978978978979,
"grad_norm": 0.5149587332986721,
"learning_rate": 1.8735220792209513e-05,
"loss": 0.228,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19594892859458923,
"step": 2650,
"valid_targets_mean": 4153.9,
"valid_targets_min": 598
},
{
"epoch": 3.9864864864864864,
"grad_norm": 0.5874287195534135,
"learning_rate": 1.8660490751637435e-05,
"loss": 0.2352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22586959600448608,
"step": 2655,
"valid_targets_mean": 3378.9,
"valid_targets_min": 506
},
{
"epoch": 3.993993993993994,
"grad_norm": 0.46189741004980345,
"learning_rate": 1.858577949216569e-05,
"loss": 0.2134,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2193407416343689,
"step": 2660,
"valid_targets_mean": 4348.1,
"valid_targets_min": 447
},
{
"epoch": 4.001501501501502,
"grad_norm": 0.5233378328639746,
"learning_rate": 1.8511088061311982e-05,
"loss": 0.2246,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2248275727033615,
"step": 2665,
"valid_targets_mean": 3952.7,
"valid_targets_min": 671
},
{
"epoch": 4.009009009009009,
"grad_norm": 0.6071971400069938,
"learning_rate": 1.8436417506316013e-05,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23917962610721588,
"step": 2670,
"valid_targets_mean": 3420.5,
"valid_targets_min": 429
},
{
"epoch": 4.016516516516517,
"grad_norm": 0.5914162200350297,
"learning_rate": 1.8361768874124778e-05,
"loss": 0.2518,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2445971816778183,
"step": 2675,
"valid_targets_mean": 4843.9,
"valid_targets_min": 471
},
{
"epoch": 4.024024024024024,
"grad_norm": 0.547907620188072,
"learning_rate": 1.8287143211377893e-05,
"loss": 0.2157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1973641812801361,
"step": 2680,
"valid_targets_mean": 4041.2,
"valid_targets_min": 418
},
{
"epoch": 4.031531531531532,
"grad_norm": 0.5133198173072647,
"learning_rate": 1.8212541564392924e-05,
"loss": 0.2281,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17949888110160828,
"step": 2685,
"valid_targets_mean": 3785.6,
"valid_targets_min": 600
},
{
"epoch": 4.039039039039039,
"grad_norm": 0.47846466241843566,
"learning_rate": 1.813796497915073e-05,
"loss": 0.2478,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2564462423324585,
"step": 2690,
"valid_targets_mean": 5844.4,
"valid_targets_min": 506
},
{
"epoch": 4.046546546546547,
"grad_norm": 0.569435583148903,
"learning_rate": 1.806341450128076e-05,
"loss": 0.2314,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22870904207229614,
"step": 2695,
"valid_targets_mean": 4163.9,
"valid_targets_min": 699
},
{
"epoch": 4.054054054054054,
"grad_norm": 0.5070243213845931,
"learning_rate": 1.798889117604643e-05,
"loss": 0.2164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23002973198890686,
"step": 2700,
"valid_targets_mean": 4445.3,
"valid_targets_min": 705
},
{
"epoch": 4.061561561561562,
"grad_norm": 0.4867044644660382,
"learning_rate": 1.7914396048330428e-05,
"loss": 0.1903,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19053609669208527,
"step": 2705,
"valid_targets_mean": 4508.4,
"valid_targets_min": 569
},
{
"epoch": 4.069069069069069,
"grad_norm": 0.5805381784749756,
"learning_rate": 1.7839930162620128e-05,
"loss": 0.2136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1698979139328003,
"step": 2710,
"valid_targets_mean": 3140.1,
"valid_targets_min": 798
},
{
"epoch": 4.076576576576577,
"grad_norm": 0.602504277734938,
"learning_rate": 1.7765494562992878e-05,
"loss": 0.2122,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18390074372291565,
"step": 2715,
"valid_targets_mean": 3297.9,
"valid_targets_min": 534
},
{
"epoch": 4.084084084084084,
"grad_norm": 0.6470125645401709,
"learning_rate": 1.7691090293101386e-05,
"loss": 0.2572,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.28710392117500305,
"step": 2720,
"valid_targets_mean": 3918.4,
"valid_targets_min": 437
},
{
"epoch": 4.091591591591592,
"grad_norm": 0.5066063002958375,
"learning_rate": 1.76167183961591e-05,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2291889488697052,
"step": 2725,
"valid_targets_mean": 5055.3,
"valid_targets_min": 388
},
{
"epoch": 4.099099099099099,
"grad_norm": 0.6455258191217119,
"learning_rate": 1.7542379914925575e-05,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23442783951759338,
"step": 2730,
"valid_targets_mean": 2962.8,
"valid_targets_min": 666
},
{
"epoch": 4.106606606606607,
"grad_norm": 0.7386040382747444,
"learning_rate": 1.7468075891691832e-05,
"loss": 0.2052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21252450346946716,
"step": 2735,
"valid_targets_mean": 3100.8,
"valid_targets_min": 518
},
{
"epoch": 4.114114114114114,
"grad_norm": 0.48445294014230816,
"learning_rate": 1.7393807368265777e-05,
"loss": 0.208,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22077061235904694,
"step": 2740,
"valid_targets_mean": 5577.0,
"valid_targets_min": 614
},
{
"epoch": 4.121621621621622,
"grad_norm": 0.48865023064949326,
"learning_rate": 1.731957538595756e-05,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19657564163208008,
"step": 2745,
"valid_targets_mean": 4633.6,
"valid_targets_min": 542
},
{
"epoch": 4.129129129129129,
"grad_norm": 0.6690952004993063,
"learning_rate": 1.7245380985565014e-05,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18894386291503906,
"step": 2750,
"valid_targets_mean": 3604.8,
"valid_targets_min": 437
},
{
"epoch": 4.136636636636637,
"grad_norm": 0.7195870104883615,
"learning_rate": 1.7171225207359023e-05,
"loss": 0.2258,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27104708552360535,
"step": 2755,
"valid_targets_mean": 3011.1,
"valid_targets_min": 948
},
{
"epoch": 4.1441441441441444,
"grad_norm": 0.5379416037342353,
"learning_rate": 1.7097109091068965e-05,
"loss": 0.2531,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3290520906448364,
"step": 2760,
"valid_targets_mean": 6327.2,
"valid_targets_min": 875
},
{
"epoch": 4.151651651651652,
"grad_norm": 0.4819288545219707,
"learning_rate": 1.7023033675868107e-05,
"loss": 0.2337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19341519474983215,
"step": 2765,
"valid_targets_mean": 5650.7,
"valid_targets_min": 1052
},
{
"epoch": 4.1591591591591595,
"grad_norm": 0.4339406422217775,
"learning_rate": 1.694900000035907e-05,
"loss": 0.1945,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18829095363616943,
"step": 2770,
"valid_targets_mean": 5408.4,
"valid_targets_min": 808
},
{
"epoch": 4.166666666666667,
"grad_norm": 0.5494279815313058,
"learning_rate": 1.687500910255924e-05,
"loss": 0.2345,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29033520817756653,
"step": 2775,
"valid_targets_mean": 4524.4,
"valid_targets_min": 660
},
{
"epoch": 4.1741741741741745,
"grad_norm": 0.4489742319836925,
"learning_rate": 1.6801062019886216e-05,
"loss": 0.2443,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2034509927034378,
"step": 2780,
"valid_targets_mean": 4920.3,
"valid_targets_min": 427
},
{
"epoch": 4.181681681681682,
"grad_norm": 0.5280057369516138,
"learning_rate": 1.6727159789143276e-05,
"loss": 0.2251,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25000298023223877,
"step": 2785,
"valid_targets_mean": 6445.3,
"valid_targets_min": 460
},
{
"epoch": 4.1891891891891895,
"grad_norm": 0.570852623942594,
"learning_rate": 1.665330344650484e-05,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23752200603485107,
"step": 2790,
"valid_targets_mean": 4025.2,
"valid_targets_min": 639
},
{
"epoch": 4.196696696696697,
"grad_norm": 0.5022860617467421,
"learning_rate": 1.6579494027501926e-05,
"loss": 0.2702,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25862377882003784,
"step": 2795,
"valid_targets_mean": 5591.9,
"valid_targets_min": 1079
},
{
"epoch": 4.2042042042042045,
"grad_norm": 0.5808638456409436,
"learning_rate": 1.6505732567007644e-05,
"loss": 0.2144,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2629520297050476,
"step": 2800,
"valid_targets_mean": 4279.3,
"valid_targets_min": 681
},
{
"epoch": 4.211711711711712,
"grad_norm": 0.5011677067782193,
"learning_rate": 1.6432020099222686e-05,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17377246916294098,
"step": 2805,
"valid_targets_mean": 4540.3,
"valid_targets_min": 506
},
{
"epoch": 4.2192192192192195,
"grad_norm": 0.6312221103561748,
"learning_rate": 1.635835765766082e-05,
"loss": 0.1895,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1711842268705368,
"step": 2810,
"valid_targets_mean": 4152.6,
"valid_targets_min": 576
},
{
"epoch": 4.226726726726727,
"grad_norm": 0.5455241347866726,
"learning_rate": 1.6284746275134413e-05,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2519665062427521,
"step": 2815,
"valid_targets_mean": 4392.9,
"valid_targets_min": 605
},
{
"epoch": 4.2342342342342345,
"grad_norm": 0.544839041978784,
"learning_rate": 1.621118698373992e-05,
"loss": 0.2643,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22317945957183838,
"step": 2820,
"valid_targets_mean": 4256.4,
"valid_targets_min": 508
},
{
"epoch": 4.241741741741742,
"grad_norm": 0.5207115855205976,
"learning_rate": 1.6137680814843447e-05,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26101672649383545,
"step": 2825,
"valid_targets_mean": 4533.8,
"valid_targets_min": 702
},
{
"epoch": 4.2492492492492495,
"grad_norm": 0.7554547871541064,
"learning_rate": 1.6064228799066272e-05,
"loss": 0.2369,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2488705813884735,
"step": 2830,
"valid_targets_mean": 3717.3,
"valid_targets_min": 599
},
{
"epoch": 4.256756756756757,
"grad_norm": 0.5076882374389426,
"learning_rate": 1.5990831966270396e-05,
"loss": 0.2121,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20610791444778442,
"step": 2835,
"valid_targets_mean": 5082.6,
"valid_targets_min": 660
},
{
"epoch": 4.2642642642642645,
"grad_norm": 0.563842648058139,
"learning_rate": 1.5917491345544113e-05,
"loss": 0.2136,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18700063228607178,
"step": 2840,
"valid_targets_mean": 4268.7,
"valid_targets_min": 596
},
{
"epoch": 4.271771771771772,
"grad_norm": 0.5630065305626606,
"learning_rate": 1.584420796518756e-05,
"loss": 0.244,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2228190302848816,
"step": 2845,
"valid_targets_mean": 3847.0,
"valid_targets_min": 865
},
{
"epoch": 4.2792792792792795,
"grad_norm": 0.5990679311909958,
"learning_rate": 1.5770982852698337e-05,
"loss": 0.2485,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2809998095035553,
"step": 2850,
"valid_targets_mean": 3885.7,
"valid_targets_min": 634
},
{
"epoch": 4.286786786786787,
"grad_norm": 0.5512552937482088,
"learning_rate": 1.5697817034757052e-05,
"loss": 0.2027,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1838597059249878,
"step": 2855,
"valid_targets_mean": 3917.1,
"valid_targets_min": 550
},
{
"epoch": 4.2942942942942945,
"grad_norm": 0.560081521292376,
"learning_rate": 1.5624711537212967e-05,
"loss": 0.2265,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20176030695438385,
"step": 2860,
"valid_targets_mean": 3504.7,
"valid_targets_min": 694
},
{
"epoch": 4.301801801801802,
"grad_norm": 0.7258528593213625,
"learning_rate": 1.5551667385069593e-05,
"loss": 0.2005,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22372370958328247,
"step": 2865,
"valid_targets_mean": 2295.4,
"valid_targets_min": 423
},
{
"epoch": 4.3093093093093096,
"grad_norm": 0.7471444365279868,
"learning_rate": 1.5478685602470324e-05,
"loss": 0.2511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24615955352783203,
"step": 2870,
"valid_targets_mean": 3811.6,
"valid_targets_min": 748
},
{
"epoch": 4.316816816816817,
"grad_norm": 0.6829203066694415,
"learning_rate": 1.5405767212684078e-05,
"loss": 0.2372,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21476216614246368,
"step": 2875,
"valid_targets_mean": 3288.6,
"valid_targets_min": 535
},
{
"epoch": 4.324324324324325,
"grad_norm": 0.5733535380374483,
"learning_rate": 1.5332913238090962e-05,
"loss": 0.2276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2381066530942917,
"step": 2880,
"valid_targets_mean": 3251.5,
"valid_targets_min": 697
},
{
"epoch": 4.331831831831832,
"grad_norm": 0.6499639228286483,
"learning_rate": 1.52601247001679e-05,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23366223275661469,
"step": 2885,
"valid_targets_mean": 2987.1,
"valid_targets_min": 539
},
{
"epoch": 4.33933933933934,
"grad_norm": 0.6285744664120035,
"learning_rate": 1.5187402619474361e-05,
"loss": 0.2083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.195681631565094,
"step": 2890,
"valid_targets_mean": 4077.1,
"valid_targets_min": 678
},
{
"epoch": 4.346846846846847,
"grad_norm": 0.6210882117570284,
"learning_rate": 1.5114748015638013e-05,
"loss": 0.2127,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21708352863788605,
"step": 2895,
"valid_targets_mean": 4107.8,
"valid_targets_min": 760
},
{
"epoch": 4.354354354354355,
"grad_norm": 0.5855096649034774,
"learning_rate": 1.5042161907340438e-05,
"loss": 0.2292,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25563323497772217,
"step": 2900,
"valid_targets_mean": 3565.5,
"valid_targets_min": 562
},
{
"epoch": 4.361861861861862,
"grad_norm": 0.5300025815920703,
"learning_rate": 1.4969645312302851e-05,
"loss": 0.2197,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22752434015274048,
"step": 2905,
"valid_targets_mean": 4113.8,
"valid_targets_min": 381
},
{
"epoch": 4.36936936936937,
"grad_norm": 0.5804189010231626,
"learning_rate": 1.4897199247271842e-05,
"loss": 0.2025,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1874658167362213,
"step": 2910,
"valid_targets_mean": 3798.9,
"valid_targets_min": 452
},
{
"epoch": 4.376876876876877,
"grad_norm": 0.48760141515061334,
"learning_rate": 1.4824824728005092e-05,
"loss": 0.2434,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.257068395614624,
"step": 2915,
"valid_targets_mean": 5025.7,
"valid_targets_min": 584
},
{
"epoch": 4.384384384384385,
"grad_norm": 0.658477050968013,
"learning_rate": 1.4752522769257152e-05,
"loss": 0.2147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22656235098838806,
"step": 2920,
"valid_targets_mean": 3549.4,
"valid_targets_min": 624
},
{
"epoch": 4.391891891891892,
"grad_norm": 0.7492347794498558,
"learning_rate": 1.468029438476521e-05,
"loss": 0.2305,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22716817259788513,
"step": 2925,
"valid_targets_mean": 2520.4,
"valid_targets_min": 536
},
{
"epoch": 4.3993993993994,
"grad_norm": 0.5532580940259121,
"learning_rate": 1.4608140587234887e-05,
"loss": 0.2064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20708701014518738,
"step": 2930,
"valid_targets_mean": 3850.1,
"valid_targets_min": 761
},
{
"epoch": 4.406906906906907,
"grad_norm": 0.4546505507730152,
"learning_rate": 1.453606238832602e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21117320656776428,
"step": 2935,
"valid_targets_mean": 6005.3,
"valid_targets_min": 813
},
{
"epoch": 4.414414414414415,
"grad_norm": 0.7252302746614107,
"learning_rate": 1.4464060798638484e-05,
"loss": 0.2291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18549787998199463,
"step": 2940,
"valid_targets_mean": 3605.3,
"valid_targets_min": 847
},
{
"epoch": 4.421921921921922,
"grad_norm": 0.43525814011469965,
"learning_rate": 1.4392136827698032e-05,
"loss": 0.1929,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16544996201992035,
"step": 2945,
"valid_targets_mean": 5133.1,
"valid_targets_min": 591
},
{
"epoch": 4.42942942942943,
"grad_norm": 0.6290052391762472,
"learning_rate": 1.4320291483942135e-05,
"loss": 0.2245,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21728135645389557,
"step": 2950,
"valid_targets_mean": 3071.6,
"valid_targets_min": 601
},
{
"epoch": 4.436936936936937,
"grad_norm": 0.568290272425125,
"learning_rate": 1.424852577470584e-05,
"loss": 0.2298,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18296922743320465,
"step": 2955,
"valid_targets_mean": 5362.2,
"valid_targets_min": 803
},
{
"epoch": 4.444444444444445,
"grad_norm": 0.603259783928807,
"learning_rate": 1.417684070620764e-05,
"loss": 0.2261,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23192979395389557,
"step": 2960,
"valid_targets_mean": 3260.2,
"valid_targets_min": 713
},
{
"epoch": 4.451951951951952,
"grad_norm": 0.5712898946994219,
"learning_rate": 1.4105237283535376e-05,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2266012728214264,
"step": 2965,
"valid_targets_mean": 4215.6,
"valid_targets_min": 691
},
{
"epoch": 4.45945945945946,
"grad_norm": 0.6445579585402789,
"learning_rate": 1.403371651063216e-05,
"loss": 0.2363,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24278521537780762,
"step": 2970,
"valid_targets_mean": 3313.9,
"valid_targets_min": 374
},
{
"epoch": 4.466966966966967,
"grad_norm": 0.5733027694106058,
"learning_rate": 1.3962279390282261e-05,
"loss": 0.243,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2066403329372406,
"step": 2975,
"valid_targets_mean": 4162.3,
"valid_targets_min": 764
},
{
"epoch": 4.474474474474475,
"grad_norm": 0.613924525173538,
"learning_rate": 1.3890926924097071e-05,
"loss": 0.1938,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20435193181037903,
"step": 2980,
"valid_targets_mean": 3513.4,
"valid_targets_min": 652
},
{
"epoch": 4.481981981981982,
"grad_norm": 0.5403888711125328,
"learning_rate": 1.3819660112501054e-05,
"loss": 0.2242,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20203976333141327,
"step": 2985,
"valid_targets_mean": 4108.9,
"valid_targets_min": 655
},
{
"epoch": 4.48948948948949,
"grad_norm": 0.5594472556122174,
"learning_rate": 1.3748479954717735e-05,
"loss": 0.2462,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20039498805999756,
"step": 2990,
"valid_targets_mean": 3769.4,
"valid_targets_min": 504
},
{
"epoch": 4.496996996996997,
"grad_norm": 0.5426786497323537,
"learning_rate": 1.3677387448755657e-05,
"loss": 0.2068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21668657660484314,
"step": 2995,
"valid_targets_mean": 3945.2,
"valid_targets_min": 667
},
{
"epoch": 4.504504504504505,
"grad_norm": 0.4470248026304529,
"learning_rate": 1.360638359139442e-05,
"loss": 0.2203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2280035763978958,
"step": 3000,
"valid_targets_mean": 5678.4,
"valid_targets_min": 1551
},
{
"epoch": 4.512012012012012,
"grad_norm": 0.609794314414809,
"learning_rate": 1.3535469378170683e-05,
"loss": 0.239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2744963467121124,
"step": 3005,
"valid_targets_mean": 3750.4,
"valid_targets_min": 674
},
{
"epoch": 4.51951951951952,
"grad_norm": 0.4627448347366898,
"learning_rate": 1.3464645803364228e-05,
"loss": 0.2439,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21215581893920898,
"step": 3010,
"valid_targets_mean": 5590.1,
"valid_targets_min": 528
},
{
"epoch": 4.527027027027027,
"grad_norm": 0.6035357299819745,
"learning_rate": 1.3393913859983996e-05,
"loss": 0.2138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2198573499917984,
"step": 3015,
"valid_targets_mean": 6302.9,
"valid_targets_min": 789
},
{
"epoch": 4.534534534534535,
"grad_norm": 0.5643676209847303,
"learning_rate": 1.3323274539754177e-05,
"loss": 0.2198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25696855783462524,
"step": 3020,
"valid_targets_mean": 4303.8,
"valid_targets_min": 634
},
{
"epoch": 4.542042042042042,
"grad_norm": 0.570048922978165,
"learning_rate": 1.3252728833100296e-05,
"loss": 0.2203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19746547937393188,
"step": 3025,
"valid_targets_mean": 3560.8,
"valid_targets_min": 598
},
{
"epoch": 4.54954954954955,
"grad_norm": 0.4464417263684137,
"learning_rate": 1.3182277729135358e-05,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19879616796970367,
"step": 3030,
"valid_targets_mean": 7131.6,
"valid_targets_min": 460
},
{
"epoch": 4.557057057057057,
"grad_norm": 0.5089601591681008,
"learning_rate": 1.3111922215645922e-05,
"loss": 0.2126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23360319435596466,
"step": 3035,
"valid_targets_mean": 4634.0,
"valid_targets_min": 654
},
{
"epoch": 4.564564564564565,
"grad_norm": 0.6823720809640251,
"learning_rate": 1.3041663279078311e-05,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2097683995962143,
"step": 3040,
"valid_targets_mean": 2433.6,
"valid_targets_min": 562
},
{
"epoch": 4.572072072072072,
"grad_norm": 0.6700606322768459,
"learning_rate": 1.297150190452473e-05,
"loss": 0.2051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2061670869588852,
"step": 3045,
"valid_targets_mean": 2720.6,
"valid_targets_min": 529
},
{
"epoch": 4.57957957957958,
"grad_norm": 0.6228866174244457,
"learning_rate": 1.2901439075709506e-05,
"loss": 0.2165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18749915063381195,
"step": 3050,
"valid_targets_mean": 3271.4,
"valid_targets_min": 416
},
{
"epoch": 4.587087087087087,
"grad_norm": 0.600075319444778,
"learning_rate": 1.2831475774975247e-05,
"loss": 0.2088,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24314680695533752,
"step": 3055,
"valid_targets_mean": 4222.2,
"valid_targets_min": 520
},
{
"epoch": 4.594594594594595,
"grad_norm": 0.4219894648635082,
"learning_rate": 1.2761612983269094e-05,
"loss": 0.2195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18051698803901672,
"step": 3060,
"valid_targets_mean": 6413.9,
"valid_targets_min": 703
},
{
"epoch": 4.602102102102102,
"grad_norm": 0.5430062852225149,
"learning_rate": 1.2691851680128966e-05,
"loss": 0.2119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18320244550704956,
"step": 3065,
"valid_targets_mean": 3880.8,
"valid_targets_min": 727
},
{
"epoch": 4.60960960960961,
"grad_norm": 0.4910324433811435,
"learning_rate": 1.2622192843669826e-05,
"loss": 0.2111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1959684193134308,
"step": 3070,
"valid_targets_mean": 5296.5,
"valid_targets_min": 512
},
{
"epoch": 4.617117117117117,
"grad_norm": 0.5134831494706088,
"learning_rate": 1.255263745056996e-05,
"loss": 0.2051,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21355494856834412,
"step": 3075,
"valid_targets_mean": 5030.8,
"valid_targets_min": 469
},
{
"epoch": 4.624624624624625,
"grad_norm": 0.5527873198315599,
"learning_rate": 1.2483186476057281e-05,
"loss": 0.2181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1989469826221466,
"step": 3080,
"valid_targets_mean": 3602.9,
"valid_targets_min": 630
},
{
"epoch": 4.632132132132132,
"grad_norm": 0.7003658441849595,
"learning_rate": 1.2413840893895668e-05,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20069898664951324,
"step": 3085,
"valid_targets_mean": 3747.1,
"valid_targets_min": 474
},
{
"epoch": 4.63963963963964,
"grad_norm": 0.5774616260959406,
"learning_rate": 1.2344601676371312e-05,
"loss": 0.2107,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2032512128353119,
"step": 3090,
"valid_targets_mean": 5143.7,
"valid_targets_min": 1085
},
{
"epoch": 4.647147147147147,
"grad_norm": 0.609625942880746,
"learning_rate": 1.2275469794279068e-05,
"loss": 0.2376,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24463210999965668,
"step": 3095,
"valid_targets_mean": 3302.1,
"valid_targets_min": 211
},
{
"epoch": 4.654654654654655,
"grad_norm": 0.5539889957775487,
"learning_rate": 1.220644621690885e-05,
"loss": 0.2184,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19467709958553314,
"step": 3100,
"valid_targets_mean": 3723.1,
"valid_targets_min": 637
},
{
"epoch": 4.662162162162162,
"grad_norm": 0.5324494392088087,
"learning_rate": 1.2137531912032058e-05,
"loss": 0.2179,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2482069581747055,
"step": 3105,
"valid_targets_mean": 4753.6,
"valid_targets_min": 634
},
{
"epoch": 4.66966966966967,
"grad_norm": 0.5048180559075982,
"learning_rate": 1.2068727845887995e-05,
"loss": 0.2118,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24020060896873474,
"step": 3110,
"valid_targets_mean": 5051.0,
"valid_targets_min": 462
},
{
"epoch": 4.677177177177177,
"grad_norm": 0.4832724873118443,
"learning_rate": 1.2000034983170305e-05,
"loss": 0.2357,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22151488065719604,
"step": 3115,
"valid_targets_mean": 5193.5,
"valid_targets_min": 674
},
{
"epoch": 4.684684684684685,
"grad_norm": 0.5679523589750985,
"learning_rate": 1.193145428701347e-05,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2017378807067871,
"step": 3120,
"valid_targets_mean": 4752.9,
"valid_targets_min": 764
},
{
"epoch": 4.692192192192192,
"grad_norm": 0.8966754020165514,
"learning_rate": 1.18629867189793e-05,
"loss": 0.2302,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24184086918830872,
"step": 3125,
"valid_targets_mean": 2982.5,
"valid_targets_min": 515
},
{
"epoch": 4.6996996996997,
"grad_norm": 0.49411819508382815,
"learning_rate": 1.1794633239043449e-05,
"loss": 0.2028,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2202903926372528,
"step": 3130,
"valid_targets_mean": 4615.9,
"valid_targets_min": 738
},
{
"epoch": 4.707207207207207,
"grad_norm": 0.4928998645668594,
"learning_rate": 1.1726394805581957e-05,
"loss": 0.2398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21853674948215485,
"step": 3135,
"valid_targets_mean": 5042.8,
"valid_targets_min": 656
},
{
"epoch": 4.714714714714715,
"grad_norm": 0.5803190883509034,
"learning_rate": 1.1658272375357797e-05,
"loss": 0.2426,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24375799298286438,
"step": 3140,
"valid_targets_mean": 4044.2,
"valid_targets_min": 525
},
{
"epoch": 4.722222222222222,
"grad_norm": 0.5795814998007034,
"learning_rate": 1.1590266903507499e-05,
"loss": 0.2371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2230663299560547,
"step": 3145,
"valid_targets_mean": 4489.6,
"valid_targets_min": 930
},
{
"epoch": 4.72972972972973,
"grad_norm": 0.6742257430638947,
"learning_rate": 1.1522379343527708e-05,
"loss": 0.2535,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23786276578903198,
"step": 3150,
"valid_targets_mean": 4348.9,
"valid_targets_min": 534
},
{
"epoch": 4.737237237237237,
"grad_norm": 0.49627665219198364,
"learning_rate": 1.1454610647261859e-05,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2170691192150116,
"step": 3155,
"valid_targets_mean": 4579.3,
"valid_targets_min": 701
},
{
"epoch": 4.744744744744745,
"grad_norm": 0.4965773011218609,
"learning_rate": 1.1386961764886806e-05,
"loss": 0.2299,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21680960059165955,
"step": 3160,
"valid_targets_mean": 4751.6,
"valid_targets_min": 970
},
{
"epoch": 4.752252252252252,
"grad_norm": 0.46564876478736006,
"learning_rate": 1.1319433644899496e-05,
"loss": 0.2346,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20024517178535461,
"step": 3165,
"valid_targets_mean": 5608.7,
"valid_targets_min": 565
},
{
"epoch": 4.75975975975976,
"grad_norm": 0.8219903727111237,
"learning_rate": 1.1252027234103709e-05,
"loss": 0.2175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21334412693977356,
"step": 3170,
"valid_targets_mean": 3558.3,
"valid_targets_min": 684
},
{
"epoch": 4.767267267267267,
"grad_norm": 0.5331331638771257,
"learning_rate": 1.118474347759673e-05,
"loss": 0.2032,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23813585937023163,
"step": 3175,
"valid_targets_mean": 4562.6,
"valid_targets_min": 700
},
{
"epoch": 4.774774774774775,
"grad_norm": 0.7204879070632291,
"learning_rate": 1.1117583318756128e-05,
"loss": 0.2218,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21081534028053284,
"step": 3180,
"valid_targets_mean": 4559.9,
"valid_targets_min": 347
},
{
"epoch": 4.782282282282282,
"grad_norm": 0.6342862982793008,
"learning_rate": 1.1050547699226522e-05,
"loss": 0.2234,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21464157104492188,
"step": 3185,
"valid_targets_mean": 4187.8,
"valid_targets_min": 611
},
{
"epoch": 4.78978978978979,
"grad_norm": 0.5094911353991051,
"learning_rate": 1.09836375589064e-05,
"loss": 0.2126,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21020804345607758,
"step": 3190,
"valid_targets_mean": 5157.7,
"valid_targets_min": 1150
},
{
"epoch": 4.797297297297297,
"grad_norm": 0.47526721126268623,
"learning_rate": 1.0916853835934891e-05,
"loss": 0.2157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22524023056030273,
"step": 3195,
"valid_targets_mean": 5497.2,
"valid_targets_min": 714
},
{
"epoch": 4.804804804804805,
"grad_norm": 0.7451217907444951,
"learning_rate": 1.0850197466678662e-05,
"loss": 0.232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20764270424842834,
"step": 3200,
"valid_targets_mean": 4149.2,
"valid_targets_min": 628
},
{
"epoch": 4.812312312312312,
"grad_norm": 0.4957698184650846,
"learning_rate": 1.0783669385718762e-05,
"loss": 0.2371,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21627801656723022,
"step": 3205,
"valid_targets_mean": 5803.0,
"valid_targets_min": 790
},
{
"epoch": 4.81981981981982,
"grad_norm": 0.5309967929446427,
"learning_rate": 1.0717270525837523e-05,
"loss": 0.2449,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2549176514148712,
"step": 3210,
"valid_targets_mean": 5175.2,
"valid_targets_min": 558
},
{
"epoch": 4.827327327327327,
"grad_norm": 0.6675846311975975,
"learning_rate": 1.0651001818005487e-05,
"loss": 0.2157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2339574694633484,
"step": 3215,
"valid_targets_mean": 3242.3,
"valid_targets_min": 499
},
{
"epoch": 4.834834834834835,
"grad_norm": 0.5348472304451167,
"learning_rate": 1.0584864191368345e-05,
"loss": 0.2287,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2503393888473511,
"step": 3220,
"valid_targets_mean": 5664.9,
"valid_targets_min": 487
},
{
"epoch": 4.842342342342342,
"grad_norm": 0.5338144959827715,
"learning_rate": 1.0518858573233911e-05,
"loss": 0.2171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21501460671424866,
"step": 3225,
"valid_targets_mean": 4275.4,
"valid_targets_min": 631
},
{
"epoch": 4.84984984984985,
"grad_norm": 0.583867201837148,
"learning_rate": 1.0452985889059151e-05,
"loss": 0.2321,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2584874629974365,
"step": 3230,
"valid_targets_mean": 3758.3,
"valid_targets_min": 367
},
{
"epoch": 4.857357357357357,
"grad_norm": 0.4704381431905369,
"learning_rate": 1.0387247062437144e-05,
"loss": 0.2159,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2556239068508148,
"step": 3235,
"valid_targets_mean": 5887.3,
"valid_targets_min": 489
},
{
"epoch": 4.864864864864865,
"grad_norm": 0.6249528070324213,
"learning_rate": 1.0321643015084187e-05,
"loss": 0.2111,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23891428112983704,
"step": 3240,
"valid_targets_mean": 3309.9,
"valid_targets_min": 301
},
{
"epoch": 4.872372372372372,
"grad_norm": 0.44764920429718186,
"learning_rate": 1.0256174666826841e-05,
"loss": 0.213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19511452317237854,
"step": 3245,
"valid_targets_mean": 5169.8,
"valid_targets_min": 980
},
{
"epoch": 4.87987987987988,
"grad_norm": 0.5340956174536189,
"learning_rate": 1.0190842935589065e-05,
"loss": 0.206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18626420199871063,
"step": 3250,
"valid_targets_mean": 3967.4,
"valid_targets_min": 798
},
{
"epoch": 4.887387387387387,
"grad_norm": 0.56288269038886,
"learning_rate": 1.0125648737379307e-05,
"loss": 0.2185,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20922933518886566,
"step": 3255,
"valid_targets_mean": 4145.1,
"valid_targets_min": 511
},
{
"epoch": 4.894894894894895,
"grad_norm": 0.4659624202841574,
"learning_rate": 1.0060592986277693e-05,
"loss": 0.2216,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18871676921844482,
"step": 3260,
"valid_targets_mean": 5421.9,
"valid_targets_min": 2150
},
{
"epoch": 4.902402402402402,
"grad_norm": 0.5691277577002785,
"learning_rate": 9.995676594423186e-06,
"loss": 0.2241,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22213050723075867,
"step": 3265,
"valid_targets_mean": 4555.8,
"valid_targets_min": 839
},
{
"epoch": 4.90990990990991,
"grad_norm": 0.6445683801786387,
"learning_rate": 9.930900472000834e-06,
"loss": 0.1918,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20591846108436584,
"step": 3270,
"valid_targets_mean": 3039.4,
"valid_targets_min": 574
},
{
"epoch": 4.9174174174174174,
"grad_norm": 0.48632405588473493,
"learning_rate": 9.866265527228961e-06,
"loss": 0.2047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.224864199757576,
"step": 3275,
"valid_targets_mean": 5041.8,
"valid_targets_min": 562
},
{
"epoch": 4.924924924924925,
"grad_norm": 0.4551299572592259,
"learning_rate": 9.801772666346462e-06,
"loss": 0.2383,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17636257410049438,
"step": 3280,
"valid_targets_mean": 5264.3,
"valid_targets_min": 260
},
{
"epoch": 4.9324324324324325,
"grad_norm": 0.5303503051433811,
"learning_rate": 9.737422793600092e-06,
"loss": 0.2529,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2605491876602173,
"step": 3285,
"valid_targets_mean": 4923.2,
"valid_targets_min": 551
},
{
"epoch": 4.93993993993994,
"grad_norm": 0.5619328215648045,
"learning_rate": 9.67321681123179e-06,
"loss": 0.2219,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21425651013851166,
"step": 3290,
"valid_targets_mean": 4545.6,
"valid_targets_min": 515
},
{
"epoch": 4.9474474474474475,
"grad_norm": 0.4969814195952852,
"learning_rate": 9.609155619466016e-06,
"loss": 0.202,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19319353997707367,
"step": 3295,
"valid_targets_mean": 4383.9,
"valid_targets_min": 711
},
{
"epoch": 4.954954954954955,
"grad_norm": 0.6244151395343142,
"learning_rate": 9.545240116497143e-06,
"loss": 0.2181,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18449707329273224,
"step": 3300,
"valid_targets_mean": 3211.4,
"valid_targets_min": 484
},
{
"epoch": 4.9624624624624625,
"grad_norm": 0.5893223235253725,
"learning_rate": 9.481471198476855e-06,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22556568682193756,
"step": 3305,
"valid_targets_mean": 5031.6,
"valid_targets_min": 684
},
{
"epoch": 4.96996996996997,
"grad_norm": 0.4915902916242456,
"learning_rate": 9.417849759501603e-06,
"loss": 0.2226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2357444167137146,
"step": 3310,
"valid_targets_mean": 5379.2,
"valid_targets_min": 860
},
{
"epoch": 4.9774774774774775,
"grad_norm": 0.5245483991646102,
"learning_rate": 9.354376691600034e-06,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18305274844169617,
"step": 3315,
"valid_targets_mean": 4195.8,
"valid_targets_min": 388
},
{
"epoch": 4.984984984984985,
"grad_norm": 0.49053726456598334,
"learning_rate": 9.2910528847205e-06,
"loss": 0.2419,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23515072464942932,
"step": 3320,
"valid_targets_mean": 4802.1,
"valid_targets_min": 666
},
{
"epoch": 4.9924924924924925,
"grad_norm": 0.5458070078892359,
"learning_rate": 9.227879226718595e-06,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2729540467262268,
"step": 3325,
"valid_targets_mean": 4229.2,
"valid_targets_min": 716
},
{
"epoch": 5.0,
"grad_norm": 0.4617612878592164,
"learning_rate": 9.164856603344681e-06,
"loss": 0.2209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19838783144950867,
"step": 3330,
"valid_targets_mean": 5383.6,
"valid_targets_min": 1005
},
{
"epoch": 5.0075075075075075,
"grad_norm": 0.5006372512661854,
"learning_rate": 9.10198589823149e-06,
"loss": 0.2043,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21871143579483032,
"step": 3335,
"valid_targets_mean": 4899.0,
"valid_targets_min": 478
},
{
"epoch": 5.015015015015015,
"grad_norm": 0.493071836759497,
"learning_rate": 9.039267992881724e-06,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15860621631145477,
"step": 3340,
"valid_targets_mean": 4637.3,
"valid_targets_min": 539
},
{
"epoch": 5.0225225225225225,
"grad_norm": 0.5942000008682329,
"learning_rate": 8.97670376665569e-06,
"loss": 0.212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21339187026023865,
"step": 3345,
"valid_targets_mean": 4111.1,
"valid_targets_min": 482
},
{
"epoch": 5.03003003003003,
"grad_norm": 0.5098653931776418,
"learning_rate": 8.914294096758995e-06,
"loss": 0.2524,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21369382739067078,
"step": 3350,
"valid_targets_mean": 5529.7,
"valid_targets_min": 571
},
{
"epoch": 5.0375375375375375,
"grad_norm": 0.48801798277011926,
"learning_rate": 8.852039858230217e-06,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16710881888866425,
"step": 3355,
"valid_targets_mean": 4623.7,
"valid_targets_min": 694
},
{
"epoch": 5.045045045045045,
"grad_norm": 0.5406142033120225,
"learning_rate": 8.78994192392865e-06,
"loss": 0.1969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18688131868839264,
"step": 3360,
"valid_targets_mean": 3961.8,
"valid_targets_min": 529
},
{
"epoch": 5.0525525525525525,
"grad_norm": 0.49064863606657333,
"learning_rate": 8.728001164522068e-06,
"loss": 0.2054,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19211602210998535,
"step": 3365,
"valid_targets_mean": 5132.5,
"valid_targets_min": 557
},
{
"epoch": 5.06006006006006,
"grad_norm": 0.5428647141950651,
"learning_rate": 8.666218448474517e-06,
"loss": 0.2235,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19043126702308655,
"step": 3370,
"valid_targets_mean": 4518.9,
"valid_targets_min": 623
},
{
"epoch": 5.0675675675675675,
"grad_norm": 0.5285735991494391,
"learning_rate": 8.604594642034126e-06,
"loss": 0.2093,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22566662728786469,
"step": 3375,
"valid_targets_mean": 4554.3,
"valid_targets_min": 628
},
{
"epoch": 5.075075075075075,
"grad_norm": 0.6397497283612681,
"learning_rate": 8.543130609220982e-06,
"loss": 0.1913,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17037567496299744,
"step": 3380,
"valid_targets_mean": 3197.0,
"valid_targets_min": 631
},
{
"epoch": 5.0825825825825826,
"grad_norm": 0.5624772140252701,
"learning_rate": 8.481827211814991e-06,
"loss": 0.2315,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2726784348487854,
"step": 3385,
"valid_targets_mean": 4160.6,
"valid_targets_min": 727
},
{
"epoch": 5.09009009009009,
"grad_norm": 0.5877366129284431,
"learning_rate": 8.420685309343835e-06,
"loss": 0.2131,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20283541083335876,
"step": 3390,
"valid_targets_mean": 3707.2,
"valid_targets_min": 663
},
{
"epoch": 5.097597597597598,
"grad_norm": 0.6489090565754443,
"learning_rate": 8.35970575907087e-06,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2192349135875702,
"step": 3395,
"valid_targets_mean": 5407.1,
"valid_targets_min": 672
},
{
"epoch": 5.105105105105105,
"grad_norm": 0.5565202403018633,
"learning_rate": 8.298889415983142e-06,
"loss": 0.2057,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1590254306793213,
"step": 3400,
"valid_targets_mean": 3583.3,
"valid_targets_min": 735
},
{
"epoch": 5.112612612612613,
"grad_norm": 0.41960211523789304,
"learning_rate": 8.23823713277938e-06,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14446228742599487,
"step": 3405,
"valid_targets_mean": 5082.1,
"valid_targets_min": 276
},
{
"epoch": 5.12012012012012,
"grad_norm": 0.6517049110770983,
"learning_rate": 8.17774975985806e-06,
"loss": 0.207,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23023463785648346,
"step": 3410,
"valid_targets_mean": 4596.8,
"valid_targets_min": 786
},
{
"epoch": 5.127627627627628,
"grad_norm": 0.8256063611735115,
"learning_rate": 8.117428145305464e-06,
"loss": 0.1705,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19371360540390015,
"step": 3415,
"valid_targets_mean": 3733.1,
"valid_targets_min": 946
},
{
"epoch": 5.135135135135135,
"grad_norm": 0.47817908036094603,
"learning_rate": 8.057273134883794e-06,
"loss": 0.2065,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20559421181678772,
"step": 3420,
"valid_targets_mean": 5914.1,
"valid_targets_min": 746
},
{
"epoch": 5.142642642642643,
"grad_norm": 0.6404035798093046,
"learning_rate": 7.997285572019316e-06,
"loss": 0.2294,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19509994983673096,
"step": 3425,
"valid_targets_mean": 3609.6,
"valid_targets_min": 719
},
{
"epoch": 5.15015015015015,
"grad_norm": 0.7814615076086997,
"learning_rate": 7.937466297790542e-06,
"loss": 0.2033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17219263315200806,
"step": 3430,
"valid_targets_mean": 4124.9,
"valid_targets_min": 593
},
{
"epoch": 5.157657657657658,
"grad_norm": 0.5711178140418124,
"learning_rate": 7.877816150916422e-06,
"loss": 0.2186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20192334055900574,
"step": 3435,
"valid_targets_mean": 4497.1,
"valid_targets_min": 673
},
{
"epoch": 5.165165165165165,
"grad_norm": 0.6605000045012411,
"learning_rate": 7.81833596774459e-06,
"loss": 0.1922,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21957352757453918,
"step": 3440,
"valid_targets_mean": 3223.1,
"valid_targets_min": 617
},
{
"epoch": 5.172672672672673,
"grad_norm": 1.2228952471867771,
"learning_rate": 7.759026582239639e-06,
"loss": 0.1919,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2631041407585144,
"step": 3445,
"valid_targets_mean": 4348.8,
"valid_targets_min": 574
},
{
"epoch": 5.18018018018018,
"grad_norm": 0.858620752436695,
"learning_rate": 7.699888825971433e-06,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.162127286195755,
"step": 3450,
"valid_targets_mean": 6938.4,
"valid_targets_min": 683
},
{
"epoch": 5.187687687687688,
"grad_norm": 0.6070759956430632,
"learning_rate": 7.640923528103441e-06,
"loss": 0.2168,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2934483289718628,
"step": 3455,
"valid_targets_mean": 4662.9,
"valid_targets_min": 739
},
{
"epoch": 5.195195195195195,
"grad_norm": 0.5186921298999412,
"learning_rate": 7.582131515381108e-06,
"loss": 0.203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2093011438846588,
"step": 3460,
"valid_targets_mean": 4782.7,
"valid_targets_min": 492
},
{
"epoch": 5.202702702702703,
"grad_norm": 0.5661778349613429,
"learning_rate": 7.5235136121202675e-06,
"loss": 0.2171,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24795249104499817,
"step": 3465,
"valid_targets_mean": 4599.2,
"valid_targets_min": 324
},
{
"epoch": 5.21021021021021,
"grad_norm": 0.5360911975296877,
"learning_rate": 7.465070640195606e-06,
"loss": 0.2068,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26138007640838623,
"step": 3470,
"valid_targets_mean": 4960.6,
"valid_targets_min": 376
},
{
"epoch": 5.217717717717718,
"grad_norm": 0.5642393094183789,
"learning_rate": 7.406803419029094e-06,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24130575358867645,
"step": 3475,
"valid_targets_mean": 4966.7,
"valid_targets_min": 821
},
{
"epoch": 5.225225225225225,
"grad_norm": 0.4550076790955841,
"learning_rate": 7.3487127655785295e-06,
"loss": 0.2106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1952485740184784,
"step": 3480,
"valid_targets_mean": 5512.1,
"valid_targets_min": 622
},
{
"epoch": 5.232732732732733,
"grad_norm": 0.6885372734490723,
"learning_rate": 7.290799494326077e-06,
"loss": 0.2016,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16893789172172546,
"step": 3485,
"valid_targets_mean": 4656.0,
"valid_targets_min": 477
},
{
"epoch": 5.24024024024024,
"grad_norm": 0.5045869253443142,
"learning_rate": 7.233064417266846e-06,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16010183095932007,
"step": 3490,
"valid_targets_mean": 3909.6,
"valid_targets_min": 609
},
{
"epoch": 5.247747747747748,
"grad_norm": 0.6679277663347103,
"learning_rate": 7.1755083438975056e-06,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2579156756401062,
"step": 3495,
"valid_targets_mean": 3035.2,
"valid_targets_min": 410
},
{
"epoch": 5.255255255255255,
"grad_norm": 0.48166787337419537,
"learning_rate": 7.118132081204936e-06,
"loss": 0.2034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17768923938274384,
"step": 3500,
"valid_targets_mean": 4611.5,
"valid_targets_min": 540
},
{
"epoch": 5.262762762762763,
"grad_norm": 0.6437356623831512,
"learning_rate": 7.060936433654901e-06,
"loss": 0.2106,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22873665392398834,
"step": 3505,
"valid_targets_mean": 4224.2,
"valid_targets_min": 1214
},
{
"epoch": 5.27027027027027,
"grad_norm": 0.5041184297812231,
"learning_rate": 7.003922203180813e-06,
"loss": 0.1829,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17131251096725464,
"step": 3510,
"valid_targets_mean": 4996.4,
"valid_targets_min": 762
},
{
"epoch": 5.277777777777778,
"grad_norm": 0.42636959404581054,
"learning_rate": 6.947090189172425e-06,
"loss": 0.1905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17408744990825653,
"step": 3515,
"valid_targets_mean": 6548.1,
"valid_targets_min": 681
},
{
"epoch": 5.285285285285285,
"grad_norm": 0.7004634661839949,
"learning_rate": 6.89044118846467e-06,
"loss": 0.1871,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21478641033172607,
"step": 3520,
"valid_targets_mean": 3402.0,
"valid_targets_min": 534
},
{
"epoch": 5.292792792792793,
"grad_norm": 0.6584020869113968,
"learning_rate": 6.833975995326465e-06,
"loss": 0.2226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17992106080055237,
"step": 3525,
"valid_targets_mean": 3046.6,
"valid_targets_min": 592
},
{
"epoch": 5.3003003003003,
"grad_norm": 0.505387458907387,
"learning_rate": 6.777695401449591e-06,
"loss": 0.1905,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20670431852340698,
"step": 3530,
"valid_targets_mean": 5285.2,
"valid_targets_min": 893
},
{
"epoch": 5.307807807807808,
"grad_norm": 0.5767720272580488,
"learning_rate": 6.721600195937578e-06,
"loss": 0.1898,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18273615837097168,
"step": 3535,
"valid_targets_mean": 3702.8,
"valid_targets_min": 877
},
{
"epoch": 5.315315315315315,
"grad_norm": 0.5468384364940457,
"learning_rate": 6.665691165294654e-06,
"loss": 0.2308,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2389727234840393,
"step": 3540,
"valid_targets_mean": 4842.5,
"valid_targets_min": 1056
},
{
"epoch": 5.322822822822823,
"grad_norm": 0.5417666029457835,
"learning_rate": 6.609969093414699e-06,
"loss": 0.2186,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2088838666677475,
"step": 3545,
"valid_targets_mean": 4254.4,
"valid_targets_min": 367
},
{
"epoch": 5.33033033033033,
"grad_norm": 0.5649058281181645,
"learning_rate": 6.55443476157029e-06,
"loss": 0.1991,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1812952756881714,
"step": 3550,
"valid_targets_mean": 4252.7,
"valid_targets_min": 673
},
{
"epoch": 5.337837837837838,
"grad_norm": 0.5452388205148444,
"learning_rate": 6.4990889484017e-06,
"loss": 0.2067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1796906590461731,
"step": 3555,
"valid_targets_mean": 3792.6,
"valid_targets_min": 600
},
{
"epoch": 5.345345345345345,
"grad_norm": 0.5732225965401323,
"learning_rate": 6.443932429906013e-06,
"loss": 0.2323,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2930184006690979,
"step": 3560,
"valid_targets_mean": 4310.6,
"valid_targets_min": 541
},
{
"epoch": 5.352852852852853,
"grad_norm": 0.6028750589087655,
"learning_rate": 6.3889659794262334e-06,
"loss": 0.2129,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21735335886478424,
"step": 3565,
"valid_targets_mean": 3685.1,
"valid_targets_min": 583
},
{
"epoch": 5.36036036036036,
"grad_norm": 0.602478347893381,
"learning_rate": 6.334190367640449e-06,
"loss": 0.1793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18190817534923553,
"step": 3570,
"valid_targets_mean": 4439.8,
"valid_targets_min": 656
},
{
"epoch": 5.367867867867868,
"grad_norm": 0.5557346424426345,
"learning_rate": 6.279606362551016e-06,
"loss": 0.2101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1880781054496765,
"step": 3575,
"valid_targets_mean": 4198.0,
"valid_targets_min": 456
},
{
"epoch": 5.375375375375375,
"grad_norm": 0.4806991447402713,
"learning_rate": 6.225214729473794e-06,
"loss": 0.2637,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22571183741092682,
"step": 3580,
"valid_targets_mean": 5347.3,
"valid_targets_min": 652
},
{
"epoch": 5.382882882882883,
"grad_norm": 0.6189915178471305,
"learning_rate": 6.171016231027418e-06,
"loss": 0.2266,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22540658712387085,
"step": 3585,
"valid_targets_mean": 3396.4,
"valid_targets_min": 619
},
{
"epoch": 5.39039039039039,
"grad_norm": 0.4781145702083429,
"learning_rate": 6.117011627122617e-06,
"loss": 0.2178,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22122199833393097,
"step": 3590,
"valid_targets_mean": 5498.2,
"valid_targets_min": 407
},
{
"epoch": 5.397897897897898,
"grad_norm": 0.501236643073855,
"learning_rate": 6.063201674951535e-06,
"loss": 0.2113,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19432801008224487,
"step": 3595,
"valid_targets_mean": 4399.0,
"valid_targets_min": 748
},
{
"epoch": 5.405405405405405,
"grad_norm": 0.5083333895430631,
"learning_rate": 6.009587128977128e-06,
"loss": 0.1969,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21600385010242462,
"step": 3600,
"valid_targets_mean": 4527.8,
"valid_targets_min": 441
},
{
"epoch": 5.412912912912913,
"grad_norm": 0.43801311222355105,
"learning_rate": 5.956168740922592e-06,
"loss": 0.2232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17686530947685242,
"step": 3605,
"valid_targets_mean": 5968.8,
"valid_targets_min": 650
},
{
"epoch": 5.42042042042042,
"grad_norm": 0.5142170347253675,
"learning_rate": 5.902947259760805e-06,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16562317311763763,
"step": 3610,
"valid_targets_mean": 4170.2,
"valid_targets_min": 562
},
{
"epoch": 5.427927927927928,
"grad_norm": 0.57494822664475,
"learning_rate": 5.84992343170385e-06,
"loss": 0.2344,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19728896021842957,
"step": 3615,
"valid_targets_mean": 3665.9,
"valid_targets_min": 602
},
{
"epoch": 5.435435435435435,
"grad_norm": 0.6682604390565138,
"learning_rate": 5.797098000192527e-06,
"loss": 0.194,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18809694051742554,
"step": 3620,
"valid_targets_mean": 5038.7,
"valid_targets_min": 709
},
{
"epoch": 5.442942942942943,
"grad_norm": 0.5420242165199347,
"learning_rate": 5.744471705885946e-06,
"loss": 0.2203,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19964119791984558,
"step": 3625,
"valid_targets_mean": 4113.4,
"valid_targets_min": 400
},
{
"epoch": 5.45045045045045,
"grad_norm": 0.4897694331671357,
"learning_rate": 5.692045286651145e-06,
"loss": 0.2233,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21164345741271973,
"step": 3630,
"valid_targets_mean": 5133.8,
"valid_targets_min": 842
},
{
"epoch": 5.457957957957958,
"grad_norm": 0.5130796784439051,
"learning_rate": 5.6398194775527305e-06,
"loss": 0.2175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1640782356262207,
"step": 3635,
"valid_targets_mean": 4620.8,
"valid_targets_min": 957
},
{
"epoch": 5.465465465465465,
"grad_norm": 0.7096256538606244,
"learning_rate": 5.587795010842578e-06,
"loss": 0.2188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.229142963886261,
"step": 3640,
"valid_targets_mean": 3584.5,
"valid_targets_min": 291
},
{
"epoch": 5.472972972972973,
"grad_norm": 0.45320281126185963,
"learning_rate": 5.535972615949565e-06,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15912821888923645,
"step": 3645,
"valid_targets_mean": 6046.6,
"valid_targets_min": 565
},
{
"epoch": 5.48048048048048,
"grad_norm": 0.6580766138686164,
"learning_rate": 5.484353019469344e-06,
"loss": 0.2385,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24230948090553284,
"step": 3650,
"valid_targets_mean": 3922.4,
"valid_targets_min": 618
},
{
"epoch": 5.487987987987988,
"grad_norm": 0.560301246319454,
"learning_rate": 5.432936945154159e-06,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18417420983314514,
"step": 3655,
"valid_targets_mean": 4271.6,
"valid_targets_min": 590
},
{
"epoch": 5.495495495495495,
"grad_norm": 0.6206056063840636,
"learning_rate": 5.381725113902689e-06,
"loss": 0.1936,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17472167313098907,
"step": 3660,
"valid_targets_mean": 3848.2,
"valid_targets_min": 581
},
{
"epoch": 5.503003003003003,
"grad_norm": 0.4966662168616601,
"learning_rate": 5.330718243749942e-06,
"loss": 0.1978,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.191782146692276,
"step": 3665,
"valid_targets_mean": 4883.6,
"valid_targets_min": 648
},
{
"epoch": 5.51051051051051,
"grad_norm": 0.5471645413638431,
"learning_rate": 5.279917049857209e-06,
"loss": 0.1937,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17728394269943237,
"step": 3670,
"valid_targets_mean": 3883.9,
"valid_targets_min": 531
},
{
"epoch": 5.518018018018018,
"grad_norm": 0.49020284035840306,
"learning_rate": 5.229322244501996e-06,
"loss": 0.1986,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2151007056236267,
"step": 3675,
"valid_targets_mean": 5625.6,
"valid_targets_min": 710
},
{
"epoch": 5.525525525525525,
"grad_norm": 0.502623769306998,
"learning_rate": 5.1789345370680726e-06,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18778328597545624,
"step": 3680,
"valid_targets_mean": 5465.0,
"valid_targets_min": 604
},
{
"epoch": 5.533033033033033,
"grad_norm": 0.6082538279267172,
"learning_rate": 5.128754634035509e-06,
"loss": 0.2006,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2307537943124771,
"step": 3685,
"valid_targets_mean": 3897.9,
"valid_targets_min": 475
},
{
"epoch": 5.54054054054054,
"grad_norm": 0.4677087975060976,
"learning_rate": 5.078783238970775e-06,
"loss": 0.1746,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1452668309211731,
"step": 3690,
"valid_targets_mean": 4697.0,
"valid_targets_min": 820
},
{
"epoch": 5.548048048048048,
"grad_norm": 0.5258809236597033,
"learning_rate": 5.029021052516874e-06,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1686006635427475,
"step": 3695,
"valid_targets_mean": 5070.6,
"valid_targets_min": 874
},
{
"epoch": 5.555555555555555,
"grad_norm": 0.5418543854859791,
"learning_rate": 4.979468772383525e-06,
"loss": 0.2528,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23895879089832306,
"step": 3700,
"valid_targets_mean": 4703.9,
"valid_targets_min": 799
},
{
"epoch": 5.563063063063063,
"grad_norm": 0.5580957987554833,
"learning_rate": 4.93012709333736e-06,
"loss": 0.2182,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18779677152633667,
"step": 3705,
"valid_targets_mean": 3780.4,
"valid_targets_min": 700
},
{
"epoch": 5.57057057057057,
"grad_norm": 0.5796418427811311,
"learning_rate": 4.880996707192227e-06,
"loss": 0.2076,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18160055577754974,
"step": 3710,
"valid_targets_mean": 3617.5,
"valid_targets_min": 691
},
{
"epoch": 5.578078078078078,
"grad_norm": 0.625613489620117,
"learning_rate": 4.832078302799437e-06,
"loss": 0.231,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2596314549446106,
"step": 3715,
"valid_targets_mean": 4067.5,
"valid_targets_min": 928
},
{
"epoch": 5.585585585585585,
"grad_norm": 0.4752383217997911,
"learning_rate": 4.7833725660381356e-06,
"loss": 0.21,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15992337465286255,
"step": 3720,
"valid_targets_mean": 4770.9,
"valid_targets_min": 761
},
{
"epoch": 5.593093093093093,
"grad_norm": 0.5779722936684374,
"learning_rate": 4.734880179805685e-06,
"loss": 0.2091,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18457244336605072,
"step": 3725,
"valid_targets_mean": 3342.9,
"valid_targets_min": 691
},
{
"epoch": 5.6006006006006,
"grad_norm": 0.550075630002128,
"learning_rate": 4.686601824008079e-06,
"loss": 0.2177,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18044841289520264,
"step": 3730,
"valid_targets_mean": 4945.1,
"valid_targets_min": 906
},
{
"epoch": 5.608108108108108,
"grad_norm": 0.631353153629254,
"learning_rate": 4.638538175550422e-06,
"loss": 0.195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21107108891010284,
"step": 3735,
"valid_targets_mean": 3289.5,
"valid_targets_min": 552
},
{
"epoch": 5.615615615615615,
"grad_norm": 0.7558092942754301,
"learning_rate": 4.590689908327428e-06,
"loss": 0.2214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20774057507514954,
"step": 3740,
"valid_targets_mean": 2326.2,
"valid_targets_min": 684
},
{
"epoch": 5.623123123123123,
"grad_norm": 0.6050928606517935,
"learning_rate": 4.543057693213973e-06,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.230237677693367,
"step": 3745,
"valid_targets_mean": 3875.2,
"valid_targets_min": 504
},
{
"epoch": 5.63063063063063,
"grad_norm": 0.5844617202863044,
"learning_rate": 4.495642198055707e-06,
"loss": 0.2215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2029937505722046,
"step": 3750,
"valid_targets_mean": 4027.4,
"valid_targets_min": 536
},
{
"epoch": 5.638138138138138,
"grad_norm": 0.7169568097777915,
"learning_rate": 4.4484440876596625e-06,
"loss": 0.2364,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22157275676727295,
"step": 3755,
"valid_targets_mean": 2619.1,
"valid_targets_min": 657
},
{
"epoch": 5.645645645645645,
"grad_norm": 0.5563696214524937,
"learning_rate": 4.401464023784945e-06,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1895512342453003,
"step": 3760,
"valid_targets_mean": 4033.1,
"valid_targets_min": 639
},
{
"epoch": 5.653153153153153,
"grad_norm": 0.7184497569373026,
"learning_rate": 4.354702665133457e-06,
"loss": 0.2035,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17378777265548706,
"step": 3765,
"valid_targets_mean": 4711.1,
"valid_targets_min": 460
},
{
"epoch": 5.66066066066066,
"grad_norm": 0.672562372546706,
"learning_rate": 4.308160667340671e-06,
"loss": 0.22,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23928751051425934,
"step": 3770,
"valid_targets_mean": 2964.8,
"valid_targets_min": 402
},
{
"epoch": 5.668168168168168,
"grad_norm": 0.4887664405970491,
"learning_rate": 4.261838682966413e-06,
"loss": 0.2001,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19159993529319763,
"step": 3775,
"valid_targets_mean": 5129.8,
"valid_targets_min": 752
},
{
"epoch": 5.675675675675675,
"grad_norm": 0.5457059516129726,
"learning_rate": 4.215737361485737e-06,
"loss": 0.2193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21986320614814758,
"step": 3780,
"valid_targets_mean": 5641.1,
"valid_targets_min": 915
},
{
"epoch": 5.683183183183183,
"grad_norm": 0.5115604631418055,
"learning_rate": 4.1698573492798e-06,
"loss": 0.198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1333058923482895,
"step": 3785,
"valid_targets_mean": 3278.0,
"valid_targets_min": 647
},
{
"epoch": 5.6906906906906904,
"grad_norm": 0.7200821505353998,
"learning_rate": 4.124199289626818e-06,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22922024130821228,
"step": 3790,
"valid_targets_mean": 2683.2,
"valid_targets_min": 625
},
{
"epoch": 5.698198198198198,
"grad_norm": 0.42145237729701907,
"learning_rate": 4.078763822693021e-06,
"loss": 0.206,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18455691635608673,
"step": 3795,
"valid_targets_mean": 6690.8,
"valid_targets_min": 920
},
{
"epoch": 5.7057057057057055,
"grad_norm": 0.5325975126541347,
"learning_rate": 4.033551585523716e-06,
"loss": 0.2049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19546617567539215,
"step": 3800,
"valid_targets_mean": 5228.1,
"valid_targets_min": 594
},
{
"epoch": 5.713213213213213,
"grad_norm": 0.6601846614023362,
"learning_rate": 3.988563212034315e-06,
"loss": 0.2511,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15158836543560028,
"step": 3805,
"valid_targets_mean": 3667.6,
"valid_targets_min": 358
},
{
"epoch": 5.7207207207207205,
"grad_norm": 0.6027115950409477,
"learning_rate": 3.943799333001466e-06,
"loss": 0.2164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19812247157096863,
"step": 3810,
"valid_targets_mean": 3187.2,
"valid_targets_min": 542
},
{
"epoch": 5.728228228228228,
"grad_norm": 0.7999468435844861,
"learning_rate": 3.899260576054209e-06,
"loss": 0.2164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24161022901535034,
"step": 3815,
"valid_targets_mean": 2608.4,
"valid_targets_min": 416
},
{
"epoch": 5.7357357357357355,
"grad_norm": 0.6197457192371475,
"learning_rate": 3.854947565665172e-06,
"loss": 0.2337,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20346400141716003,
"step": 3820,
"valid_targets_mean": 3887.9,
"valid_targets_min": 641
},
{
"epoch": 5.743243243243243,
"grad_norm": 0.5811299922570492,
"learning_rate": 3.810860923141824e-06,
"loss": 0.2173,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2590106129646301,
"step": 3825,
"valid_targets_mean": 4175.2,
"valid_targets_min": 750
},
{
"epoch": 5.7507507507507505,
"grad_norm": 0.6108735444142156,
"learning_rate": 3.767001266617747e-06,
"loss": 0.2198,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21409021317958832,
"step": 3830,
"valid_targets_mean": 3856.4,
"valid_targets_min": 504
},
{
"epoch": 5.758258258258258,
"grad_norm": 0.5427297235952976,
"learning_rate": 3.7233692110439814e-06,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20367692410945892,
"step": 3835,
"valid_targets_mean": 4545.9,
"valid_targets_min": 666
},
{
"epoch": 5.7657657657657655,
"grad_norm": 0.4682965132065941,
"learning_rate": 3.679965368180416e-06,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1938939094543457,
"step": 3840,
"valid_targets_mean": 5888.4,
"valid_targets_min": 915
},
{
"epoch": 5.773273273273273,
"grad_norm": 0.5399446918848115,
"learning_rate": 3.6367903465871755e-06,
"loss": 0.2268,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24548377096652985,
"step": 3845,
"valid_targets_mean": 5109.5,
"valid_targets_min": 602
},
{
"epoch": 5.7807807807807805,
"grad_norm": 0.4864834575204545,
"learning_rate": 3.59384475161612e-06,
"loss": 0.2163,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21027377247810364,
"step": 3850,
"valid_targets_mean": 4894.0,
"valid_targets_min": 636
},
{
"epoch": 5.788288288288288,
"grad_norm": 0.5438912695013488,
"learning_rate": 3.5511291854023466e-06,
"loss": 0.2059,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23461908102035522,
"step": 3855,
"valid_targets_mean": 4590.5,
"valid_targets_min": 666
},
{
"epoch": 5.7957957957957955,
"grad_norm": 0.5232434234880898,
"learning_rate": 3.508644246855739e-06,
"loss": 0.2097,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20156699419021606,
"step": 3860,
"valid_targets_mean": 4557.0,
"valid_targets_min": 694
},
{
"epoch": 5.803303303303303,
"grad_norm": 0.5868070563906084,
"learning_rate": 3.466390531652588e-06,
"loss": 0.2079,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19073697924613953,
"step": 3865,
"valid_targets_mean": 4407.1,
"valid_targets_min": 259
},
{
"epoch": 5.8108108108108105,
"grad_norm": 0.5169034481605863,
"learning_rate": 3.4243686322272195e-06,
"loss": 0.2133,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2452038675546646,
"step": 3870,
"valid_targets_mean": 5199.6,
"valid_targets_min": 564
},
{
"epoch": 5.818318318318318,
"grad_norm": 0.5384261747880087,
"learning_rate": 3.3825791377636998e-06,
"loss": 0.1954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2101140320301056,
"step": 3875,
"valid_targets_mean": 4844.0,
"valid_targets_min": 427
},
{
"epoch": 5.8258258258258255,
"grad_norm": 0.7881322308404421,
"learning_rate": 3.341022634187585e-06,
"loss": 0.2041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23327091336250305,
"step": 3880,
"valid_targets_mean": 3447.8,
"valid_targets_min": 485
},
{
"epoch": 5.833333333333333,
"grad_norm": 0.5514296552758701,
"learning_rate": 3.2996997041576795e-06,
"loss": 0.2105,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20250976085662842,
"step": 3885,
"valid_targets_mean": 4440.7,
"valid_targets_min": 434
},
{
"epoch": 5.8408408408408405,
"grad_norm": 0.651802460092001,
"learning_rate": 3.2586109270578836e-06,
"loss": 0.193,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2257906049489975,
"step": 3890,
"valid_targets_mean": 4516.6,
"valid_targets_min": 623
},
{
"epoch": 5.848348348348348,
"grad_norm": 0.5643346645467794,
"learning_rate": 3.217756878989069e-06,
"loss": 0.2237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22649335861206055,
"step": 3895,
"valid_targets_mean": 4361.2,
"valid_targets_min": 764
},
{
"epoch": 5.8558558558558556,
"grad_norm": 0.6943626771374626,
"learning_rate": 3.1771381327609997e-06,
"loss": 0.2263,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23687607049942017,
"step": 3900,
"valid_targets_mean": 3878.1,
"valid_targets_min": 391
},
{
"epoch": 5.863363363363363,
"grad_norm": 0.5703396214687839,
"learning_rate": 3.1367552578842986e-06,
"loss": 0.1972,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22399486601352692,
"step": 3905,
"valid_targets_mean": 4644.7,
"valid_targets_min": 439
},
{
"epoch": 5.870870870870871,
"grad_norm": 3.5482019538966396,
"learning_rate": 3.096608820562468e-06,
"loss": 0.1959,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14243656396865845,
"step": 3910,
"valid_targets_mean": 3601.3,
"valid_targets_min": 723
},
{
"epoch": 5.878378378378378,
"grad_norm": 0.6997352643905546,
"learning_rate": 3.0566993836839387e-06,
"loss": 0.2354,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22578692436218262,
"step": 3915,
"valid_targets_mean": 2871.8,
"valid_targets_min": 481
},
{
"epoch": 5.885885885885886,
"grad_norm": 0.61982038677274,
"learning_rate": 3.017027506814203e-06,
"loss": 0.2138,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.212412029504776,
"step": 3920,
"valid_targets_mean": 3693.6,
"valid_targets_min": 641
},
{
"epoch": 5.893393393393393,
"grad_norm": 0.502898749801898,
"learning_rate": 2.9775937461879368e-06,
"loss": 0.2034,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18976537883281708,
"step": 3925,
"valid_targets_mean": 5294.2,
"valid_targets_min": 649
},
{
"epoch": 5.900900900900901,
"grad_norm": 0.705380106461315,
"learning_rate": 2.9383986547012222e-06,
"loss": 0.2052,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21276956796646118,
"step": 3930,
"valid_targets_mean": 2696.2,
"valid_targets_min": 569
},
{
"epoch": 5.908408408408408,
"grad_norm": 0.6824495687596949,
"learning_rate": 2.8994427819037873e-06,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27314475178718567,
"step": 3935,
"valid_targets_mean": 5253.1,
"valid_targets_min": 879
},
{
"epoch": 5.915915915915916,
"grad_norm": 0.6133652704497186,
"learning_rate": 2.8607266739913077e-06,
"loss": 0.2078,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24844960868358612,
"step": 3940,
"valid_targets_mean": 4655.8,
"valid_targets_min": 819
},
{
"epoch": 5.923423423423423,
"grad_norm": 0.5714988842182993,
"learning_rate": 2.822250873797743e-06,
"loss": 0.226,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19975441694259644,
"step": 3945,
"valid_targets_mean": 4395.9,
"valid_targets_min": 726
},
{
"epoch": 5.930930930930931,
"grad_norm": 0.8230004411475231,
"learning_rate": 2.784015920787719e-06,
"loss": 0.2254,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3142227828502655,
"step": 3950,
"valid_targets_mean": 4321.6,
"valid_targets_min": 853
},
{
"epoch": 5.938438438438438,
"grad_norm": 0.572231017896013,
"learning_rate": 2.746022351048978e-06,
"loss": 0.2267,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2292689085006714,
"step": 3955,
"valid_targets_mean": 4084.4,
"valid_targets_min": 615
},
{
"epoch": 5.945945945945946,
"grad_norm": 0.8188722407870543,
"learning_rate": 2.708270697284865e-06,
"loss": 0.2123,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24927443265914917,
"step": 3960,
"valid_targets_mean": 3767.1,
"valid_targets_min": 686
},
{
"epoch": 5.953453453453453,
"grad_norm": 0.5185251151107919,
"learning_rate": 2.6707614888068365e-06,
"loss": 0.209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19668208062648773,
"step": 3965,
"valid_targets_mean": 4310.9,
"valid_targets_min": 423
},
{
"epoch": 5.960960960960961,
"grad_norm": 0.5542673950873109,
"learning_rate": 2.633495251527054e-06,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24870452284812927,
"step": 3970,
"valid_targets_mean": 5467.7,
"valid_targets_min": 973
},
{
"epoch": 5.968468468468468,
"grad_norm": 0.6048295638583769,
"learning_rate": 2.5964725079510134e-06,
"loss": 0.2045,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17934688925743103,
"step": 3975,
"valid_targets_mean": 3691.8,
"valid_targets_min": 715
},
{
"epoch": 5.975975975975976,
"grad_norm": 0.5714679755869654,
"learning_rate": 2.5596937771702113e-06,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18001726269721985,
"step": 3980,
"valid_targets_mean": 3830.1,
"valid_targets_min": 698
},
{
"epoch": 5.983483483483483,
"grad_norm": 0.5678385470019257,
"learning_rate": 2.523159574854872e-06,
"loss": 0.2096,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19507171213626862,
"step": 3985,
"valid_targets_mean": 3516.0,
"valid_targets_min": 311
},
{
"epoch": 5.990990990990991,
"grad_norm": 0.685934053595724,
"learning_rate": 2.4868704132467115e-06,
"loss": 0.2047,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2302461564540863,
"step": 3990,
"valid_targets_mean": 2869.4,
"valid_targets_min": 584
},
{
"epoch": 5.998498498498498,
"grad_norm": 0.6065925509118129,
"learning_rate": 2.45082680115176e-06,
"loss": 0.2199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19993174076080322,
"step": 3995,
"valid_targets_mean": 3674.2,
"valid_targets_min": 414
},
{
"epoch": 6.006006006006006,
"grad_norm": 0.4490328583511514,
"learning_rate": 2.4150292439332355e-06,
"loss": 0.1979,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19256381690502167,
"step": 4000,
"valid_targets_mean": 5463.9,
"valid_targets_min": 623
},
{
"epoch": 6.013513513513513,
"grad_norm": 0.5503944239111109,
"learning_rate": 2.3794782435044384e-06,
"loss": 0.1788,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17218606173992157,
"step": 4005,
"valid_targets_mean": 3465.8,
"valid_targets_min": 930
},
{
"epoch": 6.021021021021021,
"grad_norm": 0.5533090724442471,
"learning_rate": 2.344174298321733e-06,
"loss": 0.2125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.213973268866539,
"step": 4010,
"valid_targets_mean": 4543.8,
"valid_targets_min": 570
},
{
"epoch": 6.028528528528528,
"grad_norm": 0.6792685607327363,
"learning_rate": 2.3091179033775445e-06,
"loss": 0.2038,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2688198983669281,
"step": 4015,
"valid_targets_mean": 3235.7,
"valid_targets_min": 605
},
{
"epoch": 6.036036036036036,
"grad_norm": 0.46026148213907403,
"learning_rate": 2.27430955019343e-06,
"loss": 0.2157,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1564239263534546,
"step": 4020,
"valid_targets_mean": 5029.9,
"valid_targets_min": 1069
},
{
"epoch": 6.043543543543543,
"grad_norm": 0.5322076051668858,
"learning_rate": 2.239749726813183e-06,
"loss": 0.2239,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19674474000930786,
"step": 4025,
"valid_targets_mean": 4798.2,
"valid_targets_min": 478
},
{
"epoch": 6.051051051051051,
"grad_norm": 0.5891185848467975,
"learning_rate": 2.20543891779599e-06,
"loss": 0.199,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18149876594543457,
"step": 4030,
"valid_targets_mean": 4520.9,
"valid_targets_min": 648
},
{
"epoch": 6.058558558558558,
"grad_norm": 0.6755239064217278,
"learning_rate": 2.1713776042096302e-06,
"loss": 0.2046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2210536003112793,
"step": 4035,
"valid_targets_mean": 3545.1,
"valid_targets_min": 665
},
{
"epoch": 6.066066066066066,
"grad_norm": 0.6088360110015828,
"learning_rate": 2.1375662636237493e-06,
"loss": 0.1992,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22115203738212585,
"step": 4040,
"valid_targets_mean": 5270.9,
"valid_targets_min": 656
},
{
"epoch": 6.073573573573573,
"grad_norm": 0.5822383908375098,
"learning_rate": 2.1040053701031414e-06,
"loss": 0.2067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21398739516735077,
"step": 4045,
"valid_targets_mean": 4107.5,
"valid_targets_min": 483
},
{
"epoch": 6.081081081081081,
"grad_norm": 0.6863357601545187,
"learning_rate": 2.0706953942011165e-06,
"loss": 0.2227,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21303421258926392,
"step": 4050,
"valid_targets_mean": 3397.6,
"valid_targets_min": 691
},
{
"epoch": 6.088588588588588,
"grad_norm": 0.6835718993938039,
"learning_rate": 2.0376368029528935e-06,
"loss": 0.2104,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2734207510948181,
"step": 4055,
"valid_targets_mean": 3650.6,
"valid_targets_min": 652
},
{
"epoch": 6.096096096096096,
"grad_norm": 0.45120552286100196,
"learning_rate": 2.0048300598690627e-06,
"loss": 0.2164,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.25283950567245483,
"step": 4060,
"valid_targets_mean": 7365.3,
"valid_targets_min": 993
},
{
"epoch": 6.103603603603603,
"grad_norm": 0.63959559159808,
"learning_rate": 1.9722756249290785e-06,
"loss": 0.2116,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2537308633327484,
"step": 4065,
"valid_targets_mean": 4346.6,
"valid_targets_min": 668
},
{
"epoch": 6.111111111111111,
"grad_norm": 0.6496824147481889,
"learning_rate": 1.939973954574812e-06,
"loss": 0.175,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15889085829257965,
"step": 4070,
"valid_targets_mean": 3991.0,
"valid_targets_min": 738
},
{
"epoch": 6.118618618618618,
"grad_norm": 0.5705409403401243,
"learning_rate": 1.9079255017041487e-06,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17797492444515228,
"step": 4075,
"valid_targets_mean": 4241.4,
"valid_targets_min": 618
},
{
"epoch": 6.126126126126126,
"grad_norm": 0.4815875979801429,
"learning_rate": 1.8761307156646547e-06,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15079014003276825,
"step": 4080,
"valid_targets_mean": 4996.1,
"valid_targets_min": 513
},
{
"epoch": 6.133633633633633,
"grad_norm": 0.5146233292308801,
"learning_rate": 1.8445900422472495e-06,
"loss": 0.2046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18511003255844116,
"step": 4085,
"valid_targets_mean": 4634.7,
"valid_targets_min": 685
},
{
"epoch": 6.141141141141141,
"grad_norm": 0.5624700118014101,
"learning_rate": 1.8133039236799788e-06,
"loss": 0.2067,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2083277553319931,
"step": 4090,
"valid_targets_mean": 4171.3,
"valid_targets_min": 511
},
{
"epoch": 6.148648648648648,
"grad_norm": 0.7177782923244695,
"learning_rate": 1.7822727986217957e-06,
"loss": 0.2237,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18404030799865723,
"step": 4095,
"valid_targets_mean": 2409.4,
"valid_targets_min": 593
},
{
"epoch": 6.156156156156156,
"grad_norm": 0.5228873362141804,
"learning_rate": 1.7514971021564275e-06,
"loss": 0.2147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1940818727016449,
"step": 4100,
"valid_targets_mean": 4779.9,
"valid_targets_min": 511
},
{
"epoch": 6.163663663663663,
"grad_norm": 0.4487406897661156,
"learning_rate": 1.7209772657862657e-06,
"loss": 0.1958,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1845383495092392,
"step": 4105,
"valid_targets_mean": 6135.4,
"valid_targets_min": 515
},
{
"epoch": 6.171171171171171,
"grad_norm": 0.5106337969240039,
"learning_rate": 1.6907137174263156e-06,
"loss": 0.2004,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17622476816177368,
"step": 4110,
"valid_targets_mean": 4512.0,
"valid_targets_min": 463
},
{
"epoch": 6.178678678678678,
"grad_norm": 0.6441468445611757,
"learning_rate": 1.6607068813981952e-06,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2345384955406189,
"step": 4115,
"valid_targets_mean": 3844.5,
"valid_targets_min": 471
},
{
"epoch": 6.186186186186186,
"grad_norm": 0.5581311436354888,
"learning_rate": 1.6309571784242062e-06,
"loss": 0.2017,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17409540712833405,
"step": 4120,
"valid_targets_mean": 4888.1,
"valid_targets_min": 645
},
{
"epoch": 6.193693693693693,
"grad_norm": 0.5762764403446647,
"learning_rate": 1.601465025621398e-06,
"loss": 0.2212,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22839732468128204,
"step": 4125,
"valid_targets_mean": 4442.8,
"valid_targets_min": 669
},
{
"epoch": 6.201201201201201,
"grad_norm": 0.488635665892412,
"learning_rate": 1.5722308364957517e-06,
"loss": 0.1868,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19067010283470154,
"step": 4130,
"valid_targets_mean": 5109.4,
"valid_targets_min": 606
},
{
"epoch": 6.208708708708708,
"grad_norm": 0.5702695176534012,
"learning_rate": 1.5432550209363606e-06,
"loss": 0.2119,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19797605276107788,
"step": 4135,
"valid_targets_mean": 4942.1,
"valid_targets_min": 694
},
{
"epoch": 6.216216216216216,
"grad_norm": 0.5547765610808129,
"learning_rate": 1.5145379852097054e-06,
"loss": 0.1995,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21563218533992767,
"step": 4140,
"valid_targets_mean": 4537.9,
"valid_targets_min": 498
},
{
"epoch": 6.223723723723724,
"grad_norm": 0.6133297188420032,
"learning_rate": 1.4860801319539354e-06,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2022094428539276,
"step": 4145,
"valid_targets_mean": 3766.9,
"valid_targets_min": 602
},
{
"epoch": 6.231231231231231,
"grad_norm": 0.5500242111051548,
"learning_rate": 1.457881860173236e-06,
"loss": 0.1928,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14841407537460327,
"step": 4150,
"valid_targets_mean": 3554.3,
"valid_targets_min": 628
},
{
"epoch": 6.238738738738739,
"grad_norm": 0.6493235742255749,
"learning_rate": 1.429943565232228e-06,
"loss": 0.2165,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29499688744544983,
"step": 4155,
"valid_targets_mean": 4105.4,
"valid_targets_min": 391
},
{
"epoch": 6.246246246246246,
"grad_norm": 0.46401350568259536,
"learning_rate": 1.4022656388504418e-06,
"loss": 0.2026,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1871238350868225,
"step": 4160,
"valid_targets_mean": 5385.7,
"valid_targets_min": 467
},
{
"epoch": 6.253753753753754,
"grad_norm": 0.5751734802750025,
"learning_rate": 1.3748484690967967e-06,
"loss": 0.1754,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17546819150447845,
"step": 4165,
"valid_targets_mean": 4171.8,
"valid_targets_min": 564
},
{
"epoch": 6.261261261261261,
"grad_norm": 0.824863745151526,
"learning_rate": 1.3476924403841762e-06,
"loss": 0.2352,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21639591455459595,
"step": 4170,
"valid_targets_mean": 2713.2,
"valid_targets_min": 473
},
{
"epoch": 6.268768768768769,
"grad_norm": 0.570544358689332,
"learning_rate": 1.3207979334640419e-06,
"loss": 0.2095,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20927639305591583,
"step": 4175,
"valid_targets_mean": 4503.6,
"valid_targets_min": 774
},
{
"epoch": 6.276276276276276,
"grad_norm": 0.5313264329238784,
"learning_rate": 1.294165325421084e-06,
"loss": 0.2398,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.29111388325691223,
"step": 4180,
"valid_targets_mean": 5414.2,
"valid_targets_min": 731
},
{
"epoch": 6.283783783783784,
"grad_norm": 0.5675843811457961,
"learning_rate": 1.2677949896679408e-06,
"loss": 0.2117,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20922914147377014,
"step": 4185,
"valid_targets_mean": 4288.4,
"valid_targets_min": 434
},
{
"epoch": 6.291291291291291,
"grad_norm": 0.5380343131647501,
"learning_rate": 1.241687295939966e-06,
"loss": 0.1725,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14380943775177002,
"step": 4190,
"valid_targets_mean": 4689.5,
"valid_targets_min": 367
},
{
"epoch": 6.298798798798799,
"grad_norm": 0.5899919262888533,
"learning_rate": 1.2158426102900345e-06,
"loss": 0.189,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19863969087600708,
"step": 4195,
"valid_targets_mean": 4058.4,
"valid_targets_min": 727
},
{
"epoch": 6.306306306306306,
"grad_norm": 0.5264653142973713,
"learning_rate": 1.1902612950834213e-06,
"loss": 0.2007,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.197919100522995,
"step": 4200,
"valid_targets_mean": 4504.0,
"valid_targets_min": 727
},
{
"epoch": 6.313813813813814,
"grad_norm": 0.5816807471532681,
"learning_rate": 1.164943708992714e-06,
"loss": 0.1954,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19351375102996826,
"step": 4205,
"valid_targets_mean": 3772.9,
"valid_targets_min": 725
},
{
"epoch": 6.321321321321321,
"grad_norm": 0.6196400182011077,
"learning_rate": 1.1398902069927842e-06,
"loss": 0.232,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3165440261363983,
"step": 4210,
"valid_targets_mean": 4516.8,
"valid_targets_min": 374
},
{
"epoch": 6.328828828828829,
"grad_norm": 0.5403053431375547,
"learning_rate": 1.115101140355812e-06,
"loss": 0.2077,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20008732378482819,
"step": 4215,
"valid_targets_mean": 4993.6,
"valid_targets_min": 667
},
{
"epoch": 6.336336336336337,
"grad_norm": 0.5311224743152807,
"learning_rate": 1.0905768566463593e-06,
"loss": 0.2158,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2345670610666275,
"step": 4220,
"valid_targets_mean": 5031.6,
"valid_targets_min": 559
},
{
"epoch": 6.343843843843844,
"grad_norm": 0.7193489501948159,
"learning_rate": 1.0663176997165037e-06,
"loss": 0.2083,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18373778462409973,
"step": 4225,
"valid_targets_mean": 2563.9,
"valid_targets_min": 614
},
{
"epoch": 6.351351351351352,
"grad_norm": 0.6194973179199644,
"learning_rate": 1.0423240097010056e-06,
"loss": 0.1904,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17724689841270447,
"step": 4230,
"valid_targets_mean": 2932.5,
"valid_targets_min": 550
},
{
"epoch": 6.358858858858859,
"grad_norm": 0.5938101431895507,
"learning_rate": 1.018596123012545e-06,
"loss": 0.2014,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15485897660255432,
"step": 4235,
"valid_targets_mean": 3859.1,
"valid_targets_min": 565
},
{
"epoch": 6.366366366366367,
"grad_norm": 0.5832105338347596,
"learning_rate": 9.951343723370145e-07,
"loss": 0.2217,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.27296674251556396,
"step": 4240,
"valid_targets_mean": 4697.3,
"valid_targets_min": 651
},
{
"epoch": 6.373873873873874,
"grad_norm": 0.6257938479877299,
"learning_rate": 9.719390866288325e-07,
"loss": 0.2018,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21452078223228455,
"step": 4245,
"valid_targets_mean": 3980.8,
"valid_targets_min": 644
},
{
"epoch": 6.381381381381382,
"grad_norm": 0.4748467821348681,
"learning_rate": 9.490105911063519e-07,
"loss": 0.1984,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19311422109603882,
"step": 4250,
"valid_targets_mean": 4970.2,
"valid_targets_min": 958
},
{
"epoch": 6.388888888888889,
"grad_norm": 0.49848343014176094,
"learning_rate": 9.263492072472879e-07,
"loss": 0.2041,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20664718747138977,
"step": 4255,
"valid_targets_mean": 5091.6,
"valid_targets_min": 530
},
{
"epoch": 6.396396396396397,
"grad_norm": 0.4839998287321489,
"learning_rate": 9.039552527842188e-07,
"loss": 0.1931,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15590183436870575,
"step": 4260,
"valid_targets_mean": 4334.7,
"valid_targets_min": 755
},
{
"epoch": 6.403903903903904,
"grad_norm": 0.47675581127591066,
"learning_rate": 8.818290417001218e-07,
"loss": 0.1877,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18418073654174805,
"step": 4265,
"valid_targets_mean": 5461.1,
"valid_targets_min": 875
},
{
"epoch": 6.411411411411412,
"grad_norm": 0.5148421630943572,
"learning_rate": 8.599708842239795e-07,
"loss": 0.2056,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1673521250486374,
"step": 4270,
"valid_targets_mean": 5613.2,
"valid_targets_min": 791
},
{
"epoch": 6.418918918918919,
"grad_norm": 0.6034041442260967,
"learning_rate": 8.383810868264253e-07,
"loss": 0.2101,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2042214274406433,
"step": 4275,
"valid_targets_mean": 4745.4,
"valid_targets_min": 521
},
{
"epoch": 6.426426426426427,
"grad_norm": 0.44620270158602615,
"learning_rate": 8.17059952215451e-07,
"loss": 0.1892,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14886009693145752,
"step": 4280,
"valid_targets_mean": 5529.8,
"valid_targets_min": 1189
},
{
"epoch": 6.433933933933934,
"grad_norm": 0.5070235125913082,
"learning_rate": 7.960077793321552e-07,
"loss": 0.1769,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19193494319915771,
"step": 4285,
"valid_targets_mean": 5251.6,
"valid_targets_min": 425
},
{
"epoch": 6.441441441441442,
"grad_norm": 0.5615395471791965,
"learning_rate": 7.752248633465576e-07,
"loss": 0.215,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22860676050186157,
"step": 4290,
"valid_targets_mean": 3936.7,
"valid_targets_min": 583
},
{
"epoch": 6.448948948948949,
"grad_norm": 0.5442260146056317,
"learning_rate": 7.547114956534574e-07,
"loss": 0.1909,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1491059809923172,
"step": 4295,
"valid_targets_mean": 3889.1,
"valid_targets_min": 485
},
{
"epoch": 6.456456456456457,
"grad_norm": 0.5835357955664173,
"learning_rate": 7.344679638683527e-07,
"loss": 0.2332,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2454603910446167,
"step": 4300,
"valid_targets_mean": 5267.1,
"valid_targets_min": 578
},
{
"epoch": 6.463963963963964,
"grad_norm": 0.6370221393360167,
"learning_rate": 7.144945518234014e-07,
"loss": 0.2188,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.20245075225830078,
"step": 4305,
"valid_targets_mean": 3993.6,
"valid_targets_min": 292
},
{
"epoch": 6.471471471471472,
"grad_norm": 0.487081794320264,
"learning_rate": 6.947915395634463e-07,
"loss": 0.2125,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22089102864265442,
"step": 4310,
"valid_targets_mean": 4927.1,
"valid_targets_min": 801
},
{
"epoch": 6.478978978978979,
"grad_norm": 0.6970402670081776,
"learning_rate": 6.753592033420809e-07,
"loss": 0.1902,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19842252135276794,
"step": 4315,
"valid_targets_mean": 2896.4,
"valid_targets_min": 475
},
{
"epoch": 6.486486486486487,
"grad_norm": 0.5079593962075888,
"learning_rate": 6.561978156177939e-07,
"loss": 0.1899,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1689176708459854,
"step": 4320,
"valid_targets_mean": 4254.1,
"valid_targets_min": 861
},
{
"epoch": 6.493993993993994,
"grad_norm": 0.6574113141398381,
"learning_rate": 6.37307645050127e-07,
"loss": 0.2036,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2085978239774704,
"step": 4325,
"valid_targets_mean": 3372.8,
"valid_targets_min": 478
},
{
"epoch": 6.501501501501502,
"grad_norm": 0.508520487800978,
"learning_rate": 6.186889564959209e-07,
"loss": 0.2103,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23924149572849274,
"step": 4330,
"valid_targets_mean": 5251.2,
"valid_targets_min": 565
},
{
"epoch": 6.509009009009009,
"grad_norm": 0.6324952400411343,
"learning_rate": 6.003420110056035e-07,
"loss": 0.204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2557426691055298,
"step": 4335,
"valid_targets_mean": 4012.0,
"valid_targets_min": 503
},
{
"epoch": 6.516516516516517,
"grad_norm": 0.553904609232918,
"learning_rate": 5.822670658195173e-07,
"loss": 0.1907,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21928340196609497,
"step": 4340,
"valid_targets_mean": 4482.4,
"valid_targets_min": 462
},
{
"epoch": 6.524024024024024,
"grad_norm": 0.616465266517478,
"learning_rate": 5.644643743643308e-07,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21219468116760254,
"step": 4345,
"valid_targets_mean": 3722.6,
"valid_targets_min": 504
},
{
"epoch": 6.531531531531532,
"grad_norm": 0.7300734830816725,
"learning_rate": 5.469341862494637e-07,
"loss": 0.2046,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2306327223777771,
"step": 4350,
"valid_targets_mean": 2665.6,
"valid_targets_min": 527
},
{
"epoch": 6.539039039039039,
"grad_norm": 0.5642202986656522,
"learning_rate": 5.296767472636077e-07,
"loss": 0.1916,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1920192539691925,
"step": 4355,
"valid_targets_mean": 3940.9,
"valid_targets_min": 461
},
{
"epoch": 6.546546546546547,
"grad_norm": 0.5150972885704285,
"learning_rate": 5.12692299371269e-07,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14734071493148804,
"step": 4360,
"valid_targets_mean": 4389.3,
"valid_targets_min": 590
},
{
"epoch": 6.554054054054054,
"grad_norm": 0.6913329068038451,
"learning_rate": 4.959810807093779e-07,
"loss": 0.2347,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2543680667877197,
"step": 4365,
"valid_targets_mean": 4525.6,
"valid_targets_min": 554
},
{
"epoch": 6.561561561561562,
"grad_norm": 0.5451201542998624,
"learning_rate": 4.795433255839488e-07,
"loss": 0.2049,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21131403744220734,
"step": 4370,
"valid_targets_mean": 4360.6,
"valid_targets_min": 654
},
{
"epoch": 6.569069069069069,
"grad_norm": 0.47040078136948726,
"learning_rate": 4.633792644667967e-07,
"loss": 0.1887,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19125640392303467,
"step": 4375,
"valid_targets_mean": 5975.6,
"valid_targets_min": 1693
},
{
"epoch": 6.576576576576577,
"grad_norm": 0.5920967555082476,
"learning_rate": 4.474891239923063e-07,
"loss": 0.209,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21285581588745117,
"step": 4380,
"valid_targets_mean": 4406.5,
"valid_targets_min": 643
},
{
"epoch": 6.584084084084084,
"grad_norm": 0.7205742446023933,
"learning_rate": 4.318731269542542e-07,
"loss": 0.1867,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21254310011863708,
"step": 4385,
"valid_targets_mean": 3167.4,
"valid_targets_min": 489
},
{
"epoch": 6.591591591591592,
"grad_norm": 0.5312844013389322,
"learning_rate": 4.1653149230268087e-07,
"loss": 0.2147,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18900719285011292,
"step": 4390,
"valid_targets_mean": 4654.4,
"valid_targets_min": 479
},
{
"epoch": 6.599099099099099,
"grad_norm": 0.5723780339209558,
"learning_rate": 4.014644351408259e-07,
"loss": 0.1911,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22007179260253906,
"step": 4395,
"valid_targets_mean": 4301.8,
"valid_targets_min": 879
},
{
"epoch": 6.606606606606607,
"grad_norm": 0.5052598547107464,
"learning_rate": 3.8667216672211515e-07,
"loss": 0.2064,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17064377665519714,
"step": 4400,
"valid_targets_mean": 4867.7,
"valid_targets_min": 651
},
{
"epoch": 6.614114114114114,
"grad_norm": 0.7316891946951816,
"learning_rate": 3.7215489444718313e-07,
"loss": 0.2098,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22059103846549988,
"step": 4405,
"valid_targets_mean": 2672.8,
"valid_targets_min": 724
},
{
"epoch": 6.621621621621622,
"grad_norm": 0.6761848493284879,
"learning_rate": 3.5791282186099064e-07,
"loss": 0.2279,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23260068893432617,
"step": 4410,
"valid_targets_mean": 3445.1,
"valid_targets_min": 613
},
{
"epoch": 6.629129129129129,
"grad_norm": 0.6708523109273121,
"learning_rate": 3.439461486499451e-07,
"loss": 0.2085,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.23754608631134033,
"step": 4415,
"valid_targets_mean": 3454.1,
"valid_targets_min": 495
},
{
"epoch": 6.636636636636637,
"grad_norm": 0.5130944622824821,
"learning_rate": 3.302550706391161e-07,
"loss": 0.2022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1540905237197876,
"step": 4420,
"valid_targets_mean": 4449.4,
"valid_targets_min": 676
},
{
"epoch": 6.6441441441441444,
"grad_norm": 0.5253445851442728,
"learning_rate": 3.168397797894818e-07,
"loss": 0.2039,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19345726072788239,
"step": 4425,
"valid_targets_mean": 5712.4,
"valid_targets_min": 814
},
{
"epoch": 6.651651651651652,
"grad_norm": 0.4999642956754218,
"learning_rate": 3.03700464195249e-07,
"loss": 0.1771,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1533123254776001,
"step": 4430,
"valid_targets_mean": 4014.4,
"valid_targets_min": 448
},
{
"epoch": 6.6591591591591595,
"grad_norm": 0.6600694282993609,
"learning_rate": 2.9083730808120214e-07,
"loss": 0.252,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26119160652160645,
"step": 4435,
"valid_targets_mean": 3377.4,
"valid_targets_min": 445
},
{
"epoch": 6.666666666666667,
"grad_norm": 0.6967687532254948,
"learning_rate": 2.78250491800125e-07,
"loss": 0.2081,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1988351047039032,
"step": 4440,
"valid_targets_mean": 2430.9,
"valid_targets_min": 396
},
{
"epoch": 6.6741741741741745,
"grad_norm": 0.6534875940602458,
"learning_rate": 2.6594019183027844e-07,
"loss": 0.2099,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2011052370071411,
"step": 4445,
"valid_targets_mean": 3745.1,
"valid_targets_min": 709
},
{
"epoch": 6.681681681681682,
"grad_norm": 0.6527183652558144,
"learning_rate": 2.5390658077292017e-07,
"loss": 0.2069,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19569085538387299,
"step": 4450,
"valid_targets_mean": 3687.9,
"valid_targets_min": 539
},
{
"epoch": 6.6891891891891895,
"grad_norm": 0.8645812862940178,
"learning_rate": 2.4214982734988013e-07,
"loss": 0.2033,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.22479039430618286,
"step": 4455,
"valid_targets_mean": 2105.8,
"valid_targets_min": 704
},
{
"epoch": 6.696696696696697,
"grad_norm": 0.5255004317144049,
"learning_rate": 2.3067009640120652e-07,
"loss": 0.2365,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.26815474033355713,
"step": 4460,
"valid_targets_mean": 5218.8,
"valid_targets_min": 565
},
{
"epoch": 6.7042042042042045,
"grad_norm": 0.5916763601809271,
"learning_rate": 2.194675488828457e-07,
"loss": 0.1791,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1834341287612915,
"step": 4465,
"valid_targets_mean": 3968.9,
"valid_targets_min": 704
},
{
"epoch": 6.711711711711712,
"grad_norm": 0.614175690495789,
"learning_rate": 2.0854234186438837e-07,
"loss": 0.1942,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24795103073120117,
"step": 4470,
"valid_targets_mean": 3751.3,
"valid_targets_min": 613
},
{
"epoch": 6.7192192192192195,
"grad_norm": 0.5171279571165366,
"learning_rate": 1.9789462852686237e-07,
"loss": 0.2013,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19156940281391144,
"step": 4475,
"valid_targets_mean": 4793.4,
"valid_targets_min": 679
},
{
"epoch": 6.726726726726727,
"grad_norm": 0.5178172693023037,
"learning_rate": 1.875245581605989e-07,
"loss": 0.187,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16094420850276947,
"step": 4480,
"valid_targets_mean": 4665.6,
"valid_targets_min": 471
},
{
"epoch": 6.7342342342342345,
"grad_norm": 0.48834241533960204,
"learning_rate": 1.7743227616312308e-07,
"loss": 0.213,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16197466850280762,
"step": 4485,
"valid_targets_mean": 4962.2,
"valid_targets_min": 1052
},
{
"epoch": 6.741741741741742,
"grad_norm": 0.5234925189927083,
"learning_rate": 1.676179240371245e-07,
"loss": 0.1807,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16373220086097717,
"step": 4490,
"valid_targets_mean": 3922.8,
"valid_targets_min": 464
},
{
"epoch": 6.7492492492492495,
"grad_norm": 0.6352684311920057,
"learning_rate": 1.5808163938846986e-07,
"loss": 0.1976,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19435149431228638,
"step": 4495,
"valid_targets_mean": 3218.4,
"valid_targets_min": 478
},
{
"epoch": 6.756756756756757,
"grad_norm": 0.6229594370415693,
"learning_rate": 1.4882355592427344e-07,
"loss": 0.191,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16698959469795227,
"step": 4500,
"valid_targets_mean": 3428.0,
"valid_targets_min": 665
},
{
"epoch": 6.7642642642642645,
"grad_norm": 0.6138075392270004,
"learning_rate": 1.3984380345102966e-07,
"loss": 0.2124,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21965721249580383,
"step": 4505,
"valid_targets_mean": 3452.5,
"valid_targets_min": 408
},
{
"epoch": 6.771771771771772,
"grad_norm": 0.5674625446735158,
"learning_rate": 1.3114250787278128e-07,
"loss": 0.2276,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17410314083099365,
"step": 4510,
"valid_targets_mean": 5005.2,
"valid_targets_min": 560
},
{
"epoch": 6.7792792792792795,
"grad_norm": 0.5558176857114882,
"learning_rate": 1.2271979118936074e-07,
"loss": 0.2114,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17912578582763672,
"step": 4515,
"valid_targets_mean": 3863.8,
"valid_targets_min": 853
},
{
"epoch": 6.786786786786787,
"grad_norm": 0.635474987483276,
"learning_rate": 1.1457577149468268e-07,
"loss": 0.1884,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17979639768600464,
"step": 4520,
"valid_targets_mean": 3391.7,
"valid_targets_min": 429
},
{
"epoch": 6.7942942942942945,
"grad_norm": 0.794907141047451,
"learning_rate": 1.0671056297507642e-07,
"loss": 0.2055,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19865292310714722,
"step": 4525,
"valid_targets_mean": 2033.5,
"valid_targets_min": 584
},
{
"epoch": 6.801801801801802,
"grad_norm": 0.49215782912003203,
"learning_rate": 9.91242759077049e-08,
"loss": 0.2204,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15488871932029724,
"step": 4530,
"valid_targets_mean": 4630.8,
"valid_targets_min": 639
},
{
"epoch": 6.8093093093093096,
"grad_norm": 0.6173142764754961,
"learning_rate": 9.181701665899268e-08,
"loss": 0.1977,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18007370829582214,
"step": 4535,
"valid_targets_mean": 4323.4,
"valid_targets_min": 696
},
{
"epoch": 6.816816816816817,
"grad_norm": 0.7575394360176801,
"learning_rate": 8.47888876831604e-08,
"loss": 0.2296,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24876675009727478,
"step": 4540,
"valid_targets_mean": 3193.3,
"valid_targets_min": 277
},
{
"epoch": 6.824324324324325,
"grad_norm": 0.5819569698944355,
"learning_rate": 7.803998752076824e-08,
"loss": 0.1881,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17346233129501343,
"step": 4545,
"valid_targets_mean": 5187.9,
"valid_targets_min": 643
},
{
"epoch": 6.831831831831832,
"grad_norm": 0.4396136217756035,
"learning_rate": 7.157041079734584e-08,
"loss": 0.2325,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.18130743503570557,
"step": 4550,
"valid_targets_mean": 5762.4,
"valid_targets_min": 1228
},
{
"epoch": 6.83933933933934,
"grad_norm": 0.4687226820184863,
"learning_rate": 6.538024822206224e-08,
"loss": 0.2008,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1852032095193863,
"step": 4555,
"valid_targets_mean": 5690.4,
"valid_targets_min": 702
},
{
"epoch": 6.846846846846847,
"grad_norm": 0.6527972240202853,
"learning_rate": 5.946958658645141e-08,
"loss": 0.2255,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21088294684886932,
"step": 4560,
"valid_targets_mean": 3305.9,
"valid_targets_min": 371
},
{
"epoch": 6.854354354354355,
"grad_norm": 0.5747007613275369,
"learning_rate": 5.383850876319763e-08,
"loss": 0.1834,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16404512524604797,
"step": 4565,
"valid_targets_mean": 3822.6,
"valid_targets_min": 609
},
{
"epoch": 6.861861861861862,
"grad_norm": 0.5712891848122477,
"learning_rate": 4.848709370498084e-08,
"loss": 0.2022,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.24901172518730164,
"step": 4570,
"valid_targets_mean": 5079.1,
"valid_targets_min": 574
},
{
"epoch": 6.86936936936937,
"grad_norm": 0.4949929365077814,
"learning_rate": 4.34154164433509e-08,
"loss": 0.1955,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17748858034610748,
"step": 4575,
"valid_targets_mean": 4491.8,
"valid_targets_min": 634
},
{
"epoch": 6.876876876876877,
"grad_norm": 0.5203752172969807,
"learning_rate": 3.86235480876973e-08,
"loss": 0.2374,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2086370289325714,
"step": 4580,
"valid_targets_mean": 5460.8,
"valid_targets_min": 622
},
{
"epoch": 6.884384384384385,
"grad_norm": 0.5124535100635832,
"learning_rate": 3.411155582423664e-08,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.16645345091819763,
"step": 4585,
"valid_targets_mean": 4649.4,
"valid_targets_min": 549
},
{
"epoch": 6.891891891891892,
"grad_norm": 0.6965621530697311,
"learning_rate": 2.9879502915075574e-08,
"loss": 0.2214,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21695250272750854,
"step": 4590,
"valid_targets_mean": 3357.6,
"valid_targets_min": 704
},
{
"epoch": 6.8993993993994,
"grad_norm": 0.5009549067493665,
"learning_rate": 2.592744869732933e-08,
"loss": 0.1793,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2433704286813736,
"step": 4595,
"valid_targets_mean": 5021.1,
"valid_targets_min": 535
},
{
"epoch": 6.906906906906907,
"grad_norm": 0.6325006211055703,
"learning_rate": 2.2255448582280127e-08,
"loss": 0.1923,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1930675059556961,
"step": 4600,
"valid_targets_mean": 3954.0,
"valid_targets_min": 562
},
{
"epoch": 6.914414414414415,
"grad_norm": 0.5272145532637147,
"learning_rate": 1.8863554054606715e-08,
"loss": 0.1888,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1625824272632599,
"step": 4605,
"valid_targets_mean": 4323.2,
"valid_targets_min": 1190
},
{
"epoch": 6.921921921921922,
"grad_norm": 0.5329661463696542,
"learning_rate": 1.5751812671658264e-08,
"loss": 0.2071,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19332969188690186,
"step": 4610,
"valid_targets_mean": 4747.9,
"valid_targets_min": 906
},
{
"epoch": 6.92942942942943,
"grad_norm": 0.5417369482444132,
"learning_rate": 1.2920268062794894e-08,
"loss": 0.2086,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19969046115875244,
"step": 4615,
"valid_targets_mean": 4192.8,
"valid_targets_min": 728
},
{
"epoch": 6.936936936936937,
"grad_norm": 0.6878033594654033,
"learning_rate": 1.0368959928763744e-08,
"loss": 0.2053,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21517297625541687,
"step": 4620,
"valid_targets_mean": 3462.9,
"valid_targets_min": 709
},
{
"epoch": 6.944444444444445,
"grad_norm": 0.5692311923901623,
"learning_rate": 8.097924041157168e-09,
"loss": 0.1876,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.17874173820018768,
"step": 4625,
"valid_targets_mean": 3834.8,
"valid_targets_min": 605
},
{
"epoch": 6.951951951951952,
"grad_norm": 0.8120108501447949,
"learning_rate": 6.107192241897597e-09,
"loss": 0.1783,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.19116508960723877,
"step": 4630,
"valid_targets_mean": 3737.9,
"valid_targets_min": 756
},
{
"epoch": 6.95945945945946,
"grad_norm": 0.6343758559646698,
"learning_rate": 4.396792442800113e-09,
"loss": 0.2174,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2372244894504547,
"step": 4635,
"valid_targets_mean": 5020.9,
"valid_targets_min": 821
},
{
"epoch": 6.966966966966967,
"grad_norm": 0.4747536212588191,
"learning_rate": 2.9667486251794274e-09,
"loss": 0.1961,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.15623793005943298,
"step": 4640,
"valid_targets_mean": 5340.8,
"valid_targets_min": 611
},
{
"epoch": 6.974474474474475,
"grad_norm": 0.4663889436387785,
"learning_rate": 1.8170808395079342e-09,
"loss": 0.2291,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.204878568649292,
"step": 4645,
"valid_targets_mean": 5754.1,
"valid_targets_min": 2157
},
{
"epoch": 6.981981981981982,
"grad_norm": 0.5618969419816342,
"learning_rate": 9.47805205140373e-10,
"loss": 0.196,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.2027861475944519,
"step": 4650,
"valid_targets_mean": 4324.8,
"valid_targets_min": 736
},
{
"epoch": 6.98948948948949,
"grad_norm": 0.440752938378733,
"learning_rate": 3.589339100917855e-10,
"loss": 0.1985,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21129390597343445,
"step": 4655,
"valid_targets_mean": 6267.5,
"valid_targets_min": 686
},
{
"epoch": 6.996996996996997,
"grad_norm": 0.5759092607170879,
"learning_rate": 5.0475210853218045e-11,
"loss": 0.2195,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.21579566597938538,
"step": 4660,
"valid_targets_mean": 4775.2,
"valid_targets_min": 824
},
{
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.1870056539773941,
"step": 4662,
"total_flos": 1420700030337024.0,
"train_loss": 0.25631797409579254,
"train_runtime": 31285.8836,
"train_samples_per_second": 2.384,
"train_steps_per_second": 0.149,
"valid_targets_mean": 4345.4,
"valid_targets_min": 624
}
],
"logging_steps": 5,
"max_steps": 4662,
"num_input_tokens_seen": 0,
"num_train_epochs": 7,
"save_steps": 1500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1420700030337024.0,
"train_batch_size": 1,
"trial_name": null,
"trial_params": null
}