{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4305, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.008130081300813009, "grad_norm": 10.729355259341085, "learning_rate": 3.7122969837587006e-07, "loss": 0.5735, "loss_nan_ranks": 0, "loss_rank_avg": 0.24004313349723816, "step": 5, "valid_targets_mean": 2614.5, "valid_targets_min": 988 }, { "epoch": 0.016260162601626018, "grad_norm": 9.95614411374737, "learning_rate": 8.352668213457077e-07, "loss": 0.5844, "loss_nan_ranks": 0, "loss_rank_avg": 0.3054102659225464, "step": 10, "valid_targets_mean": 6700.2, "valid_targets_min": 1022 }, { "epoch": 0.024390243902439025, "grad_norm": 8.490830318504097, "learning_rate": 1.2993039443155453e-06, "loss": 0.5273, "loss_nan_ranks": 0, "loss_rank_avg": 0.27064454555511475, "step": 15, "valid_targets_mean": 4731.8, "valid_targets_min": 1171 }, { "epoch": 0.032520325203252036, "grad_norm": 5.508858253527907, "learning_rate": 1.7633410672853829e-06, "loss": 0.5604, "loss_nan_ranks": 0, "loss_rank_avg": 0.28161105513572693, "step": 20, "valid_targets_mean": 5939.0, "valid_targets_min": 1208 }, { "epoch": 0.04065040650406504, "grad_norm": 4.244414584795395, "learning_rate": 2.2273781902552207e-06, "loss": 0.525, "loss_nan_ranks": 0, "loss_rank_avg": 0.19481831789016724, "step": 25, "valid_targets_mean": 2888.2, "valid_targets_min": 708 }, { "epoch": 0.04878048780487805, "grad_norm": 2.9008493875224715, "learning_rate": 2.691415313225058e-06, "loss": 0.4719, "loss_nan_ranks": 0, "loss_rank_avg": 0.24280954897403717, "step": 30, "valid_targets_mean": 7361.0, "valid_targets_min": 1507 }, { "epoch": 0.056910569105691054, "grad_norm": 3.4096382562645484, "learning_rate": 3.155452436194896e-06, "loss": 0.49, "loss_nan_ranks": 0, "loss_rank_avg": 0.24371470510959625, "step": 35, "valid_targets_mean": 3680.0, "valid_targets_min": 1599 }, { "epoch": 0.06504065040650407, "grad_norm": 2.056871731875376, "learning_rate": 3.6194895591647333e-06, "loss": 0.446, "loss_nan_ranks": 0, "loss_rank_avg": 0.14936479926109314, "step": 40, "valid_targets_mean": 3807.8, "valid_targets_min": 1098 }, { "epoch": 0.07317073170731707, "grad_norm": 0.9901834399287566, "learning_rate": 4.083526682134571e-06, "loss": 0.4223, "loss_nan_ranks": 0, "loss_rank_avg": 0.14713236689567566, "step": 45, "valid_targets_mean": 4927.4, "valid_targets_min": 1369 }, { "epoch": 0.08130081300813008, "grad_norm": 0.9398360387681741, "learning_rate": 4.547563805104409e-06, "loss": 0.4316, "loss_nan_ranks": 0, "loss_rank_avg": 0.16155597567558289, "step": 50, "valid_targets_mean": 4512.9, "valid_targets_min": 1585 }, { "epoch": 0.08943089430894309, "grad_norm": 0.8775743692611262, "learning_rate": 5.011600928074246e-06, "loss": 0.3961, "loss_nan_ranks": 0, "loss_rank_avg": 0.2303980439901352, "step": 55, "valid_targets_mean": 4560.0, "valid_targets_min": 985 }, { "epoch": 0.0975609756097561, "grad_norm": 0.795569922663752, "learning_rate": 5.4756380510440845e-06, "loss": 0.3787, "loss_nan_ranks": 0, "loss_rank_avg": 0.16651669144630432, "step": 60, "valid_targets_mean": 3114.6, "valid_targets_min": 1042 }, { "epoch": 0.10569105691056911, "grad_norm": 0.7519872281053458, "learning_rate": 5.939675174013921e-06, "loss": 0.3569, "loss_nan_ranks": 0, "loss_rank_avg": 0.17810176312923431, "step": 65, "valid_targets_mean": 3038.5, "valid_targets_min": 1407 }, { "epoch": 0.11382113821138211, "grad_norm": 0.5792804598494421, "learning_rate": 6.403712296983759e-06, "loss": 0.3246, "loss_nan_ranks": 0, "loss_rank_avg": 0.1996963620185852, "step": 70, "valid_targets_mean": 5235.0, "valid_targets_min": 1850 }, { "epoch": 0.12195121951219512, "grad_norm": 0.4824690597797212, "learning_rate": 6.867749419953597e-06, "loss": 0.3565, "loss_nan_ranks": 0, "loss_rank_avg": 0.18132978677749634, "step": 75, "valid_targets_mean": 6870.2, "valid_targets_min": 1801 }, { "epoch": 0.13008130081300814, "grad_norm": 0.5501428825070286, "learning_rate": 7.331786542923435e-06, "loss": 0.3333, "loss_nan_ranks": 0, "loss_rank_avg": 0.163741797208786, "step": 80, "valid_targets_mean": 4903.1, "valid_targets_min": 1105 }, { "epoch": 0.13821138211382114, "grad_norm": 0.515640618796055, "learning_rate": 7.795823665893271e-06, "loss": 0.3231, "loss_nan_ranks": 0, "loss_rank_avg": 0.1189749538898468, "step": 85, "valid_targets_mean": 4170.2, "valid_targets_min": 1259 }, { "epoch": 0.14634146341463414, "grad_norm": 0.6231036421396678, "learning_rate": 8.25986078886311e-06, "loss": 0.3143, "loss_nan_ranks": 0, "loss_rank_avg": 0.10459889471530914, "step": 90, "valid_targets_mean": 2787.4, "valid_targets_min": 820 }, { "epoch": 0.15447154471544716, "grad_norm": 0.47776022024330533, "learning_rate": 8.723897911832948e-06, "loss": 0.3215, "loss_nan_ranks": 0, "loss_rank_avg": 0.1699979603290558, "step": 95, "valid_targets_mean": 5565.5, "valid_targets_min": 691 }, { "epoch": 0.16260162601626016, "grad_norm": 0.43049029114582227, "learning_rate": 9.187935034802784e-06, "loss": 0.3178, "loss_nan_ranks": 0, "loss_rank_avg": 0.16746115684509277, "step": 100, "valid_targets_mean": 8008.9, "valid_targets_min": 3875 }, { "epoch": 0.17073170731707318, "grad_norm": 0.5506518790709487, "learning_rate": 9.651972157772623e-06, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.17378145456314087, "step": 105, "valid_targets_mean": 5575.4, "valid_targets_min": 1059 }, { "epoch": 0.17886178861788618, "grad_norm": 0.8343481888737161, "learning_rate": 1.011600928074246e-05, "loss": 0.3039, "loss_nan_ranks": 0, "loss_rank_avg": 0.13841012120246887, "step": 110, "valid_targets_mean": 6387.9, "valid_targets_min": 1380 }, { "epoch": 0.18699186991869918, "grad_norm": 0.4678403515176022, "learning_rate": 1.0580046403712299e-05, "loss": 0.3303, "loss_nan_ranks": 0, "loss_rank_avg": 0.2064119130373001, "step": 115, "valid_targets_mean": 7768.4, "valid_targets_min": 1619 }, { "epoch": 0.1951219512195122, "grad_norm": 0.36446029955073816, "learning_rate": 1.1044083526682134e-05, "loss": 0.3097, "loss_nan_ranks": 0, "loss_rank_avg": 0.1493927538394928, "step": 120, "valid_targets_mean": 8210.1, "valid_targets_min": 2419 }, { "epoch": 0.2032520325203252, "grad_norm": 0.5532632575478795, "learning_rate": 1.1508120649651972e-05, "loss": 0.2989, "loss_nan_ranks": 0, "loss_rank_avg": 0.1957596093416214, "step": 125, "valid_targets_mean": 5523.8, "valid_targets_min": 1219 }, { "epoch": 0.21138211382113822, "grad_norm": 0.4918145090486274, "learning_rate": 1.197215777262181e-05, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.1981673538684845, "step": 130, "valid_targets_mean": 8387.9, "valid_targets_min": 1912 }, { "epoch": 0.21951219512195122, "grad_norm": 0.4824040162688919, "learning_rate": 1.2436194895591649e-05, "loss": 0.3072, "loss_nan_ranks": 0, "loss_rank_avg": 0.12638956308364868, "step": 135, "valid_targets_mean": 5431.0, "valid_targets_min": 1759 }, { "epoch": 0.22764227642276422, "grad_norm": 0.5178853741428794, "learning_rate": 1.2900232018561485e-05, "loss": 0.3109, "loss_nan_ranks": 0, "loss_rank_avg": 0.18286965787410736, "step": 140, "valid_targets_mean": 4913.8, "valid_targets_min": 1029 }, { "epoch": 0.23577235772357724, "grad_norm": 0.5486837832887713, "learning_rate": 1.3364269141531323e-05, "loss": 0.3227, "loss_nan_ranks": 0, "loss_rank_avg": 0.26483672857284546, "step": 145, "valid_targets_mean": 7427.6, "valid_targets_min": 1096 }, { "epoch": 0.24390243902439024, "grad_norm": 0.47855051057921927, "learning_rate": 1.3828306264501162e-05, "loss": 0.2856, "loss_nan_ranks": 0, "loss_rank_avg": 0.1614745557308197, "step": 150, "valid_targets_mean": 5602.1, "valid_targets_min": 961 }, { "epoch": 0.25203252032520324, "grad_norm": 0.5353775633039806, "learning_rate": 1.4292343387471e-05, "loss": 0.296, "loss_nan_ranks": 0, "loss_rank_avg": 0.16262441873550415, "step": 155, "valid_targets_mean": 4503.0, "valid_targets_min": 733 }, { "epoch": 0.2601626016260163, "grad_norm": 0.46885526862806487, "learning_rate": 1.4756380510440838e-05, "loss": 0.2983, "loss_nan_ranks": 0, "loss_rank_avg": 0.12933751940727234, "step": 160, "valid_targets_mean": 5221.4, "valid_targets_min": 456 }, { "epoch": 0.2682926829268293, "grad_norm": 0.5510357143973084, "learning_rate": 1.5220417633410673e-05, "loss": 0.2769, "loss_nan_ranks": 0, "loss_rank_avg": 0.14275045692920685, "step": 165, "valid_targets_mean": 3452.2, "valid_targets_min": 175 }, { "epoch": 0.2764227642276423, "grad_norm": 0.5986519641807708, "learning_rate": 1.5684454756380513e-05, "loss": 0.2867, "loss_nan_ranks": 0, "loss_rank_avg": 0.2011912316083908, "step": 170, "valid_targets_mean": 5387.8, "valid_targets_min": 1825 }, { "epoch": 0.2845528455284553, "grad_norm": 0.7983475971758657, "learning_rate": 1.614849187935035e-05, "loss": 0.2953, "loss_nan_ranks": 0, "loss_rank_avg": 0.1250675469636917, "step": 175, "valid_targets_mean": 2584.2, "valid_targets_min": 1308 }, { "epoch": 0.2926829268292683, "grad_norm": 0.5300705164920657, "learning_rate": 1.661252900232019e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.14062389731407166, "step": 180, "valid_targets_mean": 4876.6, "valid_targets_min": 2482 }, { "epoch": 0.3008130081300813, "grad_norm": 0.4645501589874264, "learning_rate": 1.7076566125290022e-05, "loss": 0.2959, "loss_nan_ranks": 0, "loss_rank_avg": 0.10153844952583313, "step": 185, "valid_targets_mean": 4490.9, "valid_targets_min": 938 }, { "epoch": 0.3089430894308943, "grad_norm": 0.5394172146224312, "learning_rate": 1.7540603248259862e-05, "loss": 0.2887, "loss_nan_ranks": 0, "loss_rank_avg": 0.1731753945350647, "step": 190, "valid_targets_mean": 6405.1, "valid_targets_min": 1564 }, { "epoch": 0.3170731707317073, "grad_norm": 0.6081161338172066, "learning_rate": 1.80046403712297e-05, "loss": 0.291, "loss_nan_ranks": 0, "loss_rank_avg": 0.09163825213909149, "step": 195, "valid_targets_mean": 2425.0, "valid_targets_min": 882 }, { "epoch": 0.3252032520325203, "grad_norm": 0.39700152309765374, "learning_rate": 1.846867749419954e-05, "loss": 0.3043, "loss_nan_ranks": 0, "loss_rank_avg": 0.1639854609966278, "step": 200, "valid_targets_mean": 9026.9, "valid_targets_min": 1543 }, { "epoch": 0.3333333333333333, "grad_norm": 1.1686077596478834, "learning_rate": 1.8932714617169375e-05, "loss": 0.2797, "loss_nan_ranks": 0, "loss_rank_avg": 0.12743505835533142, "step": 205, "valid_targets_mean": 4637.0, "valid_targets_min": 1690 }, { "epoch": 0.34146341463414637, "grad_norm": 0.5152584843628413, "learning_rate": 1.9396751740139212e-05, "loss": 0.3006, "loss_nan_ranks": 0, "loss_rank_avg": 0.11795099079608917, "step": 210, "valid_targets_mean": 3623.4, "valid_targets_min": 1597 }, { "epoch": 0.34959349593495936, "grad_norm": 0.40931960381507093, "learning_rate": 1.986078886310905e-05, "loss": 0.2783, "loss_nan_ranks": 0, "loss_rank_avg": 0.19876506924629211, "step": 215, "valid_targets_mean": 10234.2, "valid_targets_min": 795 }, { "epoch": 0.35772357723577236, "grad_norm": 0.5681020072245295, "learning_rate": 2.0324825986078888e-05, "loss": 0.2613, "loss_nan_ranks": 0, "loss_rank_avg": 0.138270765542984, "step": 220, "valid_targets_mean": 4483.9, "valid_targets_min": 922 }, { "epoch": 0.36585365853658536, "grad_norm": 0.6620929272244965, "learning_rate": 2.0788863109048725e-05, "loss": 0.3119, "loss_nan_ranks": 0, "loss_rank_avg": 0.26536881923675537, "step": 225, "valid_targets_mean": 4992.5, "valid_targets_min": 1766 }, { "epoch": 0.37398373983739835, "grad_norm": 0.473185582494688, "learning_rate": 2.125290023201856e-05, "loss": 0.2741, "loss_nan_ranks": 0, "loss_rank_avg": 0.17839691042900085, "step": 230, "valid_targets_mean": 8155.8, "valid_targets_min": 1768 }, { "epoch": 0.3821138211382114, "grad_norm": 0.5676414017591311, "learning_rate": 2.17169373549884e-05, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.15132203698158264, "step": 235, "valid_targets_mean": 3835.4, "valid_targets_min": 1300 }, { "epoch": 0.3902439024390244, "grad_norm": 0.5829173056048123, "learning_rate": 2.2180974477958238e-05, "loss": 0.2926, "loss_nan_ranks": 0, "loss_rank_avg": 0.10389190167188644, "step": 240, "valid_targets_mean": 3737.4, "valid_targets_min": 1126 }, { "epoch": 0.3983739837398374, "grad_norm": 0.4496112265820951, "learning_rate": 2.2645011600928078e-05, "loss": 0.2652, "loss_nan_ranks": 0, "loss_rank_avg": 0.1356901228427887, "step": 245, "valid_targets_mean": 6019.0, "valid_targets_min": 1824 }, { "epoch": 0.4065040650406504, "grad_norm": 0.6433613059763399, "learning_rate": 2.3109048723897914e-05, "loss": 0.2815, "loss_nan_ranks": 0, "loss_rank_avg": 0.13550019264221191, "step": 250, "valid_targets_mean": 3801.2, "valid_targets_min": 1174 }, { "epoch": 0.4146341463414634, "grad_norm": 0.6396160632853143, "learning_rate": 2.357308584686775e-05, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.1697913110256195, "step": 255, "valid_targets_mean": 3961.4, "valid_targets_min": 1502 }, { "epoch": 0.42276422764227645, "grad_norm": 0.4542094599236192, "learning_rate": 2.4037122969837587e-05, "loss": 0.2683, "loss_nan_ranks": 0, "loss_rank_avg": 0.09232847392559052, "step": 260, "valid_targets_mean": 4648.8, "valid_targets_min": 1023 }, { "epoch": 0.43089430894308944, "grad_norm": 0.5412227898339419, "learning_rate": 2.4501160092807427e-05, "loss": 0.2728, "loss_nan_ranks": 0, "loss_rank_avg": 0.1287793219089508, "step": 265, "valid_targets_mean": 4237.9, "valid_targets_min": 1086 }, { "epoch": 0.43902439024390244, "grad_norm": 0.4177869578429799, "learning_rate": 2.4965197215777264e-05, "loss": 0.253, "loss_nan_ranks": 0, "loss_rank_avg": 0.1671661138534546, "step": 270, "valid_targets_mean": 9169.6, "valid_targets_min": 4230 }, { "epoch": 0.44715447154471544, "grad_norm": 0.47683007534315536, "learning_rate": 2.54292343387471e-05, "loss": 0.2598, "loss_nan_ranks": 0, "loss_rank_avg": 0.11259545385837555, "step": 275, "valid_targets_mean": 4597.0, "valid_targets_min": 1167 }, { "epoch": 0.45528455284552843, "grad_norm": 0.528485160665934, "learning_rate": 2.589327146171694e-05, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.11031106859445572, "step": 280, "valid_targets_mean": 5527.1, "valid_targets_min": 1031 }, { "epoch": 0.4634146341463415, "grad_norm": 0.6449048798012383, "learning_rate": 2.6357308584686777e-05, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.16236139833927155, "step": 285, "valid_targets_mean": 3449.2, "valid_targets_min": 900 }, { "epoch": 0.4715447154471545, "grad_norm": 0.47651550237539747, "learning_rate": 2.6821345707656617e-05, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.16859616339206696, "step": 290, "valid_targets_mean": 6841.1, "valid_targets_min": 1434 }, { "epoch": 0.4796747967479675, "grad_norm": 0.5060381133309334, "learning_rate": 2.7285382830626453e-05, "loss": 0.2698, "loss_nan_ranks": 0, "loss_rank_avg": 0.15308891236782074, "step": 295, "valid_targets_mean": 6108.2, "valid_targets_min": 1979 }, { "epoch": 0.4878048780487805, "grad_norm": 0.46570844149760965, "learning_rate": 2.774941995359629e-05, "loss": 0.2634, "loss_nan_ranks": 0, "loss_rank_avg": 0.07817001640796661, "step": 300, "valid_targets_mean": 2998.5, "valid_targets_min": 1532 }, { "epoch": 0.4959349593495935, "grad_norm": 0.5748363877093409, "learning_rate": 2.8213457076566126e-05, "loss": 0.2872, "loss_nan_ranks": 0, "loss_rank_avg": 0.2178957462310791, "step": 305, "valid_targets_mean": 4954.2, "valid_targets_min": 1530 }, { "epoch": 0.5040650406504065, "grad_norm": 0.4913109666435666, "learning_rate": 2.8677494199535966e-05, "loss": 0.2593, "loss_nan_ranks": 0, "loss_rank_avg": 0.08731204271316528, "step": 310, "valid_targets_mean": 3538.8, "valid_targets_min": 814 }, { "epoch": 0.5121951219512195, "grad_norm": 0.4731336417357327, "learning_rate": 2.9141531322505803e-05, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.10972920060157776, "step": 315, "valid_targets_mean": 4589.5, "valid_targets_min": 716 }, { "epoch": 0.5203252032520326, "grad_norm": 0.544587609060752, "learning_rate": 2.9605568445475643e-05, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.10782943665981293, "step": 320, "valid_targets_mean": 3388.5, "valid_targets_min": 967 }, { "epoch": 0.5284552845528455, "grad_norm": 0.5206054830318291, "learning_rate": 3.006960556844548e-05, "loss": 0.2557, "loss_nan_ranks": 0, "loss_rank_avg": 0.11411543190479279, "step": 325, "valid_targets_mean": 3479.6, "valid_targets_min": 754 }, { "epoch": 0.5365853658536586, "grad_norm": 0.5109963804533619, "learning_rate": 3.053364269141532e-05, "loss": 0.2803, "loss_nan_ranks": 0, "loss_rank_avg": 0.11475864052772522, "step": 330, "valid_targets_mean": 3898.2, "valid_targets_min": 639 }, { "epoch": 0.5447154471544715, "grad_norm": 0.49736930558210946, "learning_rate": 3.099767981438515e-05, "loss": 0.2668, "loss_nan_ranks": 0, "loss_rank_avg": 0.09260010719299316, "step": 335, "valid_targets_mean": 3543.0, "valid_targets_min": 1186 }, { "epoch": 0.5528455284552846, "grad_norm": 1.4224554880291065, "learning_rate": 3.146171693735499e-05, "loss": 0.2782, "loss_nan_ranks": 0, "loss_rank_avg": 0.1166592612862587, "step": 340, "valid_targets_mean": 6083.1, "valid_targets_min": 783 }, { "epoch": 0.5609756097560976, "grad_norm": 0.6507048259502546, "learning_rate": 3.1925754060324825e-05, "loss": 0.2783, "loss_nan_ranks": 0, "loss_rank_avg": 0.11932586133480072, "step": 345, "valid_targets_mean": 2966.4, "valid_targets_min": 1495 }, { "epoch": 0.5691056910569106, "grad_norm": 0.5262338877240812, "learning_rate": 3.2389791183294665e-05, "loss": 0.2748, "loss_nan_ranks": 0, "loss_rank_avg": 0.18811023235321045, "step": 350, "valid_targets_mean": 6847.5, "valid_targets_min": 1820 }, { "epoch": 0.5772357723577236, "grad_norm": 0.7190553945803088, "learning_rate": 3.2853828306264505e-05, "loss": 0.2788, "loss_nan_ranks": 0, "loss_rank_avg": 0.1663609743118286, "step": 355, "valid_targets_mean": 4037.1, "valid_targets_min": 1123 }, { "epoch": 0.5853658536585366, "grad_norm": 0.5338816539006683, "learning_rate": 3.3317865429234345e-05, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.13983416557312012, "step": 360, "valid_targets_mean": 5041.6, "valid_targets_min": 1378 }, { "epoch": 0.5934959349593496, "grad_norm": 0.5021054760120496, "learning_rate": 3.378190255220418e-05, "loss": 0.2559, "loss_nan_ranks": 0, "loss_rank_avg": 0.10287587344646454, "step": 365, "valid_targets_mean": 5181.4, "valid_targets_min": 1034 }, { "epoch": 0.6016260162601627, "grad_norm": 0.6030850444597946, "learning_rate": 3.424593967517402e-05, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.16273638606071472, "step": 370, "valid_targets_mean": 3852.2, "valid_targets_min": 1120 }, { "epoch": 0.6097560975609756, "grad_norm": 0.4200234244730862, "learning_rate": 3.470997679814386e-05, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.13301149010658264, "step": 375, "valid_targets_mean": 5999.4, "valid_targets_min": 1017 }, { "epoch": 0.6178861788617886, "grad_norm": 0.47437564358950707, "learning_rate": 3.517401392111369e-05, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.12184874713420868, "step": 380, "valid_targets_mean": 6132.9, "valid_targets_min": 1141 }, { "epoch": 0.6260162601626016, "grad_norm": 0.5720586708854113, "learning_rate": 3.563805104408353e-05, "loss": 0.2575, "loss_nan_ranks": 0, "loss_rank_avg": 0.08667431026697159, "step": 385, "valid_targets_mean": 2480.5, "valid_targets_min": 845 }, { "epoch": 0.6341463414634146, "grad_norm": 0.45303244769740036, "learning_rate": 3.6102088167053364e-05, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.16857236623764038, "step": 390, "valid_targets_mean": 7660.0, "valid_targets_min": 711 }, { "epoch": 0.6422764227642277, "grad_norm": 0.45737182440597945, "learning_rate": 3.6566125290023204e-05, "loss": 0.2475, "loss_nan_ranks": 0, "loss_rank_avg": 0.10698920488357544, "step": 395, "valid_targets_mean": 4812.4, "valid_targets_min": 1836 }, { "epoch": 0.6504065040650406, "grad_norm": 0.5668819902013378, "learning_rate": 3.7030162412993044e-05, "loss": 0.2697, "loss_nan_ranks": 0, "loss_rank_avg": 0.11894096434116364, "step": 400, "valid_targets_mean": 3405.1, "valid_targets_min": 1117 }, { "epoch": 0.6585365853658537, "grad_norm": 0.4972517400541581, "learning_rate": 3.7494199535962884e-05, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.14403322339057922, "step": 405, "valid_targets_mean": 5518.8, "valid_targets_min": 1220 }, { "epoch": 0.6666666666666666, "grad_norm": 0.4726743985096405, "learning_rate": 3.795823665893272e-05, "loss": 0.2464, "loss_nan_ranks": 0, "loss_rank_avg": 0.1037069782614708, "step": 410, "valid_targets_mean": 4652.2, "valid_targets_min": 971 }, { "epoch": 0.6747967479674797, "grad_norm": 0.5555072614400881, "learning_rate": 3.842227378190256e-05, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.23938646912574768, "step": 415, "valid_targets_mean": 6567.6, "valid_targets_min": 981 }, { "epoch": 0.6829268292682927, "grad_norm": 0.48406443535669796, "learning_rate": 3.888631090487239e-05, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.0925922617316246, "step": 420, "valid_targets_mean": 4397.2, "valid_targets_min": 360 }, { "epoch": 0.6910569105691057, "grad_norm": 0.5051976310215145, "learning_rate": 3.935034802784223e-05, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.09235464036464691, "step": 425, "valid_targets_mean": 4802.4, "valid_targets_min": 722 }, { "epoch": 0.6991869918699187, "grad_norm": 0.5776580965911587, "learning_rate": 3.981438515081207e-05, "loss": 0.2613, "loss_nan_ranks": 0, "loss_rank_avg": 0.09387768059968948, "step": 430, "valid_targets_mean": 2986.2, "valid_targets_min": 1579 }, { "epoch": 0.7073170731707317, "grad_norm": 0.4136218864471342, "learning_rate": 3.9999940813479674e-05, "loss": 0.2463, "loss_nan_ranks": 0, "loss_rank_avg": 0.07906226068735123, "step": 435, "valid_targets_mean": 3723.9, "valid_targets_min": 444 }, { "epoch": 0.7154471544715447, "grad_norm": 0.6531331123865727, "learning_rate": 3.999957911934624e-05, "loss": 0.2553, "loss_nan_ranks": 0, "loss_rank_avg": 0.15597087144851685, "step": 440, "valid_targets_mean": 3835.9, "valid_targets_min": 1892 }, { "epoch": 0.7235772357723578, "grad_norm": 0.5556456726719008, "learning_rate": 3.9998888618418865e-05, "loss": 0.2514, "loss_nan_ranks": 0, "loss_rank_avg": 0.1279674619436264, "step": 445, "valid_targets_mean": 4801.5, "valid_targets_min": 1082 }, { "epoch": 0.7317073170731707, "grad_norm": 0.435881099780943, "learning_rate": 3.999786932204985e-05, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.09787143021821976, "step": 450, "valid_targets_mean": 5274.4, "valid_targets_min": 1537 }, { "epoch": 0.7398373983739838, "grad_norm": 0.5828524476640174, "learning_rate": 3.999652124699712e-05, "loss": 0.2558, "loss_nan_ranks": 0, "loss_rank_avg": 0.10186605900526047, "step": 455, "valid_targets_mean": 2984.5, "valid_targets_min": 702 }, { "epoch": 0.7479674796747967, "grad_norm": 0.5608325699413138, "learning_rate": 3.999484441542395e-05, "loss": 0.2586, "loss_nan_ranks": 0, "loss_rank_avg": 0.1100446879863739, "step": 460, "valid_targets_mean": 4323.4, "valid_targets_min": 1502 }, { "epoch": 0.7560975609756098, "grad_norm": 0.4896854400312324, "learning_rate": 3.999283885489861e-05, "loss": 0.2519, "loss_nan_ranks": 0, "loss_rank_avg": 0.14972570538520813, "step": 465, "valid_targets_mean": 5723.0, "valid_targets_min": 909 }, { "epoch": 0.7642276422764228, "grad_norm": 0.4715745180677696, "learning_rate": 3.999050459839389e-05, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.16658423840999603, "step": 470, "valid_targets_mean": 5921.8, "valid_targets_min": 1605 }, { "epoch": 0.7723577235772358, "grad_norm": 0.4332253434648535, "learning_rate": 3.998784168428657e-05, "loss": 0.2557, "loss_nan_ranks": 0, "loss_rank_avg": 0.16223764419555664, "step": 475, "valid_targets_mean": 8892.9, "valid_targets_min": 979 }, { "epoch": 0.7804878048780488, "grad_norm": 0.49416734264895223, "learning_rate": 3.998485015635677e-05, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.08383375406265259, "step": 480, "valid_targets_mean": 3830.4, "valid_targets_min": 1198 }, { "epoch": 0.7886178861788617, "grad_norm": 0.44223369864110523, "learning_rate": 3.998153006378727e-05, "loss": 0.2387, "loss_nan_ranks": 0, "loss_rank_avg": 0.13400453329086304, "step": 485, "valid_targets_mean": 7611.5, "valid_targets_min": 1080 }, { "epoch": 0.7967479674796748, "grad_norm": 0.4314334619419397, "learning_rate": 3.997788146116267e-05, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.17776936292648315, "step": 490, "valid_targets_mean": 8224.4, "valid_targets_min": 3429 }, { "epoch": 0.8048780487804879, "grad_norm": 0.5567932646873074, "learning_rate": 3.99739044084685e-05, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.11946548521518707, "step": 495, "valid_targets_mean": 3261.8, "valid_targets_min": 1613 }, { "epoch": 0.8130081300813008, "grad_norm": 0.448735762829862, "learning_rate": 3.9969598971090225e-05, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.11881952732801437, "step": 500, "valid_targets_mean": 5543.5, "valid_targets_min": 855 }, { "epoch": 0.8211382113821138, "grad_norm": 0.4402840571732114, "learning_rate": 3.99649652198122e-05, "loss": 0.2517, "loss_nan_ranks": 0, "loss_rank_avg": 0.06367374956607819, "step": 505, "valid_targets_mean": 2775.2, "valid_targets_min": 947 }, { "epoch": 0.8292682926829268, "grad_norm": 0.5282258088763285, "learning_rate": 3.9960003230816456e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.09785593301057816, "step": 510, "valid_targets_mean": 3915.1, "valid_targets_min": 1416 }, { "epoch": 0.8373983739837398, "grad_norm": 0.47773763553327236, "learning_rate": 3.9954713085681504e-05, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.14291530847549438, "step": 515, "valid_targets_mean": 5950.1, "valid_targets_min": 1535 }, { "epoch": 0.8455284552845529, "grad_norm": 0.43337914617536744, "learning_rate": 3.994909487138096e-05, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.12172655761241913, "step": 520, "valid_targets_mean": 5970.8, "valid_targets_min": 783 }, { "epoch": 0.8536585365853658, "grad_norm": 0.5378102457615822, "learning_rate": 3.994314868028212e-05, "loss": 0.2593, "loss_nan_ranks": 0, "loss_rank_avg": 0.11482933908700943, "step": 525, "valid_targets_mean": 3605.8, "valid_targets_min": 1216 }, { "epoch": 0.8617886178861789, "grad_norm": 0.5254260728399146, "learning_rate": 3.9936874610144445e-05, "loss": 0.2507, "loss_nan_ranks": 0, "loss_rank_avg": 0.0977395549416542, "step": 530, "valid_targets_mean": 3598.8, "valid_targets_min": 1098 }, { "epoch": 0.8699186991869918, "grad_norm": 0.7023944839667103, "learning_rate": 3.993027276411793e-05, "loss": 0.2769, "loss_nan_ranks": 0, "loss_rank_avg": 0.15339651703834534, "step": 535, "valid_targets_mean": 5156.0, "valid_targets_min": 1823 }, { "epoch": 0.8780487804878049, "grad_norm": 0.5171186618541325, "learning_rate": 3.992334325074148e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.17998674511909485, "step": 540, "valid_targets_mean": 6728.4, "valid_targets_min": 1272 }, { "epoch": 0.8861788617886179, "grad_norm": 0.48729793764058493, "learning_rate": 3.991608618394102e-05, "loss": 0.2559, "loss_nan_ranks": 0, "loss_rank_avg": 0.09565893560647964, "step": 545, "valid_targets_mean": 3936.9, "valid_targets_min": 857 }, { "epoch": 0.8943089430894309, "grad_norm": 0.5918156970962429, "learning_rate": 3.9908501683027726e-05, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.16014006733894348, "step": 550, "valid_targets_mean": 5782.0, "valid_targets_min": 1197 }, { "epoch": 0.9024390243902439, "grad_norm": 0.425511480308841, "learning_rate": 3.990058987269597e-05, "loss": 0.2425, "loss_nan_ranks": 0, "loss_rank_avg": 0.14624741673469543, "step": 555, "valid_targets_mean": 6264.9, "valid_targets_min": 1428 }, { "epoch": 0.9105691056910569, "grad_norm": 0.48528084892861983, "learning_rate": 3.9892350883021366e-05, "loss": 0.2526, "loss_nan_ranks": 0, "loss_rank_avg": 0.10608323663473129, "step": 560, "valid_targets_mean": 3923.5, "valid_targets_min": 1617 }, { "epoch": 0.9186991869918699, "grad_norm": 0.592407932354164, "learning_rate": 3.988378484945853e-05, "loss": 0.2494, "loss_nan_ranks": 0, "loss_rank_avg": 0.16416841745376587, "step": 565, "valid_targets_mean": 5843.8, "valid_targets_min": 1822 }, { "epoch": 0.926829268292683, "grad_norm": 0.5335924146759159, "learning_rate": 3.987489191283894e-05, "loss": 0.258, "loss_nan_ranks": 0, "loss_rank_avg": 0.14844515919685364, "step": 570, "valid_targets_mean": 4678.9, "valid_targets_min": 1823 }, { "epoch": 0.9349593495934959, "grad_norm": 0.4675439890378004, "learning_rate": 3.9865672219368574e-05, "loss": 0.259, "loss_nan_ranks": 0, "loss_rank_avg": 0.13567769527435303, "step": 575, "valid_targets_mean": 6683.4, "valid_targets_min": 1722 }, { "epoch": 0.943089430894309, "grad_norm": 0.4932120377407363, "learning_rate": 3.98561259206255e-05, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.16627153754234314, "step": 580, "valid_targets_mean": 6879.5, "valid_targets_min": 907 }, { "epoch": 0.9512195121951219, "grad_norm": 0.5090495107560038, "learning_rate": 3.984625317355743e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.12040682882070541, "step": 585, "valid_targets_mean": 4904.8, "valid_targets_min": 1683 }, { "epoch": 0.959349593495935, "grad_norm": 0.40729208022346775, "learning_rate": 3.983605414047908e-05, "loss": 0.228, "loss_nan_ranks": 0, "loss_rank_avg": 0.14297154545783997, "step": 590, "valid_targets_mean": 7401.4, "valid_targets_min": 1109 }, { "epoch": 0.967479674796748, "grad_norm": 0.48289075755238997, "learning_rate": 3.982552898906956e-05, "loss": 0.2588, "loss_nan_ranks": 0, "loss_rank_avg": 0.20392508804798126, "step": 595, "valid_targets_mean": 7309.9, "valid_targets_min": 1793 }, { "epoch": 0.975609756097561, "grad_norm": 0.5207752303596541, "learning_rate": 3.981467789236958e-05, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.16826973855495453, "step": 600, "valid_targets_mean": 6912.4, "valid_targets_min": 1266 }, { "epoch": 0.983739837398374, "grad_norm": 0.4776035225588843, "learning_rate": 3.98035010287786e-05, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.11448101699352264, "step": 605, "valid_targets_mean": 4544.2, "valid_targets_min": 1206 }, { "epoch": 0.991869918699187, "grad_norm": 0.5633422853253012, "learning_rate": 3.979199858205192e-05, "loss": 0.2507, "loss_nan_ranks": 0, "loss_rank_avg": 0.08251610398292542, "step": 610, "valid_targets_mean": 2942.2, "valid_targets_min": 914 }, { "epoch": 1.0, "grad_norm": 0.5823682959160317, "learning_rate": 3.9780170741297655e-05, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.15531808137893677, "step": 615, "valid_targets_mean": 6071.1, "valid_targets_min": 1765 }, { "epoch": 1.008130081300813, "grad_norm": 0.3965158761830316, "learning_rate": 3.976801770097361e-05, "loss": 0.2104, "loss_nan_ranks": 0, "loss_rank_avg": 0.12315788865089417, "step": 620, "valid_targets_mean": 8491.0, "valid_targets_min": 1419 }, { "epoch": 1.016260162601626, "grad_norm": 0.8209524704905038, "learning_rate": 3.975553966088412e-05, "loss": 0.2344, "loss_nan_ranks": 0, "loss_rank_avg": 0.1412154585123062, "step": 625, "valid_targets_mean": 4106.9, "valid_targets_min": 837 }, { "epoch": 1.024390243902439, "grad_norm": 0.38246309720446037, "learning_rate": 3.9742736826176706e-05, "loss": 0.2212, "loss_nan_ranks": 0, "loss_rank_avg": 0.10889215022325516, "step": 630, "valid_targets_mean": 6996.9, "valid_targets_min": 2431 }, { "epoch": 1.032520325203252, "grad_norm": 0.45485234575355044, "learning_rate": 3.9729609407338745e-05, "loss": 0.2061, "loss_nan_ranks": 0, "loss_rank_avg": 0.07304991036653519, "step": 635, "valid_targets_mean": 4595.9, "valid_targets_min": 1186 }, { "epoch": 1.040650406504065, "grad_norm": 0.45037630599723943, "learning_rate": 3.971615762019401e-05, "loss": 0.2496, "loss_nan_ranks": 0, "loss_rank_avg": 0.11517719179391861, "step": 640, "valid_targets_mean": 5899.5, "valid_targets_min": 1202 }, { "epoch": 1.048780487804878, "grad_norm": 0.42484313621126, "learning_rate": 3.970238168589911e-05, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.11953368037939072, "step": 645, "valid_targets_mean": 7097.9, "valid_targets_min": 728 }, { "epoch": 1.056910569105691, "grad_norm": 0.5373937832124734, "learning_rate": 3.968828183093984e-05, "loss": 0.2425, "loss_nan_ranks": 0, "loss_rank_avg": 0.2030530571937561, "step": 650, "valid_targets_mean": 5451.6, "valid_targets_min": 914 }, { "epoch": 1.065040650406504, "grad_norm": 0.5775556839202732, "learning_rate": 3.9673858287127484e-05, "loss": 0.2256, "loss_nan_ranks": 0, "loss_rank_avg": 0.07258522510528564, "step": 655, "valid_targets_mean": 2761.9, "valid_targets_min": 1021 }, { "epoch": 1.0731707317073171, "grad_norm": 0.4668438128769485, "learning_rate": 3.965911129159501e-05, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.11301024258136749, "step": 660, "valid_targets_mean": 4898.1, "valid_targets_min": 837 }, { "epoch": 1.08130081300813, "grad_norm": 0.47013516024956364, "learning_rate": 3.9644041086793115e-05, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.1186167299747467, "step": 665, "valid_targets_mean": 5868.8, "valid_targets_min": 1242 }, { "epoch": 1.089430894308943, "grad_norm": 0.5312618418016917, "learning_rate": 3.9628647920486313e-05, "loss": 0.2324, "loss_nan_ranks": 0, "loss_rank_avg": 0.14017723500728607, "step": 670, "valid_targets_mean": 5641.1, "valid_targets_min": 1378 }, { "epoch": 1.0975609756097562, "grad_norm": 0.5681891495304583, "learning_rate": 3.961293204574881e-05, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.10212357342243195, "step": 675, "valid_targets_mean": 3441.1, "valid_targets_min": 1530 }, { "epoch": 1.1056910569105691, "grad_norm": 0.6065666956962985, "learning_rate": 3.959689372096034e-05, "loss": 0.2406, "loss_nan_ranks": 0, "loss_rank_avg": 0.13657888770103455, "step": 680, "valid_targets_mean": 3406.0, "valid_targets_min": 1091 }, { "epoch": 1.113821138211382, "grad_norm": 0.4844859917334594, "learning_rate": 3.9580533209802e-05, "loss": 0.2439, "loss_nan_ranks": 0, "loss_rank_avg": 0.08240572363138199, "step": 685, "valid_targets_mean": 4039.8, "valid_targets_min": 900 }, { "epoch": 1.1219512195121952, "grad_norm": 0.6990793948181184, "learning_rate": 3.9563850781251785e-05, "loss": 0.2342, "loss_nan_ranks": 0, "loss_rank_avg": 0.11636875569820404, "step": 690, "valid_targets_mean": 3964.8, "valid_targets_min": 1159 }, { "epoch": 1.1300813008130082, "grad_norm": 0.556330864071891, "learning_rate": 3.954684670958027e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.19163313508033752, "step": 695, "valid_targets_mean": 7370.8, "valid_targets_min": 820 }, { "epoch": 1.1382113821138211, "grad_norm": 0.40935712343833286, "learning_rate": 3.9529521274346036e-05, "loss": 0.2298, "loss_nan_ranks": 0, "loss_rank_avg": 0.1110377162694931, "step": 700, "valid_targets_mean": 5178.5, "valid_targets_min": 1448 }, { "epoch": 1.146341463414634, "grad_norm": 0.3940130059339374, "learning_rate": 3.951187476039114e-05, "loss": 0.2343, "loss_nan_ranks": 0, "loss_rank_avg": 0.1282082051038742, "step": 705, "valid_targets_mean": 7301.4, "valid_targets_min": 554 }, { "epoch": 1.1544715447154472, "grad_norm": 0.44484094340330965, "learning_rate": 3.9493907457836355e-05, "loss": 0.2278, "loss_nan_ranks": 0, "loss_rank_avg": 0.17798787355422974, "step": 710, "valid_targets_mean": 8418.2, "valid_targets_min": 988 }, { "epoch": 1.1626016260162602, "grad_norm": 0.5029070645971326, "learning_rate": 3.947561966207646e-05, "loss": 0.216, "loss_nan_ranks": 0, "loss_rank_avg": 0.11835639178752899, "step": 715, "valid_targets_mean": 4406.4, "valid_targets_min": 1903 }, { "epoch": 1.170731707317073, "grad_norm": 0.5253126899420384, "learning_rate": 3.945701167377537e-05, "loss": 0.2482, "loss_nan_ranks": 0, "loss_rank_avg": 0.12034034729003906, "step": 720, "valid_targets_mean": 3810.2, "valid_targets_min": 887 }, { "epoch": 1.1788617886178863, "grad_norm": 0.5203754009367536, "learning_rate": 3.9438083798861145e-05, "loss": 0.2219, "loss_nan_ranks": 0, "loss_rank_avg": 0.158294677734375, "step": 725, "valid_targets_mean": 5777.6, "valid_targets_min": 742 }, { "epoch": 1.1869918699186992, "grad_norm": 0.4596179239456433, "learning_rate": 3.9418836348521045e-05, "loss": 0.2466, "loss_nan_ranks": 0, "loss_rank_avg": 0.09662042558193207, "step": 730, "valid_targets_mean": 4278.9, "valid_targets_min": 922 }, { "epoch": 1.1951219512195121, "grad_norm": 0.5667907157862749, "learning_rate": 3.939926963919635e-05, "loss": 0.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.12269654124975204, "step": 735, "valid_targets_mean": 3766.8, "valid_targets_min": 1459 }, { "epoch": 1.203252032520325, "grad_norm": 0.4819765692219803, "learning_rate": 3.9379383992577166e-05, "loss": 0.24, "loss_nan_ranks": 0, "loss_rank_avg": 0.1358526349067688, "step": 740, "valid_targets_mean": 7279.0, "valid_targets_min": 1649 }, { "epoch": 1.2113821138211383, "grad_norm": 0.5477941987006576, "learning_rate": 3.9359179735597174e-05, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.11408542096614838, "step": 745, "valid_targets_mean": 3712.0, "valid_targets_min": 1354 }, { "epoch": 1.2195121951219512, "grad_norm": 0.45240321164701147, "learning_rate": 3.9338657200428215e-05, "loss": 0.2155, "loss_nan_ranks": 0, "loss_rank_avg": 0.17122586071491241, "step": 750, "valid_targets_mean": 8166.0, "valid_targets_min": 945 }, { "epoch": 1.2276422764227641, "grad_norm": 0.5134051430559291, "learning_rate": 3.931781672447482e-05, "loss": 0.2322, "loss_nan_ranks": 0, "loss_rank_avg": 0.10336388647556305, "step": 755, "valid_targets_mean": 4337.1, "valid_targets_min": 1770 }, { "epoch": 1.2357723577235773, "grad_norm": 0.46248929000623507, "learning_rate": 3.9296658650368707e-05, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.1598723828792572, "step": 760, "valid_targets_mean": 7182.5, "valid_targets_min": 1743 }, { "epoch": 1.2439024390243902, "grad_norm": 0.4045246673600557, "learning_rate": 3.927518332596313e-05, "loss": 0.2414, "loss_nan_ranks": 0, "loss_rank_avg": 0.1024380698800087, "step": 765, "valid_targets_mean": 5769.1, "valid_targets_min": 1796 }, { "epoch": 1.2520325203252032, "grad_norm": 0.5883123618533636, "learning_rate": 3.925339110432716e-05, "loss": 0.2276, "loss_nan_ranks": 0, "loss_rank_avg": 0.1015361100435257, "step": 770, "valid_targets_mean": 3251.4, "valid_targets_min": 1270 }, { "epoch": 1.2601626016260163, "grad_norm": 0.5828148938062185, "learning_rate": 3.923128234373984e-05, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.10613632947206497, "step": 775, "valid_targets_mean": 3267.2, "valid_targets_min": 1370 }, { "epoch": 1.2682926829268293, "grad_norm": 0.40240363329826595, "learning_rate": 3.9208857407684356e-05, "loss": 0.2234, "loss_nan_ranks": 0, "loss_rank_avg": 0.09415178000926971, "step": 780, "valid_targets_mean": 7389.1, "valid_targets_min": 706 }, { "epoch": 1.2764227642276422, "grad_norm": 0.5130971984985822, "learning_rate": 3.918611666484205e-05, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.08123107254505157, "step": 785, "valid_targets_mean": 3929.4, "valid_targets_min": 701 }, { "epoch": 1.2845528455284554, "grad_norm": 0.44592104893541273, "learning_rate": 3.9163060489086305e-05, "loss": 0.2227, "loss_nan_ranks": 0, "loss_rank_avg": 0.08503039181232452, "step": 790, "valid_targets_mean": 4937.2, "valid_targets_min": 770 }, { "epoch": 1.2926829268292683, "grad_norm": 0.43588099867731694, "learning_rate": 3.913968925947647e-05, "loss": 0.2165, "loss_nan_ranks": 0, "loss_rank_avg": 0.07082471251487732, "step": 795, "valid_targets_mean": 4000.6, "valid_targets_min": 1536 }, { "epoch": 1.3008130081300813, "grad_norm": 0.4566753193243506, "learning_rate": 3.91160033602516e-05, "loss": 0.2556, "loss_nan_ranks": 0, "loss_rank_avg": 0.1148664802312851, "step": 800, "valid_targets_mean": 5021.1, "valid_targets_min": 1627 }, { "epoch": 1.3089430894308944, "grad_norm": 0.5165353964813596, "learning_rate": 3.909200318082409e-05, "loss": 0.2337, "loss_nan_ranks": 0, "loss_rank_avg": 0.13186779618263245, "step": 805, "valid_targets_mean": 3941.8, "valid_targets_min": 1181 }, { "epoch": 1.3170731707317074, "grad_norm": 0.5833276887483743, "learning_rate": 3.906768911577337e-05, "loss": 0.2241, "loss_nan_ranks": 0, "loss_rank_avg": 0.10670767724514008, "step": 810, "valid_targets_mean": 3626.6, "valid_targets_min": 1062 }, { "epoch": 1.3252032520325203, "grad_norm": 0.49635872075491133, "learning_rate": 3.9043061564839325e-05, "loss": 0.2366, "loss_nan_ranks": 0, "loss_rank_avg": 0.08261899650096893, "step": 815, "valid_targets_mean": 4500.2, "valid_targets_min": 849 }, { "epoch": 1.3333333333333333, "grad_norm": 0.548229261225524, "learning_rate": 3.901812093291579e-05, "loss": 0.2332, "loss_nan_ranks": 0, "loss_rank_avg": 0.10293751955032349, "step": 820, "valid_targets_mean": 3782.9, "valid_targets_min": 940 }, { "epoch": 1.3414634146341464, "grad_norm": 0.5234071387100208, "learning_rate": 3.8992867630043855e-05, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.07623535394668579, "step": 825, "valid_targets_mean": 2872.5, "valid_targets_min": 994 }, { "epoch": 1.3495934959349594, "grad_norm": 0.5404349957246796, "learning_rate": 3.896730207140512e-05, "loss": 0.2314, "loss_nan_ranks": 0, "loss_rank_avg": 0.12489671260118484, "step": 830, "valid_targets_mean": 3263.4, "valid_targets_min": 1317 }, { "epoch": 1.3577235772357723, "grad_norm": 0.4884698037211131, "learning_rate": 3.894142467731492e-05, "loss": 0.2282, "loss_nan_ranks": 0, "loss_rank_avg": 0.06963957101106644, "step": 835, "valid_targets_mean": 2535.8, "valid_targets_min": 172 }, { "epoch": 1.3658536585365852, "grad_norm": 0.49654709244628675, "learning_rate": 3.891523587321534e-05, "loss": 0.2129, "loss_nan_ranks": 0, "loss_rank_avg": 0.07644413411617279, "step": 840, "valid_targets_mean": 2537.6, "valid_targets_min": 716 }, { "epoch": 1.3739837398373984, "grad_norm": 0.45789596797915566, "learning_rate": 3.888873608966828e-05, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.14082862436771393, "step": 845, "valid_targets_mean": 5098.6, "valid_targets_min": 1615 }, { "epoch": 1.3821138211382114, "grad_norm": 0.42601543684470095, "learning_rate": 3.886192576234836e-05, "loss": 0.248, "loss_nan_ranks": 0, "loss_rank_avg": 0.11353771388530731, "step": 850, "valid_targets_mean": 6617.1, "valid_targets_min": 181 }, { "epoch": 1.3902439024390243, "grad_norm": 0.4460558967093584, "learning_rate": 3.883480533203574e-05, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.07416103035211563, "step": 855, "valid_targets_mean": 3448.2, "valid_targets_min": 1237 }, { "epoch": 1.3983739837398375, "grad_norm": 0.5689795665849158, "learning_rate": 3.880737524460888e-05, "loss": 0.2496, "loss_nan_ranks": 0, "loss_rank_avg": 0.10141883790493011, "step": 860, "valid_targets_mean": 3529.6, "valid_targets_min": 1170 }, { "epoch": 1.4065040650406504, "grad_norm": 0.5523925146103473, "learning_rate": 3.877963595103725e-05, "loss": 0.2292, "loss_nan_ranks": 0, "loss_rank_avg": 0.08235596120357513, "step": 865, "valid_targets_mean": 3140.4, "valid_targets_min": 1076 }, { "epoch": 1.4146341463414633, "grad_norm": 0.5006563508751788, "learning_rate": 3.875158790737383e-05, "loss": 0.2361, "loss_nan_ranks": 0, "loss_rank_avg": 0.14744211733341217, "step": 870, "valid_targets_mean": 5835.6, "valid_targets_min": 1277 }, { "epoch": 1.4227642276422765, "grad_norm": 0.46073040469054943, "learning_rate": 3.87232315747477e-05, "loss": 0.2409, "loss_nan_ranks": 0, "loss_rank_avg": 0.06571760028600693, "step": 875, "valid_targets_mean": 3359.1, "valid_targets_min": 1108 }, { "epoch": 1.4308943089430894, "grad_norm": 0.4835829355742183, "learning_rate": 3.8694567419356414e-05, "loss": 0.242, "loss_nan_ranks": 0, "loss_rank_avg": 0.12007689476013184, "step": 880, "valid_targets_mean": 4315.8, "valid_targets_min": 940 }, { "epoch": 1.4390243902439024, "grad_norm": 0.4536137739618375, "learning_rate": 3.8665595912458346e-05, "loss": 0.2343, "loss_nan_ranks": 0, "loss_rank_avg": 0.11298682540655136, "step": 885, "valid_targets_mean": 5438.1, "valid_targets_min": 2376 }, { "epoch": 1.4471544715447155, "grad_norm": 0.5021045202574305, "learning_rate": 3.863631753036492e-05, "loss": 0.2365, "loss_nan_ranks": 0, "loss_rank_avg": 0.058069903403520584, "step": 890, "valid_targets_mean": 2323.1, "valid_targets_min": 1420 }, { "epoch": 1.4552845528455285, "grad_norm": 0.39426333614827813, "learning_rate": 3.860673275443283e-05, "loss": 0.2404, "loss_nan_ranks": 0, "loss_rank_avg": 0.1470167487859726, "step": 895, "valid_targets_mean": 9059.5, "valid_targets_min": 2964 }, { "epoch": 1.4634146341463414, "grad_norm": 0.6249825194478345, "learning_rate": 3.857684207105606e-05, "loss": 0.2183, "loss_nan_ranks": 0, "loss_rank_avg": 0.10146964341402054, "step": 900, "valid_targets_mean": 3395.1, "valid_targets_min": 1048 }, { "epoch": 1.4715447154471546, "grad_norm": 0.5012413355120879, "learning_rate": 3.854664597165795e-05, "loss": 0.2216, "loss_nan_ranks": 0, "loss_rank_avg": 0.11698883026838303, "step": 905, "valid_targets_mean": 4783.1, "valid_targets_min": 2176 }, { "epoch": 1.4796747967479675, "grad_norm": 0.4596049298495697, "learning_rate": 3.851614495268308e-05, "loss": 0.2303, "loss_nan_ranks": 0, "loss_rank_avg": 0.08823439478874207, "step": 910, "valid_targets_mean": 4672.1, "valid_targets_min": 1174 }, { "epoch": 1.4878048780487805, "grad_norm": 0.3944524603942707, "learning_rate": 3.848533951558912e-05, "loss": 0.2301, "loss_nan_ranks": 0, "loss_rank_avg": 0.1314489096403122, "step": 915, "valid_targets_mean": 8109.9, "valid_targets_min": 2266 }, { "epoch": 1.4959349593495934, "grad_norm": 0.394735121722566, "learning_rate": 3.845423016683856e-05, "loss": 0.2234, "loss_nan_ranks": 0, "loss_rank_avg": 0.09605981409549713, "step": 920, "valid_targets_mean": 6552.8, "valid_targets_min": 1446 }, { "epoch": 1.5040650406504064, "grad_norm": 0.5389195205596354, "learning_rate": 3.842281741789044e-05, "loss": 0.2372, "loss_nan_ranks": 0, "loss_rank_avg": 0.10946165025234222, "step": 925, "valid_targets_mean": 3415.9, "valid_targets_min": 1270 }, { "epoch": 1.5121951219512195, "grad_norm": 0.524120559872235, "learning_rate": 3.839110178519189e-05, "loss": 0.24, "loss_nan_ranks": 0, "loss_rank_avg": 0.15303677320480347, "step": 930, "valid_targets_mean": 4837.9, "valid_targets_min": 1657 }, { "epoch": 1.5203252032520327, "grad_norm": 0.5240421403900116, "learning_rate": 3.835908379016966e-05, "loss": 0.2343, "loss_nan_ranks": 0, "loss_rank_avg": 0.15414929389953613, "step": 935, "valid_targets_mean": 5523.1, "valid_targets_min": 1377 }, { "epoch": 1.5284552845528454, "grad_norm": 0.5224481197292362, "learning_rate": 3.832676395922153e-05, "loss": 0.2241, "loss_nan_ranks": 0, "loss_rank_avg": 0.1074165552854538, "step": 940, "valid_targets_mean": 3784.5, "valid_targets_min": 2352 }, { "epoch": 1.5365853658536586, "grad_norm": 0.5072180548482026, "learning_rate": 3.82941428237077e-05, "loss": 0.2073, "loss_nan_ranks": 0, "loss_rank_avg": 0.12508507072925568, "step": 945, "valid_targets_mean": 4790.2, "valid_targets_min": 1204 }, { "epoch": 1.5447154471544715, "grad_norm": 0.5030735545977771, "learning_rate": 3.826122091994198e-05, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.11002949625253677, "step": 950, "valid_targets_mean": 4168.2, "valid_targets_min": 1034 }, { "epoch": 1.5528455284552845, "grad_norm": 0.4967683087750268, "learning_rate": 3.822799878918307e-05, "loss": 0.2256, "loss_nan_ranks": 0, "loss_rank_avg": 0.10862497240304947, "step": 955, "valid_targets_mean": 3963.9, "valid_targets_min": 763 }, { "epoch": 1.5609756097560976, "grad_norm": 0.4823100231835806, "learning_rate": 3.8194476977625556e-05, "loss": 0.2208, "loss_nan_ranks": 0, "loss_rank_avg": 0.08248058706521988, "step": 960, "valid_targets_mean": 6830.8, "valid_targets_min": 1687 }, { "epoch": 1.5691056910569106, "grad_norm": 0.5049053209040891, "learning_rate": 3.8160656036391024e-05, "loss": 0.2312, "loss_nan_ranks": 0, "loss_rank_avg": 0.061338260769844055, "step": 965, "valid_targets_mean": 4099.9, "valid_targets_min": 1219 }, { "epoch": 1.5772357723577235, "grad_norm": 0.540276950242508, "learning_rate": 3.812653652151893e-05, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.10732004791498184, "step": 970, "valid_targets_mean": 3163.6, "valid_targets_min": 1656 }, { "epoch": 1.5853658536585367, "grad_norm": 0.4835227819538819, "learning_rate": 3.809211899395749e-05, "loss": 0.2194, "loss_nan_ranks": 0, "loss_rank_avg": 0.14421193301677704, "step": 975, "valid_targets_mean": 6843.2, "valid_targets_min": 2950 }, { "epoch": 1.5934959349593496, "grad_norm": 0.5334854543454322, "learning_rate": 3.8057404019554464e-05, "loss": 0.2334, "loss_nan_ranks": 0, "loss_rank_avg": 0.1714661717414856, "step": 980, "valid_targets_mean": 5989.1, "valid_targets_min": 1145 }, { "epoch": 1.6016260162601625, "grad_norm": 0.43166365470341506, "learning_rate": 3.802239216904782e-05, "loss": 0.2324, "loss_nan_ranks": 0, "loss_rank_avg": 0.0918479859828949, "step": 985, "valid_targets_mean": 4852.0, "valid_targets_min": 1623 }, { "epoch": 1.6097560975609757, "grad_norm": 0.4636530333951324, "learning_rate": 3.79870840180564e-05, "loss": 0.2051, "loss_nan_ranks": 0, "loss_rank_avg": 0.06160171329975128, "step": 990, "valid_targets_mean": 3179.1, "valid_targets_min": 1135 }, { "epoch": 1.6178861788617886, "grad_norm": 0.4274181136650196, "learning_rate": 3.795148014707042e-05, "loss": 0.2162, "loss_nan_ranks": 0, "loss_rank_avg": 0.08692105114459991, "step": 995, "valid_targets_mean": 4837.5, "valid_targets_min": 1672 }, { "epoch": 1.6260162601626016, "grad_norm": 0.4703841246931964, "learning_rate": 3.791558114144192e-05, "loss": 0.223, "loss_nan_ranks": 0, "loss_rank_avg": 0.08486643433570862, "step": 1000, "valid_targets_mean": 3899.8, "valid_targets_min": 656 }, { "epoch": 1.6341463414634148, "grad_norm": 0.6624769950377596, "learning_rate": 3.7879387591375174e-05, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.1466502994298935, "step": 1005, "valid_targets_mean": 5033.8, "valid_targets_min": 1566 }, { "epoch": 1.6422764227642277, "grad_norm": 0.4190367189532978, "learning_rate": 3.7842900091916956e-05, "loss": 0.2238, "loss_nan_ranks": 0, "loss_rank_avg": 0.12614805996418, "step": 1010, "valid_targets_mean": 6549.5, "valid_targets_min": 1115 }, { "epoch": 1.6504065040650406, "grad_norm": 0.738418186886985, "learning_rate": 3.7806119242946785e-05, "loss": 0.22, "loss_nan_ranks": 0, "loss_rank_avg": 0.12393393367528915, "step": 1015, "valid_targets_mean": 3459.9, "valid_targets_min": 798 }, { "epoch": 1.6585365853658538, "grad_norm": 0.5644460291732224, "learning_rate": 3.7769045649167034e-05, "loss": 0.2127, "loss_nan_ranks": 0, "loss_rank_avg": 0.11421222984790802, "step": 1020, "valid_targets_mean": 3315.9, "valid_targets_min": 1547 }, { "epoch": 1.6666666666666665, "grad_norm": 0.41320505192823315, "learning_rate": 3.7731679920093e-05, "loss": 0.2213, "loss_nan_ranks": 0, "loss_rank_avg": 0.08888000249862671, "step": 1025, "valid_targets_mean": 6288.9, "valid_targets_min": 1798 }, { "epoch": 1.6747967479674797, "grad_norm": 0.5480236382343993, "learning_rate": 3.7694022670042894e-05, "loss": 0.2204, "loss_nan_ranks": 0, "loss_rank_avg": 0.12863221764564514, "step": 1030, "valid_targets_mean": 3568.1, "valid_targets_min": 1739 }, { "epoch": 1.6829268292682928, "grad_norm": 0.42629628455906676, "learning_rate": 3.765607451812773e-05, "loss": 0.2277, "loss_nan_ranks": 0, "loss_rank_avg": 0.09852313995361328, "step": 1035, "valid_targets_mean": 4824.5, "valid_targets_min": 1052 }, { "epoch": 1.6910569105691056, "grad_norm": 0.5762264821222708, "learning_rate": 3.7617836088241144e-05, "loss": 0.2424, "loss_nan_ranks": 0, "loss_rank_avg": 0.07967015355825424, "step": 1040, "valid_targets_mean": 2944.0, "valid_targets_min": 1051 }, { "epoch": 1.6991869918699187, "grad_norm": 0.4459514021715225, "learning_rate": 3.757930800904914e-05, "loss": 0.2293, "loss_nan_ranks": 0, "loss_rank_avg": 0.08062554895877838, "step": 1045, "valid_targets_mean": 3992.1, "valid_targets_min": 925 }, { "epoch": 1.7073170731707317, "grad_norm": 0.45826392195164917, "learning_rate": 3.754049091397976e-05, "loss": 0.2236, "loss_nan_ranks": 0, "loss_rank_avg": 0.13178986310958862, "step": 1050, "valid_targets_mean": 5064.0, "valid_targets_min": 1014 }, { "epoch": 1.7154471544715446, "grad_norm": 0.45683672813542875, "learning_rate": 3.7501385441212664e-05, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.10273057967424393, "step": 1055, "valid_targets_mean": 5496.4, "valid_targets_min": 1647 }, { "epoch": 1.7235772357723578, "grad_norm": 0.48910396683039425, "learning_rate": 3.746199223366863e-05, "loss": 0.2224, "loss_nan_ranks": 0, "loss_rank_avg": 0.1314147561788559, "step": 1060, "valid_targets_mean": 5321.6, "valid_targets_min": 351 }, { "epoch": 1.7317073170731707, "grad_norm": 0.604640944264289, "learning_rate": 3.7422311938999013e-05, "loss": 0.2423, "loss_nan_ranks": 0, "loss_rank_avg": 0.12249931693077087, "step": 1065, "valid_targets_mean": 4093.8, "valid_targets_min": 1698 }, { "epoch": 1.7398373983739837, "grad_norm": 0.38096825630284653, "learning_rate": 3.738234520957506e-05, "loss": 0.2331, "loss_nan_ranks": 0, "loss_rank_avg": 0.17623598873615265, "step": 1070, "valid_targets_mean": 9686.1, "valid_targets_min": 1532 }, { "epoch": 1.7479674796747968, "grad_norm": 0.4345873658757806, "learning_rate": 3.73420927024772e-05, "loss": 0.2367, "loss_nan_ranks": 0, "loss_rank_avg": 0.1418791115283966, "step": 1075, "valid_targets_mean": 6910.9, "valid_targets_min": 1164 }, { "epoch": 1.7560975609756098, "grad_norm": 0.6342367237361929, "learning_rate": 3.730155507948426e-05, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.11825092136859894, "step": 1080, "valid_targets_mean": 2878.2, "valid_targets_min": 794 }, { "epoch": 1.7642276422764227, "grad_norm": 0.4911237796956687, "learning_rate": 3.726073300706256e-05, "loss": 0.2171, "loss_nan_ranks": 0, "loss_rank_avg": 0.12331271171569824, "step": 1085, "valid_targets_mean": 4839.2, "valid_targets_min": 1012 }, { "epoch": 1.7723577235772359, "grad_norm": 0.5720052301592458, "learning_rate": 3.721962715635495e-05, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.14887095987796783, "step": 1090, "valid_targets_mean": 4142.1, "valid_targets_min": 1840 }, { "epoch": 1.7804878048780488, "grad_norm": 0.5575492029691669, "learning_rate": 3.7178238203169804e-05, "loss": 0.2398, "loss_nan_ranks": 0, "loss_rank_avg": 0.20791137218475342, "step": 1095, "valid_targets_mean": 6027.8, "valid_targets_min": 2228 }, { "epoch": 1.7886178861788617, "grad_norm": 0.39049859672884946, "learning_rate": 3.7136566827969895e-05, "loss": 0.2211, "loss_nan_ranks": 0, "loss_rank_avg": 0.0716979056596756, "step": 1100, "valid_targets_mean": 4628.1, "valid_targets_min": 1101 }, { "epoch": 1.796747967479675, "grad_norm": 0.47421428965884277, "learning_rate": 3.70946137158612e-05, "loss": 0.2237, "loss_nan_ranks": 0, "loss_rank_avg": 0.07806351780891418, "step": 1105, "valid_targets_mean": 3712.0, "valid_targets_min": 1293 }, { "epoch": 1.8048780487804879, "grad_norm": 0.5068968975373506, "learning_rate": 3.705237955658166e-05, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.11200665682554245, "step": 1110, "valid_targets_mean": 5447.4, "valid_targets_min": 788 }, { "epoch": 1.8130081300813008, "grad_norm": 0.5580468796303095, "learning_rate": 3.70098650444898e-05, "loss": 0.2189, "loss_nan_ranks": 0, "loss_rank_avg": 0.1504202038049698, "step": 1115, "valid_targets_mean": 4488.5, "valid_targets_min": 816 }, { "epoch": 1.821138211382114, "grad_norm": 0.4258590181032865, "learning_rate": 3.6967070878553346e-05, "loss": 0.233, "loss_nan_ranks": 0, "loss_rank_avg": 0.054161518812179565, "step": 1120, "valid_targets_mean": 3008.2, "valid_targets_min": 575 }, { "epoch": 1.8292682926829267, "grad_norm": 0.4624366928822223, "learning_rate": 3.692399776233775e-05, "loss": 0.2199, "loss_nan_ranks": 0, "loss_rank_avg": 0.13637976348400116, "step": 1125, "valid_targets_mean": 4433.0, "valid_targets_min": 934 }, { "epoch": 1.8373983739837398, "grad_norm": 0.5349988680640237, "learning_rate": 3.688064640399456e-05, "loss": 0.2274, "loss_nan_ranks": 0, "loss_rank_avg": 0.1040443405508995, "step": 1130, "valid_targets_mean": 3776.0, "valid_targets_min": 1464 }, { "epoch": 1.845528455284553, "grad_norm": 0.4181283196951306, "learning_rate": 3.683701751624983e-05, "loss": 0.2253, "loss_nan_ranks": 0, "loss_rank_avg": 0.08952677249908447, "step": 1135, "valid_targets_mean": 5412.9, "valid_targets_min": 971 }, { "epoch": 1.8536585365853657, "grad_norm": 0.3724889591158931, "learning_rate": 3.67931118163924e-05, "loss": 0.2255, "loss_nan_ranks": 0, "loss_rank_avg": 0.12202881276607513, "step": 1140, "valid_targets_mean": 9458.0, "valid_targets_min": 2193 }, { "epoch": 1.8617886178861789, "grad_norm": 0.5169536041735174, "learning_rate": 3.674893002626208e-05, "loss": 0.2252, "loss_nan_ranks": 0, "loss_rank_avg": 0.09581346809864044, "step": 1145, "valid_targets_mean": 4473.0, "valid_targets_min": 571 }, { "epoch": 1.8699186991869918, "grad_norm": 0.5269674507898049, "learning_rate": 3.6704472872237786e-05, "loss": 0.2228, "loss_nan_ranks": 0, "loss_rank_avg": 0.16145059466362, "step": 1150, "valid_targets_mean": 4877.0, "valid_targets_min": 1250 }, { "epoch": 1.8780487804878048, "grad_norm": 0.46729556622361995, "learning_rate": 3.665974108522562e-05, "loss": 0.2316, "loss_nan_ranks": 0, "loss_rank_avg": 0.09038245677947998, "step": 1155, "valid_targets_mean": 4328.5, "valid_targets_min": 937 }, { "epoch": 1.886178861788618, "grad_norm": 0.5813298392003822, "learning_rate": 3.6614735400646824e-05, "loss": 0.2371, "loss_nan_ranks": 0, "loss_rank_avg": 0.13836345076560974, "step": 1160, "valid_targets_mean": 4373.9, "valid_targets_min": 1026 }, { "epoch": 1.8943089430894309, "grad_norm": 0.5471754039067721, "learning_rate": 3.6569456558425724e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.0936594158411026, "step": 1165, "valid_targets_mean": 3060.2, "valid_targets_min": 1861 }, { "epoch": 1.9024390243902438, "grad_norm": 0.3893905924430736, "learning_rate": 3.6523905302977524e-05, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.10204647481441498, "step": 1170, "valid_targets_mean": 6846.0, "valid_targets_min": 1176 }, { "epoch": 1.910569105691057, "grad_norm": 0.5100100212492299, "learning_rate": 3.64780823831961e-05, "loss": 0.2274, "loss_nan_ranks": 0, "loss_rank_avg": 0.13216924667358398, "step": 1175, "valid_targets_mean": 3942.9, "valid_targets_min": 1280 }, { "epoch": 1.91869918699187, "grad_norm": 0.4019402090250472, "learning_rate": 3.643198855244167e-05, "loss": 0.2393, "loss_nan_ranks": 0, "loss_rank_avg": 0.18250243365764618, "step": 1180, "valid_targets_mean": 9317.6, "valid_targets_min": 1402 }, { "epoch": 1.9268292682926829, "grad_norm": 0.5465059692098683, "learning_rate": 3.6385624568528424e-05, "loss": 0.2191, "loss_nan_ranks": 0, "loss_rank_avg": 0.15493763983249664, "step": 1185, "valid_targets_mean": 5039.5, "valid_targets_min": 1508 }, { "epoch": 1.934959349593496, "grad_norm": 0.46918759776118196, "learning_rate": 3.6338991193712045e-05, "loss": 0.2263, "loss_nan_ranks": 0, "loss_rank_avg": 0.10133281350135803, "step": 1190, "valid_targets_mean": 4153.9, "valid_targets_min": 1435 }, { "epoch": 1.943089430894309, "grad_norm": 0.36245879733356207, "learning_rate": 3.629208919467718e-05, "loss": 0.2144, "loss_nan_ranks": 0, "loss_rank_avg": 0.1810036152601242, "step": 1195, "valid_targets_mean": 12011.8, "valid_targets_min": 3220 }, { "epoch": 1.951219512195122, "grad_norm": 0.5457213202060804, "learning_rate": 3.624491934252487e-05, "loss": 0.2367, "loss_nan_ranks": 0, "loss_rank_avg": 0.0889679342508316, "step": 1200, "valid_targets_mean": 2738.9, "valid_targets_min": 1382 }, { "epoch": 1.959349593495935, "grad_norm": 0.5064331250921682, "learning_rate": 3.619748241275981e-05, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.16250590980052948, "step": 1205, "valid_targets_mean": 5459.4, "valid_targets_min": 1793 }, { "epoch": 1.967479674796748, "grad_norm": 0.4010359059500501, "learning_rate": 3.614977918527767e-05, "loss": 0.2038, "loss_nan_ranks": 0, "loss_rank_avg": 0.09311247617006302, "step": 1210, "valid_targets_mean": 5402.5, "valid_targets_min": 608 }, { "epoch": 1.975609756097561, "grad_norm": 0.45703735377056554, "learning_rate": 3.610181044435221e-05, "loss": 0.2318, "loss_nan_ranks": 0, "loss_rank_avg": 0.12596140801906586, "step": 1215, "valid_targets_mean": 4364.6, "valid_targets_min": 1162 }, { "epoch": 1.9837398373983741, "grad_norm": 0.49264297254095274, "learning_rate": 3.605357697862242e-05, "loss": 0.2191, "loss_nan_ranks": 0, "loss_rank_avg": 0.07238320261240005, "step": 1220, "valid_targets_mean": 3485.9, "valid_targets_min": 830 }, { "epoch": 1.9918699186991868, "grad_norm": 0.5373153715044475, "learning_rate": 3.6005079581079545e-05, "loss": 0.2205, "loss_nan_ranks": 0, "loss_rank_avg": 0.10004070401191711, "step": 1225, "valid_targets_mean": 3992.0, "valid_targets_min": 494 }, { "epoch": 2.0, "grad_norm": 0.49130671620094196, "learning_rate": 3.595631904905406e-05, "loss": 0.235, "loss_nan_ranks": 0, "loss_rank_avg": 0.07893165200948715, "step": 1230, "valid_targets_mean": 3782.1, "valid_targets_min": 1686 }, { "epoch": 2.008130081300813, "grad_norm": 0.6096653945173733, "learning_rate": 3.590729618420255e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.168676495552063, "step": 1235, "valid_targets_mean": 5550.9, "valid_targets_min": 1152 }, { "epoch": 2.016260162601626, "grad_norm": 0.486267941126717, "learning_rate": 3.585801179249452e-05, "loss": 0.1931, "loss_nan_ranks": 0, "loss_rank_avg": 0.06921999901533127, "step": 1240, "valid_targets_mean": 2600.0, "valid_targets_min": 1002 }, { "epoch": 2.024390243902439, "grad_norm": 0.36075225178757375, "learning_rate": 3.5808466684199166e-05, "loss": 0.2136, "loss_nan_ranks": 0, "loss_rank_avg": 0.07709603011608124, "step": 1245, "valid_targets_mean": 6242.2, "valid_targets_min": 2079 }, { "epoch": 2.032520325203252, "grad_norm": 0.5015575667963293, "learning_rate": 3.575866167387204e-05, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.08766970038414001, "step": 1250, "valid_targets_mean": 6274.9, "valid_targets_min": 1542 }, { "epoch": 2.040650406504065, "grad_norm": 0.5329677102018745, "learning_rate": 3.570859758034165e-05, "loss": 0.2026, "loss_nan_ranks": 0, "loss_rank_avg": 0.10257251560688019, "step": 1255, "valid_targets_mean": 3697.9, "valid_targets_min": 1089 }, { "epoch": 2.048780487804878, "grad_norm": 0.407657612500359, "learning_rate": 3.565827522669605e-05, "loss": 0.1916, "loss_nan_ranks": 0, "loss_rank_avg": 0.12750816345214844, "step": 1260, "valid_targets_mean": 8551.9, "valid_targets_min": 1048 }, { "epoch": 2.0569105691056913, "grad_norm": 0.5071880520537156, "learning_rate": 3.5607695440269214e-05, "loss": 0.2069, "loss_nan_ranks": 0, "loss_rank_avg": 0.09404310584068298, "step": 1265, "valid_targets_mean": 3794.0, "valid_targets_min": 860 }, { "epoch": 2.065040650406504, "grad_norm": 0.42913178787653894, "learning_rate": 3.555685905262751e-05, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.1402793526649475, "step": 1270, "valid_targets_mean": 8416.9, "valid_targets_min": 1647 }, { "epoch": 2.073170731707317, "grad_norm": 0.3741576355752387, "learning_rate": 3.5505766899556026e-05, "loss": 0.21, "loss_nan_ranks": 0, "loss_rank_avg": 0.08094493299722672, "step": 1275, "valid_targets_mean": 7083.0, "valid_targets_min": 451 }, { "epoch": 2.08130081300813, "grad_norm": 0.49827679661491187, "learning_rate": 3.5454419821044786e-05, "loss": 0.2092, "loss_nan_ranks": 0, "loss_rank_avg": 0.14759448170661926, "step": 1280, "valid_targets_mean": 5587.4, "valid_targets_min": 1198 }, { "epoch": 2.089430894308943, "grad_norm": 0.6400743430881105, "learning_rate": 3.540281866127496e-05, "loss": 0.2086, "loss_nan_ranks": 0, "loss_rank_avg": 0.05334595590829849, "step": 1285, "valid_targets_mean": 2796.2, "valid_targets_min": 681 }, { "epoch": 2.097560975609756, "grad_norm": 0.5048187645555281, "learning_rate": 3.5350964268605006e-05, "loss": 0.1993, "loss_nan_ranks": 0, "loss_rank_avg": 0.1001671701669693, "step": 1290, "valid_targets_mean": 4451.6, "valid_targets_min": 907 }, { "epoch": 2.105691056910569, "grad_norm": 0.4184546206143324, "learning_rate": 3.5298857495556684e-05, "loss": 0.1964, "loss_nan_ranks": 0, "loss_rank_avg": 0.06665745377540588, "step": 1295, "valid_targets_mean": 3604.9, "valid_targets_min": 691 }, { "epoch": 2.113821138211382, "grad_norm": 0.5625880783856632, "learning_rate": 3.524649919880108e-05, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.16128672659397125, "step": 1300, "valid_targets_mean": 6107.8, "valid_targets_min": 2044 }, { "epoch": 2.1219512195121952, "grad_norm": 0.5336695824686021, "learning_rate": 3.519389023914449e-05, "loss": 0.1907, "loss_nan_ranks": 0, "loss_rank_avg": 0.09741990268230438, "step": 1305, "valid_targets_mean": 5461.4, "valid_targets_min": 1046 }, { "epoch": 2.130081300813008, "grad_norm": 0.4784752346834324, "learning_rate": 3.5141031481514276e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.09999379515647888, "step": 1310, "valid_targets_mean": 4342.1, "valid_targets_min": 980 }, { "epoch": 2.138211382113821, "grad_norm": 0.4230176122307435, "learning_rate": 3.508792379494468e-05, "loss": 0.1989, "loss_nan_ranks": 0, "loss_rank_avg": 0.11121249198913574, "step": 1315, "valid_targets_mean": 7179.1, "valid_targets_min": 2978 }, { "epoch": 2.1463414634146343, "grad_norm": 0.5652067480064321, "learning_rate": 3.503456805256246e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.07307397574186325, "step": 1320, "valid_targets_mean": 3486.0, "valid_targets_min": 1436 }, { "epoch": 2.154471544715447, "grad_norm": 0.4274977353992751, "learning_rate": 3.4980965131572616e-05, "loss": 0.2216, "loss_nan_ranks": 0, "loss_rank_avg": 0.1140279471874237, "step": 1325, "valid_targets_mean": 7104.9, "valid_targets_min": 3123 }, { "epoch": 2.16260162601626, "grad_norm": 0.38536408604434963, "learning_rate": 3.492711591324392e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.11197927594184875, "step": 1330, "valid_targets_mean": 8223.5, "valid_targets_min": 1355 }, { "epoch": 2.1707317073170733, "grad_norm": 0.4891780029787705, "learning_rate": 3.487302128289445e-05, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.06790201365947723, "step": 1335, "valid_targets_mean": 6352.5, "valid_targets_min": 756 }, { "epoch": 2.178861788617886, "grad_norm": 0.4265617210773642, "learning_rate": 3.481868212987702e-05, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.11568331718444824, "step": 1340, "valid_targets_mean": 7652.5, "valid_targets_min": 686 }, { "epoch": 2.186991869918699, "grad_norm": 0.44127630130500006, "learning_rate": 3.476409934756456e-05, "loss": 0.1998, "loss_nan_ranks": 0, "loss_rank_avg": 0.12968169152736664, "step": 1345, "valid_targets_mean": 7471.9, "valid_targets_min": 2830 }, { "epoch": 2.1951219512195124, "grad_norm": 0.5860704749863329, "learning_rate": 3.470927383333544e-05, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.12853296101093292, "step": 1350, "valid_targets_mean": 4670.8, "valid_targets_min": 1837 }, { "epoch": 2.203252032520325, "grad_norm": 0.4431972382892355, "learning_rate": 3.46542064885587e-05, "loss": 0.2, "loss_nan_ranks": 0, "loss_rank_avg": 0.07435105741024017, "step": 1355, "valid_targets_mean": 3843.2, "valid_targets_min": 1789 }, { "epoch": 2.2113821138211383, "grad_norm": 0.44088032105092884, "learning_rate": 3.459889821857926e-05, "loss": 0.1912, "loss_nan_ranks": 0, "loss_rank_avg": 0.1073368489742279, "step": 1360, "valid_targets_mean": 6742.0, "valid_targets_min": 855 }, { "epoch": 2.2195121951219514, "grad_norm": 0.35953157358731014, "learning_rate": 3.4543349932702984e-05, "loss": 0.2012, "loss_nan_ranks": 0, "loss_rank_avg": 0.10705859959125519, "step": 1365, "valid_targets_mean": 9445.9, "valid_targets_min": 2016 }, { "epoch": 2.227642276422764, "grad_norm": 0.5113381602477436, "learning_rate": 3.448756254418179e-05, "loss": 0.2078, "loss_nan_ranks": 0, "loss_rank_avg": 0.09596805274486542, "step": 1370, "valid_targets_mean": 4466.6, "valid_targets_min": 1403 }, { "epoch": 2.2357723577235773, "grad_norm": 0.46251235271924046, "learning_rate": 3.443153697019861e-05, "loss": 0.2212, "loss_nan_ranks": 0, "loss_rank_avg": 0.12127140164375305, "step": 1375, "valid_targets_mean": 6918.5, "valid_targets_min": 3675 }, { "epoch": 2.2439024390243905, "grad_norm": 0.4540722452279749, "learning_rate": 3.437527413185227e-05, "loss": 0.2039, "loss_nan_ranks": 0, "loss_rank_avg": 0.08045300841331482, "step": 1380, "valid_targets_mean": 4948.8, "valid_targets_min": 839 }, { "epoch": 2.252032520325203, "grad_norm": 0.5398814237704406, "learning_rate": 3.431877495414242e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.09723912179470062, "step": 1385, "valid_targets_mean": 3995.0, "valid_targets_min": 542 }, { "epoch": 2.2601626016260163, "grad_norm": 0.43622077951027255, "learning_rate": 3.42620403659543e-05, "loss": 0.1977, "loss_nan_ranks": 0, "loss_rank_avg": 0.09109564125537872, "step": 1390, "valid_targets_mean": 4886.4, "valid_targets_min": 2270 }, { "epoch": 2.2682926829268295, "grad_norm": 0.4780052836341229, "learning_rate": 3.420507130004341e-05, "loss": 0.2134, "loss_nan_ranks": 0, "loss_rank_avg": 0.12145769596099854, "step": 1395, "valid_targets_mean": 6276.2, "valid_targets_min": 1143 }, { "epoch": 2.2764227642276422, "grad_norm": 0.429081273564811, "learning_rate": 3.414786869302029e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.08802617341279984, "step": 1400, "valid_targets_mean": 6404.5, "valid_targets_min": 1532 }, { "epoch": 2.2845528455284554, "grad_norm": 0.7006098276866646, "learning_rate": 3.4090433485334996e-05, "loss": 0.1982, "loss_nan_ranks": 0, "loss_rank_avg": 0.1448991894721985, "step": 1405, "valid_targets_mean": 3894.5, "valid_targets_min": 1613 }, { "epoch": 2.292682926829268, "grad_norm": 0.49226063306323403, "learning_rate": 3.403276662126173e-05, "loss": 0.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.09556463360786438, "step": 1410, "valid_targets_mean": 4234.4, "valid_targets_min": 1103 }, { "epoch": 2.3008130081300813, "grad_norm": 0.4292303582797742, "learning_rate": 3.397486904888328e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.07498009502887726, "step": 1415, "valid_targets_mean": 3567.9, "valid_targets_min": 605 }, { "epoch": 2.3089430894308944, "grad_norm": 0.402683354693791, "learning_rate": 3.391674172007544e-05, "loss": 0.187, "loss_nan_ranks": 0, "loss_rank_avg": 0.10655438899993896, "step": 1420, "valid_targets_mean": 8109.4, "valid_targets_min": 1813 }, { "epoch": 2.317073170731707, "grad_norm": 0.4788551867309091, "learning_rate": 3.3858385590491347e-05, "loss": 0.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.08100958168506622, "step": 1425, "valid_targets_mean": 4947.1, "valid_targets_min": 922 }, { "epoch": 2.3252032520325203, "grad_norm": 0.42966789195428107, "learning_rate": 3.379980161954578e-05, "loss": 0.2068, "loss_nan_ranks": 0, "loss_rank_avg": 0.09635898470878601, "step": 1430, "valid_targets_mean": 7544.0, "valid_targets_min": 1909 }, { "epoch": 2.3333333333333335, "grad_norm": 0.5231607562969665, "learning_rate": 3.3740990770399404e-05, "loss": 0.1911, "loss_nan_ranks": 0, "loss_rank_avg": 0.048967648297548294, "step": 1435, "valid_targets_mean": 2041.6, "valid_targets_min": 840 }, { "epoch": 2.341463414634146, "grad_norm": 0.40935225942983994, "learning_rate": 3.368195400994289e-05, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.12222021073102951, "step": 1440, "valid_targets_mean": 8182.5, "valid_targets_min": 1285 }, { "epoch": 2.3495934959349594, "grad_norm": 0.4083917337873208, "learning_rate": 3.362269230878107e-05, "loss": 0.2083, "loss_nan_ranks": 0, "loss_rank_avg": 0.09421306848526001, "step": 1445, "valid_targets_mean": 6619.4, "valid_targets_min": 1243 }, { "epoch": 2.3577235772357725, "grad_norm": 0.521234806274641, "learning_rate": 3.356320664121694e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.15950816869735718, "step": 1450, "valid_targets_mean": 6547.8, "valid_targets_min": 805 }, { "epoch": 2.3658536585365852, "grad_norm": 0.47460792948559755, "learning_rate": 3.350349798523566e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.09871967136859894, "step": 1455, "valid_targets_mean": 4197.1, "valid_targets_min": 1046 }, { "epoch": 2.3739837398373984, "grad_norm": 0.4487217666661941, "learning_rate": 3.344356732248849e-05, "loss": 0.1961, "loss_nan_ranks": 0, "loss_rank_avg": 0.09437257051467896, "step": 1460, "valid_targets_mean": 4658.2, "valid_targets_min": 1857 }, { "epoch": 2.3821138211382116, "grad_norm": 1.0298594905058047, "learning_rate": 3.33834156382766e-05, "loss": 0.2029, "loss_nan_ranks": 0, "loss_rank_avg": 0.12231095135211945, "step": 1465, "valid_targets_mean": 4875.1, "valid_targets_min": 1533 }, { "epoch": 2.3902439024390243, "grad_norm": 0.543942703465496, "learning_rate": 3.332304392153494e-05, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.11395194381475449, "step": 1470, "valid_targets_mean": 4295.1, "valid_targets_min": 240 }, { "epoch": 2.3983739837398375, "grad_norm": 0.48347940542906515, "learning_rate": 3.326245316481591e-05, "loss": 0.1953, "loss_nan_ranks": 0, "loss_rank_avg": 0.08603271842002869, "step": 1475, "valid_targets_mean": 5712.1, "valid_targets_min": 1533 }, { "epoch": 2.40650406504065, "grad_norm": 0.529322768224568, "learning_rate": 3.320164436427311e-05, "loss": 0.222, "loss_nan_ranks": 0, "loss_rank_avg": 0.14546674489974976, "step": 1480, "valid_targets_mean": 5456.8, "valid_targets_min": 798 }, { "epoch": 2.4146341463414633, "grad_norm": 0.4025185362190621, "learning_rate": 3.314061851964491e-05, "loss": 0.2152, "loss_nan_ranks": 0, "loss_rank_avg": 0.13945616781711578, "step": 1485, "valid_targets_mean": 8392.6, "valid_targets_min": 847 }, { "epoch": 2.4227642276422765, "grad_norm": 0.45832574829489403, "learning_rate": 3.307937663423804e-05, "loss": 0.2148, "loss_nan_ranks": 0, "loss_rank_avg": 0.12582911550998688, "step": 1490, "valid_targets_mean": 5385.4, "valid_targets_min": 743 }, { "epoch": 2.430894308943089, "grad_norm": 0.49440731292197876, "learning_rate": 3.3017919714911094e-05, "loss": 0.2036, "loss_nan_ranks": 0, "loss_rank_avg": 0.10726660490036011, "step": 1495, "valid_targets_mean": 4643.4, "valid_targets_min": 2468 }, { "epoch": 2.4390243902439024, "grad_norm": 0.40136331395370467, "learning_rate": 3.295624877205796e-05, "loss": 0.2101, "loss_nan_ranks": 0, "loss_rank_avg": 0.06084207072854042, "step": 1500, "valid_targets_mean": 5294.8, "valid_targets_min": 233 }, { "epoch": 2.4471544715447155, "grad_norm": 0.5382432440141132, "learning_rate": 3.2894364819591224e-05, "loss": 0.2008, "loss_nan_ranks": 0, "loss_rank_avg": 0.09458312392234802, "step": 1505, "valid_targets_mean": 3362.5, "valid_targets_min": 1147 }, { "epoch": 2.4552845528455283, "grad_norm": 0.527145677762709, "learning_rate": 3.28322688749255e-05, "loss": 0.1944, "loss_nan_ranks": 0, "loss_rank_avg": 0.09245900064706802, "step": 1510, "valid_targets_mean": 4313.1, "valid_targets_min": 1945 }, { "epoch": 2.4634146341463414, "grad_norm": 0.542513461496231, "learning_rate": 3.2769961958960694e-05, "loss": 0.1894, "loss_nan_ranks": 0, "loss_rank_avg": 0.0820431038737297, "step": 1515, "valid_targets_mean": 3790.0, "valid_targets_min": 1595 }, { "epoch": 2.4715447154471546, "grad_norm": 0.43262729398900607, "learning_rate": 3.270744509606523e-05, "loss": 0.2044, "loss_nan_ranks": 0, "loss_rank_avg": 0.1285000741481781, "step": 1520, "valid_targets_mean": 6114.9, "valid_targets_min": 1122 }, { "epoch": 2.4796747967479673, "grad_norm": 0.47951988866409967, "learning_rate": 3.26447193140592e-05, "loss": 0.1987, "loss_nan_ranks": 0, "loss_rank_avg": 0.15053929388523102, "step": 1525, "valid_targets_mean": 6729.1, "valid_targets_min": 1318 }, { "epoch": 2.4878048780487805, "grad_norm": 0.4591921861251178, "learning_rate": 3.2581785644197456e-05, "loss": 0.1879, "loss_nan_ranks": 0, "loss_rank_avg": 0.11216693371534348, "step": 1530, "valid_targets_mean": 5327.1, "valid_targets_min": 1354 }, { "epoch": 2.4959349593495936, "grad_norm": 0.6778821114046177, "learning_rate": 3.251864512115271e-05, "loss": 0.1898, "loss_nan_ranks": 0, "loss_rank_avg": 0.085115946829319, "step": 1535, "valid_targets_mean": 2291.9, "valid_targets_min": 1334 }, { "epoch": 2.5040650406504064, "grad_norm": 0.47109091076267534, "learning_rate": 3.2455298782998424e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.08691582083702087, "step": 1540, "valid_targets_mean": 4806.1, "valid_targets_min": 1110 }, { "epoch": 2.5121951219512195, "grad_norm": 0.49712824331006406, "learning_rate": 3.2391747671191854e-05, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.11779696494340897, "step": 1545, "valid_targets_mean": 4333.4, "valid_targets_min": 925 }, { "epoch": 2.5203252032520327, "grad_norm": 0.5321267904890513, "learning_rate": 3.2327992830556846e-05, "loss": 0.1993, "loss_nan_ranks": 0, "loss_rank_avg": 0.12687452137470245, "step": 1550, "valid_targets_mean": 7064.0, "valid_targets_min": 2171 }, { "epoch": 2.5284552845528454, "grad_norm": 0.4066751905340784, "learning_rate": 3.22640353092667e-05, "loss": 0.2085, "loss_nan_ranks": 0, "loss_rank_avg": 0.08782736957073212, "step": 1555, "valid_targets_mean": 8502.2, "valid_targets_min": 1756 }, { "epoch": 2.5365853658536586, "grad_norm": 0.4934355772738274, "learning_rate": 3.2199876158826915e-05, "loss": 0.1899, "loss_nan_ranks": 0, "loss_rank_avg": 0.0565190389752388, "step": 1560, "valid_targets_mean": 2574.8, "valid_targets_min": 971 }, { "epoch": 2.5447154471544717, "grad_norm": 0.419183504433638, "learning_rate": 3.2135516434057915e-05, "loss": 0.1935, "loss_nan_ranks": 0, "loss_rank_avg": 0.09079393744468689, "step": 1565, "valid_targets_mean": 5667.6, "valid_targets_min": 2330 }, { "epoch": 2.5528455284552845, "grad_norm": 0.5326857645605443, "learning_rate": 3.2070957193077705e-05, "loss": 0.1941, "loss_nan_ranks": 0, "loss_rank_avg": 0.0880943313241005, "step": 1570, "valid_targets_mean": 3525.1, "valid_targets_min": 1269 }, { "epoch": 2.5609756097560976, "grad_norm": 0.4901370161149051, "learning_rate": 3.200619949728448e-05, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.12771451473236084, "step": 1575, "valid_targets_mean": 7970.2, "valid_targets_min": 788 }, { "epoch": 2.569105691056911, "grad_norm": 0.40216340422425895, "learning_rate": 3.194124441133916e-05, "loss": 0.2164, "loss_nan_ranks": 0, "loss_rank_avg": 0.0669591873884201, "step": 1580, "valid_targets_mean": 5408.6, "valid_targets_min": 987 }, { "epoch": 2.5772357723577235, "grad_norm": 0.41866839377080073, "learning_rate": 3.187609300314789e-05, "loss": 0.1912, "loss_nan_ranks": 0, "loss_rank_avg": 0.08089277893304825, "step": 1585, "valid_targets_mean": 5770.2, "valid_targets_min": 1381 }, { "epoch": 2.5853658536585367, "grad_norm": 0.7475178640148638, "learning_rate": 3.181074634384451e-05, "loss": 0.1879, "loss_nan_ranks": 0, "loss_rank_avg": 0.06491148471832275, "step": 1590, "valid_targets_mean": 3679.2, "valid_targets_min": 829 }, { "epoch": 2.59349593495935, "grad_norm": 0.4640334856163724, "learning_rate": 3.1745205507772876e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.1091621071100235, "step": 1595, "valid_targets_mean": 5501.0, "valid_targets_min": 2653 }, { "epoch": 2.6016260162601625, "grad_norm": 0.44111116873044287, "learning_rate": 3.16794715724693e-05, "loss": 0.2148, "loss_nan_ranks": 0, "loss_rank_avg": 0.06696584820747375, "step": 1600, "valid_targets_mean": 4336.1, "valid_targets_min": 1545 }, { "epoch": 2.6097560975609757, "grad_norm": 0.4499024414631357, "learning_rate": 3.161354561864474e-05, "loss": 0.2102, "loss_nan_ranks": 0, "loss_rank_avg": 0.10789573937654495, "step": 1605, "valid_targets_mean": 5973.6, "valid_targets_min": 664 }, { "epoch": 2.617886178861789, "grad_norm": 0.4933602573335838, "learning_rate": 3.154742873016707e-05, "loss": 0.2005, "loss_nan_ranks": 0, "loss_rank_avg": 0.09290064871311188, "step": 1610, "valid_targets_mean": 4232.5, "valid_targets_min": 1197 }, { "epoch": 2.6260162601626016, "grad_norm": 0.4518034316255408, "learning_rate": 3.14811219940433e-05, "loss": 0.216, "loss_nan_ranks": 0, "loss_rank_avg": 0.09312482178211212, "step": 1615, "valid_targets_mean": 4682.0, "valid_targets_min": 673 }, { "epoch": 2.6341463414634148, "grad_norm": 0.469629783014579, "learning_rate": 3.141462650040161e-05, "loss": 0.1907, "loss_nan_ranks": 0, "loss_rank_avg": 0.08355654776096344, "step": 1620, "valid_targets_mean": 6263.6, "valid_targets_min": 801 }, { "epoch": 2.642276422764228, "grad_norm": 0.44206782838213976, "learning_rate": 3.134794334247351e-05, "loss": 0.1999, "loss_nan_ranks": 0, "loss_rank_avg": 0.14838598668575287, "step": 1625, "valid_targets_mean": 7028.2, "valid_targets_min": 1092 }, { "epoch": 2.6504065040650406, "grad_norm": 0.44167859857806796, "learning_rate": 3.1281073616575856e-05, "loss": 0.1941, "loss_nan_ranks": 0, "loss_rank_avg": 0.13126231729984283, "step": 1630, "valid_targets_mean": 6458.9, "valid_targets_min": 1392 }, { "epoch": 2.658536585365854, "grad_norm": 0.9930730490394902, "learning_rate": 3.121401842209279e-05, "loss": 0.1926, "loss_nan_ranks": 0, "loss_rank_avg": 0.1059987023472786, "step": 1635, "valid_targets_mean": 6444.2, "valid_targets_min": 1204 }, { "epoch": 2.6666666666666665, "grad_norm": 0.5264299041430799, "learning_rate": 3.114677886145768e-05, "loss": 0.2032, "loss_nan_ranks": 0, "loss_rank_avg": 0.09932096302509308, "step": 1640, "valid_targets_mean": 3742.2, "valid_targets_min": 575 }, { "epoch": 2.6747967479674797, "grad_norm": 0.46181615275441623, "learning_rate": 3.107935604013501e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.12092652916908264, "step": 1645, "valid_targets_mean": 5040.0, "valid_targets_min": 986 }, { "epoch": 2.682926829268293, "grad_norm": 0.5408363797932924, "learning_rate": 3.101175106660219e-05, "loss": 0.1929, "loss_nan_ranks": 0, "loss_rank_avg": 0.08361901342868805, "step": 1650, "valid_targets_mean": 2857.5, "valid_targets_min": 1017 }, { "epoch": 2.6910569105691056, "grad_norm": 0.5974222781633645, "learning_rate": 3.094396505233135e-05, "loss": 0.2083, "loss_nan_ranks": 0, "loss_rank_avg": 0.10258916765451431, "step": 1655, "valid_targets_mean": 3257.5, "valid_targets_min": 1496 }, { "epoch": 2.6991869918699187, "grad_norm": 0.5934888003376159, "learning_rate": 3.087599911177103e-05, "loss": 0.1861, "loss_nan_ranks": 0, "loss_rank_avg": 0.11051664501428604, "step": 1660, "valid_targets_mean": 5552.6, "valid_targets_min": 2418 }, { "epoch": 2.7073170731707314, "grad_norm": 0.4731850876184984, "learning_rate": 3.0807854362327906e-05, "loss": 0.1811, "loss_nan_ranks": 0, "loss_rank_avg": 0.09753349423408508, "step": 1665, "valid_targets_mean": 4443.4, "valid_targets_min": 1307 }, { "epoch": 2.7154471544715446, "grad_norm": 0.4945326508373184, "learning_rate": 3.073953192434837e-05, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.11155946552753448, "step": 1670, "valid_targets_mean": 4997.1, "valid_targets_min": 1645 }, { "epoch": 2.7235772357723578, "grad_norm": 0.5107912376754389, "learning_rate": 3.067103292110017e-05, "loss": 0.2078, "loss_nan_ranks": 0, "loss_rank_avg": 0.07774278521537781, "step": 1675, "valid_targets_mean": 4761.9, "valid_targets_min": 956 }, { "epoch": 2.7317073170731705, "grad_norm": 0.48586882320037633, "learning_rate": 3.060235847875387e-05, "loss": 0.2141, "loss_nan_ranks": 0, "loss_rank_avg": 0.06829272210597992, "step": 1680, "valid_targets_mean": 4193.4, "valid_targets_min": 933 }, { "epoch": 2.7398373983739837, "grad_norm": 0.5099656045393953, "learning_rate": 3.05335097263644e-05, "loss": 0.1938, "loss_nan_ranks": 0, "loss_rank_avg": 0.15921106934547424, "step": 1685, "valid_targets_mean": 5868.9, "valid_targets_min": 841 }, { "epoch": 2.747967479674797, "grad_norm": 0.5714169725521554, "learning_rate": 3.0464487795852463e-05, "loss": 0.2066, "loss_nan_ranks": 0, "loss_rank_avg": 0.07646902650594711, "step": 1690, "valid_targets_mean": 2782.6, "valid_targets_min": 1153 }, { "epoch": 2.7560975609756095, "grad_norm": 0.4654054786604614, "learning_rate": 3.0395293821985906e-05, "loss": 0.2056, "loss_nan_ranks": 0, "loss_rank_avg": 0.11511363089084625, "step": 1695, "valid_targets_mean": 5739.6, "valid_targets_min": 1507 }, { "epoch": 2.7642276422764227, "grad_norm": 0.5203276245162031, "learning_rate": 3.032592894236112e-05, "loss": 0.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.0801495909690857, "step": 1700, "valid_targets_mean": 2790.5, "valid_targets_min": 978 }, { "epoch": 2.772357723577236, "grad_norm": 0.4278422740839682, "learning_rate": 3.0256394297384273e-05, "loss": 0.187, "loss_nan_ranks": 0, "loss_rank_avg": 0.09725311398506165, "step": 1705, "valid_targets_mean": 5771.8, "valid_targets_min": 1320 }, { "epoch": 2.7804878048780486, "grad_norm": 0.44587369970786395, "learning_rate": 3.0186691030252614e-05, "loss": 0.2016, "loss_nan_ranks": 0, "loss_rank_avg": 0.09690342843532562, "step": 1710, "valid_targets_mean": 5325.9, "valid_targets_min": 1506 }, { "epoch": 2.7886178861788617, "grad_norm": 0.5177722165226661, "learning_rate": 3.0116820286935654e-05, "loss": 0.2203, "loss_nan_ranks": 0, "loss_rank_avg": 0.10034046322107315, "step": 1715, "valid_targets_mean": 3943.9, "valid_targets_min": 1169 }, { "epoch": 2.796747967479675, "grad_norm": 0.4385571953416844, "learning_rate": 3.0046783216156315e-05, "loss": 0.1905, "loss_nan_ranks": 0, "loss_rank_avg": 0.0963803306221962, "step": 1720, "valid_targets_mean": 5634.6, "valid_targets_min": 1159 }, { "epoch": 2.8048780487804876, "grad_norm": 0.52564722394055, "learning_rate": 2.997658096937207e-05, "loss": 0.2055, "loss_nan_ranks": 0, "loss_rank_avg": 0.1279086470603943, "step": 1725, "valid_targets_mean": 4661.8, "valid_targets_min": 972 }, { "epoch": 2.813008130081301, "grad_norm": 0.45833386033090195, "learning_rate": 2.990621470075598e-05, "loss": 0.1964, "loss_nan_ranks": 0, "loss_rank_avg": 0.13034580647945404, "step": 1730, "valid_targets_mean": 7998.8, "valid_targets_min": 1663 }, { "epoch": 2.821138211382114, "grad_norm": 0.4934768700894649, "learning_rate": 2.9835685567177763e-05, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.12494466453790665, "step": 1735, "valid_targets_mean": 4650.6, "valid_targets_min": 730 }, { "epoch": 2.8292682926829267, "grad_norm": 0.5438290668490738, "learning_rate": 2.9764994728184725e-05, "loss": 0.1941, "loss_nan_ranks": 0, "loss_rank_avg": 0.16482070088386536, "step": 1740, "valid_targets_mean": 5444.2, "valid_targets_min": 1124 }, { "epoch": 2.83739837398374, "grad_norm": 0.44567358742187385, "learning_rate": 2.9694143345982732e-05, "loss": 0.205, "loss_nan_ranks": 0, "loss_rank_avg": 0.11280884593725204, "step": 1745, "valid_targets_mean": 7374.9, "valid_targets_min": 1862 }, { "epoch": 2.845528455284553, "grad_norm": 0.6520175731062912, "learning_rate": 2.9623132585417096e-05, "loss": 0.204, "loss_nan_ranks": 0, "loss_rank_avg": 0.1001191958785057, "step": 1750, "valid_targets_mean": 2833.2, "valid_targets_min": 994 }, { "epoch": 2.8536585365853657, "grad_norm": 0.5160489877477896, "learning_rate": 2.9551963613953404e-05, "loss": 0.2031, "loss_nan_ranks": 0, "loss_rank_avg": 0.0647708922624588, "step": 1755, "valid_targets_mean": 2973.1, "valid_targets_min": 1220 }, { "epoch": 2.861788617886179, "grad_norm": 0.497707032437291, "learning_rate": 2.948063760165835e-05, "loss": 0.1913, "loss_nan_ranks": 0, "loss_rank_avg": 0.08599328249692917, "step": 1760, "valid_targets_mean": 3740.5, "valid_targets_min": 1285 }, { "epoch": 2.869918699186992, "grad_norm": 0.5010926535897279, "learning_rate": 2.9409155721180477e-05, "loss": 0.2079, "loss_nan_ranks": 0, "loss_rank_avg": 0.11671507358551025, "step": 1765, "valid_targets_mean": 4664.5, "valid_targets_min": 1330 }, { "epoch": 2.8780487804878048, "grad_norm": 0.521313660684931, "learning_rate": 2.9337519147730918e-05, "loss": 0.1989, "loss_nan_ranks": 0, "loss_rank_avg": 0.11742527782917023, "step": 1770, "valid_targets_mean": 4550.5, "valid_targets_min": 1584 }, { "epoch": 2.886178861788618, "grad_norm": 0.42731259008703787, "learning_rate": 2.9265729059064054e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.06839574873447418, "step": 1775, "valid_targets_mean": 4588.4, "valid_targets_min": 1141 }, { "epoch": 2.894308943089431, "grad_norm": 0.4336731175739462, "learning_rate": 2.9193786635458178e-05, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.11395157873630524, "step": 1780, "valid_targets_mean": 8954.6, "valid_targets_min": 1236 }, { "epoch": 2.902439024390244, "grad_norm": 0.45836128306992324, "learning_rate": 2.912169305969605e-05, "loss": 0.1908, "loss_nan_ranks": 0, "loss_rank_avg": 0.0793212354183197, "step": 1785, "valid_targets_mean": 4813.9, "valid_targets_min": 1453 }, { "epoch": 2.910569105691057, "grad_norm": 0.5242475632918033, "learning_rate": 2.9049449517045497e-05, "loss": 0.1907, "loss_nan_ranks": 0, "loss_rank_avg": 0.10133905708789825, "step": 1790, "valid_targets_mean": 4795.0, "valid_targets_min": 2455 }, { "epoch": 2.91869918699187, "grad_norm": 0.4617766146376155, "learning_rate": 2.89770571952399e-05, "loss": 0.1976, "loss_nan_ranks": 0, "loss_rank_avg": 0.11333787441253662, "step": 1795, "valid_targets_mean": 8331.5, "valid_targets_min": 1699 }, { "epoch": 2.926829268292683, "grad_norm": 0.5105310774218661, "learning_rate": 2.890451728445866e-05, "loss": 0.2024, "loss_nan_ranks": 0, "loss_rank_avg": 0.07548114657402039, "step": 1800, "valid_targets_mean": 2948.1, "valid_targets_min": 835 }, { "epoch": 2.934959349593496, "grad_norm": 0.6293059490890891, "learning_rate": 2.8831830977307644e-05, "loss": 0.2054, "loss_nan_ranks": 0, "loss_rank_avg": 0.19505786895751953, "step": 1805, "valid_targets_mean": 7034.6, "valid_targets_min": 1869 }, { "epoch": 2.943089430894309, "grad_norm": 0.5183400183562941, "learning_rate": 2.8758999468799594e-05, "loss": 0.1899, "loss_nan_ranks": 0, "loss_rank_avg": 0.0845247358083725, "step": 1810, "valid_targets_mean": 3532.0, "valid_targets_min": 1066 }, { "epoch": 2.951219512195122, "grad_norm": 0.6184094809265098, "learning_rate": 2.868602395633444e-05, "loss": 0.2076, "loss_nan_ranks": 0, "loss_rank_avg": 0.05015844851732254, "step": 1815, "valid_targets_mean": 1691.1, "valid_targets_min": 736 }, { "epoch": 2.959349593495935, "grad_norm": 0.45307611653553626, "learning_rate": 2.861290563967965e-05, "loss": 0.1906, "loss_nan_ranks": 0, "loss_rank_avg": 0.16129237413406372, "step": 1820, "valid_targets_mean": 8123.6, "valid_targets_min": 1685 }, { "epoch": 2.9674796747967482, "grad_norm": 0.38101703395338005, "learning_rate": 2.8539645720950474e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.09711259603500366, "step": 1825, "valid_targets_mean": 5972.8, "valid_targets_min": 1171 }, { "epoch": 2.975609756097561, "grad_norm": 0.4635353158231019, "learning_rate": 2.8466245404590226e-05, "loss": 0.2012, "loss_nan_ranks": 0, "loss_rank_avg": 0.13544566929340363, "step": 1830, "valid_targets_mean": 6735.6, "valid_targets_min": 1058 }, { "epoch": 2.983739837398374, "grad_norm": 0.5076819300170817, "learning_rate": 2.8392705897350425e-05, "loss": 0.1936, "loss_nan_ranks": 0, "loss_rank_avg": 0.04716028645634651, "step": 1835, "valid_targets_mean": 2432.6, "valid_targets_min": 960 }, { "epoch": 2.991869918699187, "grad_norm": 0.44233934523750484, "learning_rate": 2.8319028408270983e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.07935938239097595, "step": 1840, "valid_targets_mean": 3761.2, "valid_targets_min": 1845 }, { "epoch": 3.0, "grad_norm": 0.43078759496852226, "learning_rate": 2.8245214148660364e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.08466893434524536, "step": 1845, "valid_targets_mean": 5015.8, "valid_targets_min": 1175 }, { "epoch": 3.008130081300813, "grad_norm": 0.4860108657211595, "learning_rate": 2.8171264332075588e-05, "loss": 0.1968, "loss_nan_ranks": 0, "loss_rank_avg": 0.10784369707107544, "step": 1850, "valid_targets_mean": 6494.8, "valid_targets_min": 1708 }, { "epoch": 3.016260162601626, "grad_norm": 0.5120569455007582, "learning_rate": 2.809718017430236e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.11345131695270538, "step": 1855, "valid_targets_mean": 7375.0, "valid_targets_min": 2308 }, { "epoch": 3.024390243902439, "grad_norm": 0.5339539923625253, "learning_rate": 2.8022962893335023e-05, "loss": 0.1666, "loss_nan_ranks": 0, "loss_rank_avg": 0.07034371793270111, "step": 1860, "valid_targets_mean": 2437.1, "valid_targets_min": 837 }, { "epoch": 3.032520325203252, "grad_norm": 0.5748427139778293, "learning_rate": 2.7948613709356565e-05, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.08655751496553421, "step": 1865, "valid_targets_mean": 3470.6, "valid_targets_min": 785 }, { "epoch": 3.040650406504065, "grad_norm": 0.4561868210128982, "learning_rate": 2.7874133844718557e-05, "loss": 0.1827, "loss_nan_ranks": 0, "loss_rank_avg": 0.07496097683906555, "step": 1870, "valid_targets_mean": 4220.2, "valid_targets_min": 1352 }, { "epoch": 3.048780487804878, "grad_norm": 0.6173888932816397, "learning_rate": 2.7799524523921038e-05, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.09803314507007599, "step": 1875, "valid_targets_mean": 3218.0, "valid_targets_min": 698 }, { "epoch": 3.0569105691056913, "grad_norm": 0.4694678814515231, "learning_rate": 2.77247869735924e-05, "loss": 0.1771, "loss_nan_ranks": 0, "loss_rank_avg": 0.1420827955007553, "step": 1880, "valid_targets_mean": 5605.1, "valid_targets_min": 1354 }, { "epoch": 3.065040650406504, "grad_norm": 0.3908987051556123, "learning_rate": 2.764992242246921e-05, "loss": 0.1685, "loss_nan_ranks": 0, "loss_rank_avg": 0.06274786591529846, "step": 1885, "valid_targets_mean": 6652.4, "valid_targets_min": 1244 }, { "epoch": 3.073170731707317, "grad_norm": 0.5615128427273671, "learning_rate": 2.7574932101376034e-05, "loss": 0.1702, "loss_nan_ranks": 0, "loss_rank_avg": 0.10297388583421707, "step": 1890, "valid_targets_mean": 4293.8, "valid_targets_min": 766 }, { "epoch": 3.08130081300813, "grad_norm": 0.4347419064601247, "learning_rate": 2.749981724320516e-05, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.10179280489683151, "step": 1895, "valid_targets_mean": 6650.6, "valid_targets_min": 1873 }, { "epoch": 3.089430894308943, "grad_norm": 0.36648106399201374, "learning_rate": 2.7424579082896357e-05, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.10221441090106964, "step": 1900, "valid_targets_mean": 10330.4, "valid_targets_min": 638 }, { "epoch": 3.097560975609756, "grad_norm": 0.4124076111320386, "learning_rate": 2.7349218857416587e-05, "loss": 0.184, "loss_nan_ranks": 0, "loss_rank_avg": 0.09633245319128036, "step": 1905, "valid_targets_mean": 7077.1, "valid_targets_min": 2522 }, { "epoch": 3.105691056910569, "grad_norm": 0.4856129912805476, "learning_rate": 2.7273737805739614e-05, "loss": 0.1701, "loss_nan_ranks": 0, "loss_rank_avg": 0.09282836318016052, "step": 1910, "valid_targets_mean": 3699.0, "valid_targets_min": 1432 }, { "epoch": 3.113821138211382, "grad_norm": 0.4794044219507053, "learning_rate": 2.719813716882569e-05, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.06483015418052673, "step": 1915, "valid_targets_mean": 4546.4, "valid_targets_min": 1389 }, { "epoch": 3.1219512195121952, "grad_norm": 0.619089722970813, "learning_rate": 2.7122418189601118e-05, "loss": 0.1811, "loss_nan_ranks": 0, "loss_rank_avg": 0.11483106017112732, "step": 1920, "valid_targets_mean": 3839.5, "valid_targets_min": 1596 }, { "epoch": 3.130081300813008, "grad_norm": 0.6297752293745941, "learning_rate": 2.7046582112937837e-05, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.0702546015381813, "step": 1925, "valid_targets_mean": 2191.4, "valid_targets_min": 1255 }, { "epoch": 3.138211382113821, "grad_norm": 0.6178952616342983, "learning_rate": 2.697063018563295e-05, "loss": 0.1756, "loss_nan_ranks": 0, "loss_rank_avg": 0.09800857305526733, "step": 1930, "valid_targets_mean": 2995.4, "valid_targets_min": 1192 }, { "epoch": 3.1463414634146343, "grad_norm": 0.5727494786404239, "learning_rate": 2.6894563656388217e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.11543776094913483, "step": 1935, "valid_targets_mean": 4811.8, "valid_targets_min": 1378 }, { "epoch": 3.154471544715447, "grad_norm": 0.49131373835412284, "learning_rate": 2.681838377578954e-05, "loss": 0.1917, "loss_nan_ranks": 0, "loss_rank_avg": 0.15042293071746826, "step": 1940, "valid_targets_mean": 7221.5, "valid_targets_min": 899 }, { "epoch": 3.16260162601626, "grad_norm": 0.4755416637163348, "learning_rate": 2.6742091796286388e-05, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.06937994807958603, "step": 1945, "valid_targets_mean": 4864.8, "valid_targets_min": 862 }, { "epoch": 3.1707317073170733, "grad_norm": 0.5058451616208286, "learning_rate": 2.6665688972171215e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.08511316776275635, "step": 1950, "valid_targets_mean": 4464.4, "valid_targets_min": 1003 }, { "epoch": 3.178861788617886, "grad_norm": 0.7358076121095269, "learning_rate": 2.658917655955884e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.1269768923521042, "step": 1955, "valid_targets_mean": 4176.8, "valid_targets_min": 666 }, { "epoch": 3.186991869918699, "grad_norm": 0.5253173738845284, "learning_rate": 2.651255581636578e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.07415660470724106, "step": 1960, "valid_targets_mean": 2948.5, "valid_targets_min": 857 }, { "epoch": 3.1951219512195124, "grad_norm": 0.42428482976175114, "learning_rate": 2.6435828002289596e-05, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.05891459435224533, "step": 1965, "valid_targets_mean": 5228.0, "valid_targets_min": 797 }, { "epoch": 3.203252032520325, "grad_norm": 0.38192452477981753, "learning_rate": 2.6358994378788163e-05, "loss": 0.1917, "loss_nan_ranks": 0, "loss_rank_avg": 0.10647241026163101, "step": 1970, "valid_targets_mean": 9946.2, "valid_targets_min": 867 }, { "epoch": 3.2113821138211383, "grad_norm": 0.579008811186245, "learning_rate": 2.6282056209058936e-05, "loss": 0.2015, "loss_nan_ranks": 0, "loss_rank_avg": 0.12035466730594635, "step": 1975, "valid_targets_mean": 3877.4, "valid_targets_min": 830 }, { "epoch": 3.2195121951219514, "grad_norm": 0.5686842217747077, "learning_rate": 2.6205014758018176e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.1187640056014061, "step": 1980, "valid_targets_mean": 4403.0, "valid_targets_min": 1338 }, { "epoch": 3.227642276422764, "grad_norm": 0.6255511264003251, "learning_rate": 2.6127871292280165e-05, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.11581926792860031, "step": 1985, "valid_targets_mean": 7522.9, "valid_targets_min": 463 }, { "epoch": 3.2357723577235773, "grad_norm": 0.4687293252671812, "learning_rate": 2.6050627080136376e-05, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.10452213883399963, "step": 1990, "valid_targets_mean": 6076.9, "valid_targets_min": 750 }, { "epoch": 3.2439024390243905, "grad_norm": 0.41434615118758467, "learning_rate": 2.5973283391534615e-05, "loss": 0.1818, "loss_nan_ranks": 0, "loss_rank_avg": 0.10657718777656555, "step": 1995, "valid_targets_mean": 8722.5, "valid_targets_min": 291 }, { "epoch": 3.252032520325203, "grad_norm": 0.5526274725533402, "learning_rate": 2.589584149805817e-05, "loss": 0.1876, "loss_nan_ranks": 0, "loss_rank_avg": 0.12291304767131805, "step": 2000, "valid_targets_mean": 4717.1, "valid_targets_min": 1197 }, { "epoch": 3.2601626016260163, "grad_norm": 0.44820414968833555, "learning_rate": 2.581830267290486e-05, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.14701004326343536, "step": 2005, "valid_targets_mean": 7174.9, "valid_targets_min": 841 }, { "epoch": 3.2682926829268295, "grad_norm": 0.5790502157747228, "learning_rate": 2.574066819086613e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.09761584550142288, "step": 2010, "valid_targets_mean": 5652.6, "valid_targets_min": 233 }, { "epoch": 3.2764227642276422, "grad_norm": 0.43237790933709264, "learning_rate": 2.5662939328306113e-05, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.07850054651498795, "step": 2015, "valid_targets_mean": 4159.8, "valid_targets_min": 388 }, { "epoch": 3.2845528455284554, "grad_norm": 0.49724922196897114, "learning_rate": 2.5585117363140592e-05, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.09476260840892792, "step": 2020, "valid_targets_mean": 5778.5, "valid_targets_min": 1467 }, { "epoch": 3.292682926829268, "grad_norm": 0.6270117629616863, "learning_rate": 2.5507203574816043e-05, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.11406762897968292, "step": 2025, "valid_targets_mean": 3870.1, "valid_targets_min": 1122 }, { "epoch": 3.3008130081300813, "grad_norm": 0.6109512933369908, "learning_rate": 2.542919924428856e-05, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.0836646631360054, "step": 2030, "valid_targets_mean": 2958.4, "valid_targets_min": 1654 }, { "epoch": 3.3089430894308944, "grad_norm": 0.40973824874897186, "learning_rate": 2.5351105654002838e-05, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.07277525961399078, "step": 2035, "valid_targets_mean": 5359.0, "valid_targets_min": 1418 }, { "epoch": 3.317073170731707, "grad_norm": 0.5260738962113803, "learning_rate": 2.527292408787104e-05, "loss": 0.1725, "loss_nan_ranks": 0, "loss_rank_avg": 0.06306485831737518, "step": 2040, "valid_targets_mean": 3337.9, "valid_targets_min": 734 }, { "epoch": 3.3252032520325203, "grad_norm": 0.5956396156166147, "learning_rate": 2.5194655831251712e-05, "loss": 0.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.09417542815208435, "step": 2045, "valid_targets_mean": 3043.8, "valid_targets_min": 1545 }, { "epoch": 3.3333333333333335, "grad_norm": 0.5622512014506079, "learning_rate": 2.5116302170928678e-05, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.07839909940958023, "step": 2050, "valid_targets_mean": 2741.2, "valid_targets_min": 1645 }, { "epoch": 3.341463414634146, "grad_norm": 0.4871142757561353, "learning_rate": 2.5037864395089822e-05, "loss": 0.1963, "loss_nan_ranks": 0, "loss_rank_avg": 0.059922538697719574, "step": 2055, "valid_targets_mean": 4419.2, "valid_targets_min": 925 }, { "epoch": 3.3495934959349594, "grad_norm": 0.4049788216003715, "learning_rate": 2.495934379330597e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.11351704597473145, "step": 2060, "valid_targets_mean": 8152.6, "valid_targets_min": 1552 }, { "epoch": 3.3577235772357725, "grad_norm": 0.5008713329185713, "learning_rate": 2.4880741656509656e-05, "loss": 0.1661, "loss_nan_ranks": 0, "loss_rank_avg": 0.12235702574253082, "step": 2065, "valid_targets_mean": 5287.2, "valid_targets_min": 1702 }, { "epoch": 3.3658536585365852, "grad_norm": 0.7136278141438792, "learning_rate": 2.4802059276973904e-05, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.10800117254257202, "step": 2070, "valid_targets_mean": 6376.0, "valid_targets_min": 750 }, { "epoch": 3.3739837398373984, "grad_norm": 0.6002242896884902, "learning_rate": 2.4723297948290982e-05, "loss": 0.1709, "loss_nan_ranks": 0, "loss_rank_avg": 0.10379073023796082, "step": 2075, "valid_targets_mean": 5667.2, "valid_targets_min": 1926 }, { "epoch": 3.3821138211382116, "grad_norm": 0.4807410385054655, "learning_rate": 2.464445896535113e-05, "loss": 0.1738, "loss_nan_ranks": 0, "loss_rank_avg": 0.0718056783080101, "step": 2080, "valid_targets_mean": 4393.0, "valid_targets_min": 829 }, { "epoch": 3.3902439024390243, "grad_norm": 0.45867338917020517, "learning_rate": 2.45655436243213e-05, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.10537977516651154, "step": 2085, "valid_targets_mean": 6258.0, "valid_targets_min": 1649 }, { "epoch": 3.3983739837398375, "grad_norm": 0.48896653885329444, "learning_rate": 2.44865532226238e-05, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.04254530370235443, "step": 2090, "valid_targets_mean": 2209.1, "valid_targets_min": 574 }, { "epoch": 3.40650406504065, "grad_norm": 0.4944998614218492, "learning_rate": 2.4407489058915004e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.15449640154838562, "step": 2095, "valid_targets_mean": 6770.5, "valid_targets_min": 2389 }, { "epoch": 3.4146341463414633, "grad_norm": 0.44912065588969774, "learning_rate": 2.4328352433063966e-05, "loss": 0.1809, "loss_nan_ranks": 0, "loss_rank_avg": 0.09958087652921677, "step": 2100, "valid_targets_mean": 6547.4, "valid_targets_min": 2736 }, { "epoch": 3.4227642276422765, "grad_norm": 0.41866012759872706, "learning_rate": 2.4249144646131083e-05, "loss": 0.1726, "loss_nan_ranks": 0, "loss_rank_avg": 0.10285385698080063, "step": 2105, "valid_targets_mean": 7321.2, "valid_targets_min": 1648 }, { "epoch": 3.430894308943089, "grad_norm": 0.5636871438809098, "learning_rate": 2.4169867000346684e-05, "loss": 0.1768, "loss_nan_ranks": 0, "loss_rank_avg": 0.06892851740121841, "step": 2110, "valid_targets_mean": 2981.8, "valid_targets_min": 1422 }, { "epoch": 3.4390243902439024, "grad_norm": 0.5114749746088917, "learning_rate": 2.4090520799089612e-05, "loss": 0.1808, "loss_nan_ranks": 0, "loss_rank_avg": 0.06464049220085144, "step": 2115, "valid_targets_mean": 2943.0, "valid_targets_min": 716 }, { "epoch": 3.4471544715447155, "grad_norm": 0.5066187203778031, "learning_rate": 2.4011107346865844e-05, "loss": 0.1729, "loss_nan_ranks": 0, "loss_rank_avg": 0.07400400936603546, "step": 2120, "valid_targets_mean": 5502.4, "valid_targets_min": 1108 }, { "epoch": 3.4552845528455283, "grad_norm": 0.4840604889659389, "learning_rate": 2.393162794928697e-05, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.08897733688354492, "step": 2125, "valid_targets_mean": 5101.5, "valid_targets_min": 1130 }, { "epoch": 3.4634146341463414, "grad_norm": 0.5527474859781538, "learning_rate": 2.385208391304879e-05, "loss": 0.1735, "loss_nan_ranks": 0, "loss_rank_avg": 0.0687088817358017, "step": 2130, "valid_targets_mean": 2945.8, "valid_targets_min": 785 }, { "epoch": 3.4715447154471546, "grad_norm": 0.4600845353035065, "learning_rate": 2.3772476545909794e-05, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.07164815813302994, "step": 2135, "valid_targets_mean": 3378.8, "valid_targets_min": 362 }, { "epoch": 3.4796747967479673, "grad_norm": 0.4230724684550869, "learning_rate": 2.3692807156669684e-05, "loss": 0.1759, "loss_nan_ranks": 0, "loss_rank_avg": 0.09702588617801666, "step": 2140, "valid_targets_mean": 6767.8, "valid_targets_min": 2145 }, { "epoch": 3.4878048780487805, "grad_norm": 0.5382239076136307, "learning_rate": 2.3613077055147855e-05, "loss": 0.1715, "loss_nan_ranks": 0, "loss_rank_avg": 0.0891718715429306, "step": 2145, "valid_targets_mean": 3512.0, "valid_targets_min": 1287 }, { "epoch": 3.4959349593495936, "grad_norm": 0.5119342452083689, "learning_rate": 2.3533287552161833e-05, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.06562502682209015, "step": 2150, "valid_targets_mean": 3547.9, "valid_targets_min": 759 }, { "epoch": 3.5040650406504064, "grad_norm": 0.4166846629033683, "learning_rate": 2.345343995950577e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.07943867146968842, "step": 2155, "valid_targets_mean": 6276.5, "valid_targets_min": 1527 }, { "epoch": 3.5121951219512195, "grad_norm": 0.4289981629755304, "learning_rate": 2.3373535589928827e-05, "loss": 0.1975, "loss_nan_ranks": 0, "loss_rank_avg": 0.14399868249893188, "step": 2160, "valid_targets_mean": 9145.0, "valid_targets_min": 2069 }, { "epoch": 3.5203252032520327, "grad_norm": 0.5028339624985111, "learning_rate": 2.3293575757113635e-05, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.051561854779720306, "step": 2165, "valid_targets_mean": 2878.8, "valid_targets_min": 609 }, { "epoch": 3.5284552845528454, "grad_norm": 0.5348210854829778, "learning_rate": 2.3213561775654678e-05, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.07135885953903198, "step": 2170, "valid_targets_mean": 3753.4, "valid_targets_min": 842 }, { "epoch": 3.5365853658536586, "grad_norm": 0.4484634908758471, "learning_rate": 2.3133494961036655e-05, "loss": 0.1771, "loss_nan_ranks": 0, "loss_rank_avg": 0.11038084328174591, "step": 2175, "valid_targets_mean": 6385.5, "valid_targets_min": 1352 }, { "epoch": 3.5447154471544717, "grad_norm": 0.40416038511592794, "learning_rate": 2.305337662961292e-05, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.07623428106307983, "step": 2180, "valid_targets_mean": 3816.5, "valid_targets_min": 1761 }, { "epoch": 3.5528455284552845, "grad_norm": 0.5501649001520341, "learning_rate": 2.2973208098583767e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.12985031306743622, "step": 2185, "valid_targets_mean": 4583.2, "valid_targets_min": 2034 }, { "epoch": 3.5609756097560976, "grad_norm": 0.4539626972348566, "learning_rate": 2.2892990685974815e-05, "loss": 0.1812, "loss_nan_ranks": 0, "loss_rank_avg": 0.07589904218912125, "step": 2190, "valid_targets_mean": 3840.2, "valid_targets_min": 756 }, { "epoch": 3.569105691056911, "grad_norm": 0.4747779712686265, "learning_rate": 2.2812725710615328e-05, "loss": 0.1827, "loss_nan_ranks": 0, "loss_rank_avg": 0.11916742473840714, "step": 2195, "valid_targets_mean": 6800.1, "valid_targets_min": 1288 }, { "epoch": 3.5772357723577235, "grad_norm": 0.4078543423987889, "learning_rate": 2.2732414492116538e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.07764068990945816, "step": 2200, "valid_targets_mean": 6178.2, "valid_targets_min": 1869 }, { "epoch": 3.5853658536585367, "grad_norm": 0.43958544173804026, "learning_rate": 2.2652058350849955e-05, "loss": 0.1736, "loss_nan_ranks": 0, "loss_rank_avg": 0.07077381014823914, "step": 2205, "valid_targets_mean": 5291.6, "valid_targets_min": 2369 }, { "epoch": 3.59349593495935, "grad_norm": 0.524371110454708, "learning_rate": 2.2571658607925624e-05, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.09251520782709122, "step": 2210, "valid_targets_mean": 5542.8, "valid_targets_min": 1796 }, { "epoch": 3.6016260162601625, "grad_norm": 0.4560634702353269, "learning_rate": 2.2491216585170458e-05, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.08693362772464752, "step": 2215, "valid_targets_mean": 4975.4, "valid_targets_min": 1569 }, { "epoch": 3.6097560975609757, "grad_norm": 0.5173837967492884, "learning_rate": 2.2410733605106462e-05, "loss": 0.1868, "loss_nan_ranks": 0, "loss_rank_avg": 0.10831189155578613, "step": 2220, "valid_targets_mean": 5082.9, "valid_targets_min": 2070 }, { "epoch": 3.617886178861789, "grad_norm": 0.4668209301127543, "learning_rate": 2.233021099092902e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.11751365661621094, "step": 2225, "valid_targets_mean": 9244.8, "valid_targets_min": 1042 }, { "epoch": 3.6260162601626016, "grad_norm": 0.5693999377012714, "learning_rate": 2.224965006648512e-05, "loss": 0.1756, "loss_nan_ranks": 0, "loss_rank_avg": 0.052777741104364395, "step": 2230, "valid_targets_mean": 2239.2, "valid_targets_min": 833 }, { "epoch": 3.6341463414634148, "grad_norm": 0.6505764275109728, "learning_rate": 2.2169052156251585e-05, "loss": 0.1852, "loss_nan_ranks": 0, "loss_rank_avg": 0.11289471387863159, "step": 2235, "valid_targets_mean": 3590.2, "valid_targets_min": 947 }, { "epoch": 3.642276422764228, "grad_norm": 0.4481036228632104, "learning_rate": 2.2088418585313346e-05, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.06705661863088608, "step": 2240, "valid_targets_mean": 5500.2, "valid_targets_min": 1208 }, { "epoch": 3.6504065040650406, "grad_norm": 0.5003706870721794, "learning_rate": 2.200775067934158e-05, "loss": 0.1739, "loss_nan_ranks": 0, "loss_rank_avg": 0.08790750801563263, "step": 2245, "valid_targets_mean": 4177.6, "valid_targets_min": 1421 }, { "epoch": 3.658536585365854, "grad_norm": 0.9256659259454979, "learning_rate": 2.192704976457198e-05, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.07639472186565399, "step": 2250, "valid_targets_mean": 5159.0, "valid_targets_min": 1681 }, { "epoch": 3.6666666666666665, "grad_norm": 0.5108219589731426, "learning_rate": 2.1846317167782923e-05, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.11740477383136749, "step": 2255, "valid_targets_mean": 6264.1, "valid_targets_min": 2484 }, { "epoch": 3.6747967479674797, "grad_norm": 0.45206400769038635, "learning_rate": 2.1765554216273652e-05, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.14643417298793793, "step": 2260, "valid_targets_mean": 8674.5, "valid_targets_min": 1957 }, { "epoch": 3.682926829268293, "grad_norm": 0.560565677738584, "learning_rate": 2.1684762237842466e-05, "loss": 0.193, "loss_nan_ranks": 0, "loss_rank_avg": 0.1252707540988922, "step": 2265, "valid_targets_mean": 5350.6, "valid_targets_min": 1199 }, { "epoch": 3.6910569105691056, "grad_norm": 0.5311151357253606, "learning_rate": 2.1603942560764884e-05, "loss": 0.1813, "loss_nan_ranks": 0, "loss_rank_avg": 0.09429627656936646, "step": 2270, "valid_targets_mean": 3556.2, "valid_targets_min": 1123 }, { "epoch": 3.6991869918699187, "grad_norm": 0.44734635595305705, "learning_rate": 2.1523096513771825e-05, "loss": 0.1771, "loss_nan_ranks": 0, "loss_rank_avg": 0.08364763855934143, "step": 2275, "valid_targets_mean": 5456.5, "valid_targets_min": 1764 }, { "epoch": 3.7073170731707314, "grad_norm": 0.5146727081454273, "learning_rate": 2.1442225426027724e-05, "loss": 0.1765, "loss_nan_ranks": 0, "loss_rank_avg": 0.08693309128284454, "step": 2280, "valid_targets_mean": 4708.5, "valid_targets_min": 1098 }, { "epoch": 3.7154471544715446, "grad_norm": 0.5834305426991228, "learning_rate": 2.1361330627108724e-05, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.0817655622959137, "step": 2285, "valid_targets_mean": 3087.0, "valid_targets_min": 1033 }, { "epoch": 3.7235772357723578, "grad_norm": 0.43470760894780036, "learning_rate": 2.128041344698078e-05, "loss": 0.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.06693185865879059, "step": 2290, "valid_targets_mean": 4628.4, "valid_targets_min": 927 }, { "epoch": 3.7317073170731705, "grad_norm": 0.4346074290355755, "learning_rate": 2.1199475215977817e-05, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.08805598318576813, "step": 2295, "valid_targets_mean": 6400.4, "valid_targets_min": 1493 }, { "epoch": 3.7398373983739837, "grad_norm": 0.5969283504567086, "learning_rate": 2.1118517264779858e-05, "loss": 0.2017, "loss_nan_ranks": 0, "loss_rank_avg": 0.14364033937454224, "step": 2300, "valid_targets_mean": 4503.9, "valid_targets_min": 896 }, { "epoch": 3.747967479674797, "grad_norm": 0.5105693055196588, "learning_rate": 2.103754092439112e-05, "loss": 0.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.0883859246969223, "step": 2305, "valid_targets_mean": 4250.9, "valid_targets_min": 1489 }, { "epoch": 3.7560975609756095, "grad_norm": 0.6280552169336109, "learning_rate": 2.095654752611817e-05, "loss": 0.1684, "loss_nan_ranks": 0, "loss_rank_avg": 0.06845687329769135, "step": 2310, "valid_targets_mean": 2946.6, "valid_targets_min": 1335 }, { "epoch": 3.7642276422764227, "grad_norm": 0.45744630161207034, "learning_rate": 2.087553840154801e-05, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.09981508553028107, "step": 2315, "valid_targets_mean": 6651.8, "valid_targets_min": 756 }, { "epoch": 3.772357723577236, "grad_norm": 0.5878109298912522, "learning_rate": 2.0794514882526196e-05, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.12705446779727936, "step": 2320, "valid_targets_mean": 5654.0, "valid_targets_min": 1165 }, { "epoch": 3.7804878048780486, "grad_norm": 0.5309395695248087, "learning_rate": 2.0713478301134935e-05, "loss": 0.1723, "loss_nan_ranks": 0, "loss_rank_avg": 0.06934012472629547, "step": 2325, "valid_targets_mean": 3270.4, "valid_targets_min": 1317 }, { "epoch": 3.7886178861788617, "grad_norm": 0.493345912359992, "learning_rate": 2.063242998967118e-05, "loss": 0.1751, "loss_nan_ranks": 0, "loss_rank_avg": 0.09545746445655823, "step": 2330, "valid_targets_mean": 4757.8, "valid_targets_min": 650 }, { "epoch": 3.796747967479675, "grad_norm": 0.36419247146022254, "learning_rate": 2.0551371280624758e-05, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.09308013319969177, "step": 2335, "valid_targets_mean": 9551.9, "valid_targets_min": 2129 }, { "epoch": 3.8048780487804876, "grad_norm": 0.5181442644465611, "learning_rate": 2.0470303506656414e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.11358301341533661, "step": 2340, "valid_targets_mean": 5998.6, "valid_targets_min": 1267 }, { "epoch": 3.813008130081301, "grad_norm": 0.47097767672036994, "learning_rate": 2.0389228000575953e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.08462050557136536, "step": 2345, "valid_targets_mean": 4959.8, "valid_targets_min": 2117 }, { "epoch": 3.821138211382114, "grad_norm": 0.47071219942130765, "learning_rate": 2.0308146095320275e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.11598730087280273, "step": 2350, "valid_targets_mean": 6695.8, "valid_targets_min": 339 }, { "epoch": 3.8292682926829267, "grad_norm": 0.5641637331957085, "learning_rate": 2.0227059123931504e-05, "loss": 0.1688, "loss_nan_ranks": 0, "loss_rank_avg": 0.10073170065879822, "step": 2355, "valid_targets_mean": 4870.9, "valid_targets_min": 1993 }, { "epoch": 3.83739837398374, "grad_norm": 0.392563787267517, "learning_rate": 2.0145968419535045e-05, "loss": 0.1738, "loss_nan_ranks": 0, "loss_rank_avg": 0.12700442969799042, "step": 2360, "valid_targets_mean": 12199.5, "valid_targets_min": 2482 }, { "epoch": 3.845528455284553, "grad_norm": 0.4051664340705014, "learning_rate": 2.0064875315317674e-05, "loss": 0.1884, "loss_nan_ranks": 0, "loss_rank_avg": 0.09100687503814697, "step": 2365, "valid_targets_mean": 6205.1, "valid_targets_min": 1877 }, { "epoch": 3.8536585365853657, "grad_norm": 0.5519491156286782, "learning_rate": 1.998378114450565e-05, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.09894944727420807, "step": 2370, "valid_targets_mean": 4669.1, "valid_targets_min": 1261 }, { "epoch": 3.861788617886179, "grad_norm": 0.4807020743059233, "learning_rate": 1.9902687240342722e-05, "loss": 0.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.12336129695177078, "step": 2375, "valid_targets_mean": 6729.0, "valid_targets_min": 887 }, { "epoch": 3.869918699186992, "grad_norm": 0.4498434646188361, "learning_rate": 1.982159493606829e-05, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.07332796603441238, "step": 2380, "valid_targets_mean": 4932.2, "valid_targets_min": 1174 }, { "epoch": 3.8780487804878048, "grad_norm": 0.7283797265957421, "learning_rate": 1.9740505564895436e-05, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.09400719404220581, "step": 2385, "valid_targets_mean": 2918.2, "valid_targets_min": 1062 }, { "epoch": 3.886178861788618, "grad_norm": 0.46387280257048363, "learning_rate": 1.9659420459989026e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.08546875417232513, "step": 2390, "valid_targets_mean": 5171.4, "valid_targets_min": 1627 }, { "epoch": 3.894308943089431, "grad_norm": 0.3765452056233428, "learning_rate": 1.9578340954443784e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.08869325369596481, "step": 2395, "valid_targets_mean": 9414.5, "valid_targets_min": 1812 }, { "epoch": 3.902439024390244, "grad_norm": 0.5090421831820953, "learning_rate": 1.949726838126237e-05, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.0852435827255249, "step": 2400, "valid_targets_mean": 4212.0, "valid_targets_min": 839 }, { "epoch": 3.910569105691057, "grad_norm": 0.4823014775049168, "learning_rate": 1.941620407333347e-05, "loss": 0.1644, "loss_nan_ranks": 0, "loss_rank_avg": 0.09680739790201187, "step": 2405, "valid_targets_mean": 4952.6, "valid_targets_min": 1350 }, { "epoch": 3.91869918699187, "grad_norm": 0.47944122003508816, "learning_rate": 1.933514936340991e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.077955462038517, "step": 2410, "valid_targets_mean": 5786.6, "valid_targets_min": 1363 }, { "epoch": 3.926829268292683, "grad_norm": 0.49657290110070973, "learning_rate": 1.9254105584086683e-05, "loss": 0.1729, "loss_nan_ranks": 0, "loss_rank_avg": 0.1016269102692604, "step": 2415, "valid_targets_mean": 6280.5, "valid_targets_min": 827 }, { "epoch": 3.934959349593496, "grad_norm": 0.43004078923554034, "learning_rate": 1.9173074067779102e-05, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.09187685698270798, "step": 2420, "valid_targets_mean": 6853.8, "valid_targets_min": 1243 }, { "epoch": 3.943089430894309, "grad_norm": 0.4875377143239527, "learning_rate": 1.9092056146700844e-05, "loss": 0.1928, "loss_nan_ranks": 0, "loss_rank_avg": 0.12033165246248245, "step": 2425, "valid_targets_mean": 6599.9, "valid_targets_min": 2758 }, { "epoch": 3.951219512195122, "grad_norm": 0.5360225532620421, "learning_rate": 1.9011053152842087e-05, "loss": 0.1803, "loss_nan_ranks": 0, "loss_rank_avg": 0.07047030329704285, "step": 2430, "valid_targets_mean": 4145.9, "valid_targets_min": 940 }, { "epoch": 3.959349593495935, "grad_norm": 0.42880198360513266, "learning_rate": 1.89300664179476e-05, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.04297485202550888, "step": 2435, "valid_targets_mean": 2505.9, "valid_targets_min": 907 }, { "epoch": 3.9674796747967482, "grad_norm": 0.46450077619291974, "learning_rate": 1.8849097273494827e-05, "loss": 0.1801, "loss_nan_ranks": 0, "loss_rank_avg": 0.09664749354124069, "step": 2440, "valid_targets_mean": 5649.5, "valid_targets_min": 1677 }, { "epoch": 3.975609756097561, "grad_norm": 0.5447369663169432, "learning_rate": 1.8768147050672028e-05, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.10617190599441528, "step": 2445, "valid_targets_mean": 3496.9, "valid_targets_min": 687 }, { "epoch": 3.983739837398374, "grad_norm": 0.4717452738988299, "learning_rate": 1.8687217080356365e-05, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.1073131114244461, "step": 2450, "valid_targets_mean": 5925.9, "valid_targets_min": 1798 }, { "epoch": 3.991869918699187, "grad_norm": 0.5298316474382961, "learning_rate": 1.8606308693092035e-05, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.08571353554725647, "step": 2455, "valid_targets_mean": 3527.1, "valid_targets_min": 1130 }, { "epoch": 4.0, "grad_norm": 0.5458029010216223, "learning_rate": 1.8525423219068423e-05, "loss": 0.1711, "loss_nan_ranks": 0, "loss_rank_avg": 0.04789840430021286, "step": 2460, "valid_targets_mean": 2188.4, "valid_targets_min": 1152 }, { "epoch": 4.008130081300813, "grad_norm": 0.470355035275389, "learning_rate": 1.844456198809817e-05, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.0760560929775238, "step": 2465, "valid_targets_mean": 3593.5, "valid_targets_min": 1344 }, { "epoch": 4.016260162601626, "grad_norm": 0.47451087233623207, "learning_rate": 1.8363726329595356e-05, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.09951330721378326, "step": 2470, "valid_targets_mean": 5804.1, "valid_targets_min": 1060 }, { "epoch": 4.024390243902439, "grad_norm": 0.49642244775827304, "learning_rate": 1.828291757255364e-05, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.10721617937088013, "step": 2475, "valid_targets_mean": 8417.1, "valid_targets_min": 2637 }, { "epoch": 4.032520325203252, "grad_norm": 0.4775902100045484, "learning_rate": 1.8202137045524383e-05, "loss": 0.1644, "loss_nan_ranks": 0, "loss_rank_avg": 0.06014365702867508, "step": 2480, "valid_targets_mean": 3867.4, "valid_targets_min": 1246 }, { "epoch": 4.040650406504065, "grad_norm": 0.5267371803662289, "learning_rate": 1.812138607659486e-05, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.066822849214077, "step": 2485, "valid_targets_mean": 4648.4, "valid_targets_min": 2692 }, { "epoch": 4.048780487804878, "grad_norm": 0.5202276524445878, "learning_rate": 1.8040665993366355e-05, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.055022526532411575, "step": 2490, "valid_targets_mean": 3872.0, "valid_targets_min": 1124 }, { "epoch": 4.056910569105691, "grad_norm": 0.4822833273017539, "learning_rate": 1.795997812293239e-05, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.06273403018712997, "step": 2495, "valid_targets_mean": 4760.5, "valid_targets_min": 1233 }, { "epoch": 4.065040650406504, "grad_norm": 0.5106660254136155, "learning_rate": 1.7879323791856875e-05, "loss": 0.168, "loss_nan_ranks": 0, "loss_rank_avg": 0.05794154107570648, "step": 2500, "valid_targets_mean": 3971.8, "valid_targets_min": 940 }, { "epoch": 4.073170731707317, "grad_norm": 0.41398244903576503, "learning_rate": 1.7798704326152317e-05, "loss": 0.1564, "loss_nan_ranks": 0, "loss_rank_avg": 0.04327961057424545, "step": 2505, "valid_targets_mean": 3299.6, "valid_targets_min": 912 }, { "epoch": 4.08130081300813, "grad_norm": 0.4766202632898315, "learning_rate": 1.7718121051258016e-05, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.07671961933374405, "step": 2510, "valid_targets_mean": 6943.2, "valid_targets_min": 1406 }, { "epoch": 4.0894308943089435, "grad_norm": 0.4876408535651927, "learning_rate": 1.763757529201826e-05, "loss": 0.1417, "loss_nan_ranks": 0, "loss_rank_avg": 0.05827348679304123, "step": 2515, "valid_targets_mean": 4735.4, "valid_targets_min": 992 }, { "epoch": 4.097560975609756, "grad_norm": 0.5060801606705408, "learning_rate": 1.7557068372660562e-05, "loss": 0.1614, "loss_nan_ranks": 0, "loss_rank_avg": 0.09068716317415237, "step": 2520, "valid_targets_mean": 5210.0, "valid_targets_min": 1814 }, { "epoch": 4.105691056910569, "grad_norm": 0.5171104110449606, "learning_rate": 1.747660161677387e-05, "loss": 0.1684, "loss_nan_ranks": 0, "loss_rank_avg": 0.10956168174743652, "step": 2525, "valid_targets_mean": 6051.6, "valid_targets_min": 1609 }, { "epoch": 4.1138211382113825, "grad_norm": 0.4524889973073697, "learning_rate": 1.7396176347286838e-05, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.06161228567361832, "step": 2530, "valid_targets_mean": 4905.6, "valid_targets_min": 1237 }, { "epoch": 4.121951219512195, "grad_norm": 0.5151222071885753, "learning_rate": 1.7315793886446036e-05, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.0557260662317276, "step": 2535, "valid_targets_mean": 4326.4, "valid_targets_min": 638 }, { "epoch": 4.130081300813008, "grad_norm": 0.4450667494465782, "learning_rate": 1.7235455555794236e-05, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.08098851144313812, "step": 2540, "valid_targets_mean": 6224.8, "valid_targets_min": 1301 }, { "epoch": 4.138211382113822, "grad_norm": 0.46674087201623526, "learning_rate": 1.7155162676148682e-05, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.11802077293395996, "step": 2545, "valid_targets_mean": 6261.2, "valid_targets_min": 802 }, { "epoch": 4.146341463414634, "grad_norm": 0.5143547555412055, "learning_rate": 1.707491656757936e-05, "loss": 0.1723, "loss_nan_ranks": 0, "loss_rank_avg": 0.09308500587940216, "step": 2550, "valid_targets_mean": 4701.8, "valid_targets_min": 844 }, { "epoch": 4.154471544715447, "grad_norm": 0.587891855203043, "learning_rate": 1.6994718549387332e-05, "loss": 0.1495, "loss_nan_ranks": 0, "loss_rank_avg": 0.0780920758843422, "step": 2555, "valid_targets_mean": 3128.9, "valid_targets_min": 772 }, { "epoch": 4.16260162601626, "grad_norm": 0.5075349666289611, "learning_rate": 1.6914569940083004e-05, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.06455211341381073, "step": 2560, "valid_targets_mean": 4237.0, "valid_targets_min": 1429 }, { "epoch": 4.170731707317073, "grad_norm": 0.4644748738029107, "learning_rate": 1.6834472057364462e-05, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.09997627139091492, "step": 2565, "valid_targets_mean": 6478.0, "valid_targets_min": 1985 }, { "epoch": 4.178861788617886, "grad_norm": 0.43715016647506927, "learning_rate": 1.6754426218095827e-05, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.09350892901420593, "step": 2570, "valid_targets_mean": 7747.0, "valid_targets_min": 2135 }, { "epoch": 4.186991869918699, "grad_norm": 0.5144167874811619, "learning_rate": 1.6674433738285573e-05, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.10404399037361145, "step": 2575, "valid_targets_mean": 5096.9, "valid_targets_min": 1528 }, { "epoch": 4.195121951219512, "grad_norm": 0.5836489841825808, "learning_rate": 1.6594495933064926e-05, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.06642283499240875, "step": 2580, "valid_targets_mean": 3414.9, "valid_targets_min": 1041 }, { "epoch": 4.203252032520325, "grad_norm": 0.4248964546565483, "learning_rate": 1.6514614116666213e-05, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.07662998884916306, "step": 2585, "valid_targets_mean": 6127.9, "valid_targets_min": 1556 }, { "epoch": 4.211382113821138, "grad_norm": 0.5633035449980022, "learning_rate": 1.6434789602401264e-05, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.07008647918701172, "step": 2590, "valid_targets_mean": 3270.1, "valid_targets_min": 1044 }, { "epoch": 4.219512195121951, "grad_norm": 0.479741702810202, "learning_rate": 1.6355023702639835e-05, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.08551254123449326, "step": 2595, "valid_targets_mean": 5185.9, "valid_targets_min": 2262 }, { "epoch": 4.227642276422764, "grad_norm": 0.4556534575031909, "learning_rate": 1.6275317728787995e-05, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.07114671170711517, "step": 2600, "valid_targets_mean": 4481.5, "valid_targets_min": 986 }, { "epoch": 4.235772357723577, "grad_norm": 0.47124227862472406, "learning_rate": 1.6195672991266627e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.04725772887468338, "step": 2605, "valid_targets_mean": 3744.0, "valid_targets_min": 1430 }, { "epoch": 4.2439024390243905, "grad_norm": 0.5143434728872713, "learning_rate": 1.6116090799489817e-05, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.06984749436378479, "step": 2610, "valid_targets_mean": 4490.1, "valid_targets_min": 1367 }, { "epoch": 4.252032520325203, "grad_norm": 0.5315336075348905, "learning_rate": 1.603657246184337e-05, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.08241944760084152, "step": 2615, "valid_targets_mean": 5229.8, "valid_targets_min": 1092 }, { "epoch": 4.260162601626016, "grad_norm": 0.4304341882650181, "learning_rate": 1.5957119285663276e-05, "loss": 0.1643, "loss_nan_ranks": 0, "loss_rank_avg": 0.07520405948162079, "step": 2620, "valid_targets_mean": 6784.0, "valid_targets_min": 2445 }, { "epoch": 4.2682926829268295, "grad_norm": 0.4847716931386392, "learning_rate": 1.5877732577214227e-05, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.07001012563705444, "step": 2625, "valid_targets_mean": 4826.5, "valid_targets_min": 1595 }, { "epoch": 4.276422764227642, "grad_norm": 0.4988367383903381, "learning_rate": 1.5798413641668152e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.077020063996315, "step": 2630, "valid_targets_mean": 5269.6, "valid_targets_min": 1374 }, { "epoch": 4.284552845528455, "grad_norm": 0.5807973900920063, "learning_rate": 1.5719163783082735e-05, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.07132510840892792, "step": 2635, "valid_targets_mean": 2914.2, "valid_targets_min": 360 }, { "epoch": 4.2926829268292686, "grad_norm": 0.48502885572051696, "learning_rate": 1.563998430437999e-05, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.08346251398324966, "step": 2640, "valid_targets_mean": 4075.8, "valid_targets_min": 1022 }, { "epoch": 4.300813008130081, "grad_norm": 0.453331962859297, "learning_rate": 1.556087650732483e-05, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.046189140528440475, "step": 2645, "valid_targets_mean": 3378.0, "valid_targets_min": 1136 }, { "epoch": 4.308943089430894, "grad_norm": 0.6099949910931554, "learning_rate": 1.5481841692503696e-05, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.08059431612491608, "step": 2650, "valid_targets_mean": 5008.8, "valid_targets_min": 914 }, { "epoch": 4.317073170731708, "grad_norm": 0.4047454132808525, "learning_rate": 1.5402881159303132e-05, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.08221932500600815, "step": 2655, "valid_targets_mean": 6544.0, "valid_targets_min": 2585 }, { "epoch": 4.32520325203252, "grad_norm": 0.46712956665924055, "learning_rate": 1.5323996205888444e-05, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.09215272963047028, "step": 2660, "valid_targets_mean": 5262.6, "valid_targets_min": 856 }, { "epoch": 4.333333333333333, "grad_norm": 0.5736488228751866, "learning_rate": 1.5245188129182352e-05, "loss": 0.1441, "loss_nan_ranks": 0, "loss_rank_avg": 0.12925416231155396, "step": 2665, "valid_targets_mean": 5132.2, "valid_targets_min": 1897 }, { "epoch": 4.341463414634147, "grad_norm": 0.43100075653800896, "learning_rate": 1.5166458224843666e-05, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.06192822754383087, "step": 2670, "valid_targets_mean": 5483.0, "valid_targets_min": 1147 }, { "epoch": 4.349593495934959, "grad_norm": 0.4089405411882674, "learning_rate": 1.5087807787246018e-05, "loss": 0.1339, "loss_nan_ranks": 0, "loss_rank_avg": 0.0610245019197464, "step": 2675, "valid_targets_mean": 7012.1, "valid_targets_min": 884 }, { "epoch": 4.357723577235772, "grad_norm": 0.5115108287042687, "learning_rate": 1.5009238109456519e-05, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.07275721430778503, "step": 2680, "valid_targets_mean": 4917.8, "valid_targets_min": 1031 }, { "epoch": 4.365853658536586, "grad_norm": 0.6219846224675181, "learning_rate": 1.4930750483214545e-05, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.07144097238779068, "step": 2685, "valid_targets_mean": 4172.2, "valid_targets_min": 582 }, { "epoch": 4.373983739837398, "grad_norm": 0.6260641394398687, "learning_rate": 1.485234619891049e-05, "loss": 0.1674, "loss_nan_ranks": 0, "loss_rank_avg": 0.07533955574035645, "step": 2690, "valid_targets_mean": 3091.9, "valid_targets_min": 1175 }, { "epoch": 4.382113821138211, "grad_norm": 0.4549669428429121, "learning_rate": 1.4774026545564542e-05, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.06965496391057968, "step": 2695, "valid_targets_mean": 5983.5, "valid_targets_min": 724 }, { "epoch": 4.390243902439025, "grad_norm": 0.5455526041877279, "learning_rate": 1.4695792810805513e-05, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.10486696660518646, "step": 2700, "valid_targets_mean": 6566.9, "valid_targets_min": 900 }, { "epoch": 4.3983739837398375, "grad_norm": 0.6530779968965817, "learning_rate": 1.4617646280849642e-05, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.08029432594776154, "step": 2705, "valid_targets_mean": 4237.9, "valid_targets_min": 736 }, { "epoch": 4.40650406504065, "grad_norm": 0.5137034484423478, "learning_rate": 1.4539588240479465e-05, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.07562180608510971, "step": 2710, "valid_targets_mean": 3674.4, "valid_targets_min": 463 }, { "epoch": 4.414634146341464, "grad_norm": 0.4544189096267336, "learning_rate": 1.4461619973022687e-05, "loss": 0.1489, "loss_nan_ranks": 0, "loss_rank_avg": 0.10149542987346649, "step": 2715, "valid_targets_mean": 8344.6, "valid_targets_min": 1459 }, { "epoch": 4.4227642276422765, "grad_norm": 0.5683967017561563, "learning_rate": 1.4383742760331076e-05, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.07244271785020828, "step": 2720, "valid_targets_mean": 5211.8, "valid_targets_min": 2229 }, { "epoch": 4.430894308943089, "grad_norm": 0.5193181601984862, "learning_rate": 1.4305957882759427e-05, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.04341577738523483, "step": 2725, "valid_targets_mean": 3964.2, "valid_targets_min": 956 }, { "epoch": 4.439024390243903, "grad_norm": 0.6823628303109857, "learning_rate": 1.4228266619144453e-05, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.0863582193851471, "step": 2730, "valid_targets_mean": 2811.5, "valid_targets_min": 738 }, { "epoch": 4.4471544715447155, "grad_norm": 0.5493718999282637, "learning_rate": 1.4150670246783799e-05, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.10341790318489075, "step": 2735, "valid_targets_mean": 5248.6, "valid_targets_min": 835 }, { "epoch": 4.455284552845528, "grad_norm": 0.6378690416717784, "learning_rate": 1.4073170041415028e-05, "loss": 0.174, "loss_nan_ranks": 0, "loss_rank_avg": 0.06139558181166649, "step": 2740, "valid_targets_mean": 3043.8, "valid_targets_min": 994 }, { "epoch": 4.463414634146342, "grad_norm": 0.4611867678116556, "learning_rate": 1.3995767277194665e-05, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.11183435469865799, "step": 2745, "valid_targets_mean": 8525.0, "valid_targets_min": 2185 }, { "epoch": 4.471544715447155, "grad_norm": 0.5791260471503948, "learning_rate": 1.391846322667722e-05, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.10518206655979156, "step": 2750, "valid_targets_mean": 4332.1, "valid_targets_min": 569 }, { "epoch": 4.479674796747967, "grad_norm": 0.473868549796618, "learning_rate": 1.3841259160794298e-05, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.0857369527220726, "step": 2755, "valid_targets_mean": 5520.1, "valid_targets_min": 1822 }, { "epoch": 4.487804878048781, "grad_norm": 0.576014432118026, "learning_rate": 1.3764156348833666e-05, "loss": 0.1616, "loss_nan_ranks": 0, "loss_rank_avg": 0.08932463824748993, "step": 2760, "valid_targets_mean": 4587.6, "valid_targets_min": 2137 }, { "epoch": 4.495934959349594, "grad_norm": 0.43786499906523346, "learning_rate": 1.3687156058418422e-05, "loss": 0.1495, "loss_nan_ranks": 0, "loss_rank_avg": 0.06921911239624023, "step": 2765, "valid_targets_mean": 5706.2, "valid_targets_min": 1332 }, { "epoch": 4.504065040650406, "grad_norm": 0.5549703994167362, "learning_rate": 1.3610259555486152e-05, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.06656062602996826, "step": 2770, "valid_targets_mean": 3052.9, "valid_targets_min": 1436 }, { "epoch": 4.512195121951219, "grad_norm": 0.6049685262855611, "learning_rate": 1.3533468104268078e-05, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.06683901697397232, "step": 2775, "valid_targets_mean": 2855.1, "valid_targets_min": 643 }, { "epoch": 4.520325203252033, "grad_norm": 0.4671992162112881, "learning_rate": 1.3456782967268316e-05, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.06862746179103851, "step": 2780, "valid_targets_mean": 5073.0, "valid_targets_min": 922 }, { "epoch": 4.528455284552845, "grad_norm": 0.47375274833210074, "learning_rate": 1.3380205405243096e-05, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.07612131536006927, "step": 2785, "valid_targets_mean": 5507.6, "valid_targets_min": 2010 }, { "epoch": 4.536585365853659, "grad_norm": 0.5414741931961937, "learning_rate": 1.3303736677180044e-05, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.09981250762939453, "step": 2790, "valid_targets_mean": 5963.1, "valid_targets_min": 1036 }, { "epoch": 4.544715447154472, "grad_norm": 0.6709409758759214, "learning_rate": 1.322737804027749e-05, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.08285298943519592, "step": 2795, "valid_targets_mean": 3114.9, "valid_targets_min": 929 }, { "epoch": 4.5528455284552845, "grad_norm": 0.5194948516731278, "learning_rate": 1.315113074992378e-05, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.08558328449726105, "step": 2800, "valid_targets_mean": 5572.0, "valid_targets_min": 1874 }, { "epoch": 4.560975609756097, "grad_norm": 0.5529444345631296, "learning_rate": 1.3074996059676644e-05, "loss": 0.1624, "loss_nan_ranks": 0, "loss_rank_avg": 0.09635849297046661, "step": 2805, "valid_targets_mean": 5840.8, "valid_targets_min": 1166 }, { "epoch": 4.569105691056911, "grad_norm": 0.7155725915999065, "learning_rate": 1.2998975221242596e-05, "loss": 0.1567, "loss_nan_ranks": 0, "loss_rank_avg": 0.07258845120668411, "step": 2810, "valid_targets_mean": 3025.4, "valid_targets_min": 867 }, { "epoch": 4.5772357723577235, "grad_norm": 0.444103000708674, "learning_rate": 1.292306948445634e-05, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.06945082545280457, "step": 2815, "valid_targets_mean": 5158.1, "valid_targets_min": 1065 }, { "epoch": 4.585365853658536, "grad_norm": 0.5428888205606085, "learning_rate": 1.2847280097260245e-05, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.12906724214553833, "step": 2820, "valid_targets_mean": 6604.4, "valid_targets_min": 1170 }, { "epoch": 4.59349593495935, "grad_norm": 0.5097400919260324, "learning_rate": 1.2771608305683798e-05, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.08143587410449982, "step": 2825, "valid_targets_mean": 5530.2, "valid_targets_min": 924 }, { "epoch": 4.6016260162601625, "grad_norm": 0.5412216121050345, "learning_rate": 1.269605535382314e-05, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.0613265261054039, "step": 2830, "valid_targets_mean": 3314.8, "valid_targets_min": 925 }, { "epoch": 4.609756097560975, "grad_norm": 0.5918540474436129, "learning_rate": 1.2620622483820604e-05, "loss": 0.1702, "loss_nan_ranks": 0, "loss_rank_avg": 0.10300006717443466, "step": 2835, "valid_targets_mean": 4694.0, "valid_targets_min": 1471 }, { "epoch": 4.617886178861789, "grad_norm": 0.61047667881045, "learning_rate": 1.2545310935844288e-05, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.12697109580039978, "step": 2840, "valid_targets_mean": 6276.6, "valid_targets_min": 1088 }, { "epoch": 4.626016260162602, "grad_norm": 0.5019138523871594, "learning_rate": 1.2470121948067693e-05, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.07365751266479492, "step": 2845, "valid_targets_mean": 5933.0, "valid_targets_min": 1632 }, { "epoch": 4.634146341463414, "grad_norm": 0.6328067223359671, "learning_rate": 1.2395056756649328e-05, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.06169738620519638, "step": 2850, "valid_targets_mean": 2991.8, "valid_targets_min": 1536 }, { "epoch": 4.642276422764228, "grad_norm": 0.4846398461498477, "learning_rate": 1.2320116595712413e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.07755859196186066, "step": 2855, "valid_targets_mean": 4616.4, "valid_targets_min": 1413 }, { "epoch": 4.650406504065041, "grad_norm": 0.5390784533983399, "learning_rate": 1.224530269732457e-05, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.10266651213169098, "step": 2860, "valid_targets_mean": 4373.6, "valid_targets_min": 991 }, { "epoch": 4.658536585365853, "grad_norm": 0.5867138639624438, "learning_rate": 1.2170616291477595e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.11183062195777893, "step": 2865, "valid_targets_mean": 5506.8, "valid_targets_min": 1811 }, { "epoch": 4.666666666666667, "grad_norm": 0.39969362421251053, "learning_rate": 1.2096058606067205e-05, "loss": 0.1449, "loss_nan_ranks": 0, "loss_rank_avg": 0.08079314231872559, "step": 2870, "valid_targets_mean": 7655.6, "valid_targets_min": 2121 }, { "epoch": 4.67479674796748, "grad_norm": 0.610173541641884, "learning_rate": 1.2021630866872877e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.09658057987689972, "step": 2875, "valid_targets_mean": 5048.4, "valid_targets_min": 177 }, { "epoch": 4.682926829268292, "grad_norm": 0.4945385952047977, "learning_rate": 1.1947334297537675e-05, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.08059705793857574, "step": 2880, "valid_targets_mean": 5533.4, "valid_targets_min": 1190 }, { "epoch": 4.691056910569106, "grad_norm": 0.517671091788911, "learning_rate": 1.1873170119548134e-05, "loss": 0.1738, "loss_nan_ranks": 0, "loss_rank_avg": 0.043919868767261505, "step": 2885, "valid_targets_mean": 2010.0, "valid_targets_min": 1194 }, { "epoch": 4.699186991869919, "grad_norm": 0.4684498058104573, "learning_rate": 1.1799139552214202e-05, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.10377422720193863, "step": 2890, "valid_targets_mean": 4968.1, "valid_targets_min": 1186 }, { "epoch": 4.7073170731707314, "grad_norm": 0.5414859072608289, "learning_rate": 1.1725243812649168e-05, "loss": 0.1715, "loss_nan_ranks": 0, "loss_rank_avg": 0.08510809391736984, "step": 2895, "valid_targets_mean": 4427.8, "valid_targets_min": 1992 }, { "epoch": 4.715447154471545, "grad_norm": 0.4465041663785712, "learning_rate": 1.1651484115749647e-05, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.07684445381164551, "step": 2900, "valid_targets_mean": 6517.6, "valid_targets_min": 940 }, { "epoch": 4.723577235772358, "grad_norm": 0.482172705141307, "learning_rate": 1.1577861674175645e-05, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.04566498100757599, "step": 2905, "valid_targets_mean": 3679.8, "valid_targets_min": 1621 }, { "epoch": 4.7317073170731705, "grad_norm": 0.4268634412682329, "learning_rate": 1.1504377698330575e-05, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.06258468329906464, "step": 2910, "valid_targets_mean": 5361.1, "valid_targets_min": 1430 }, { "epoch": 4.739837398373984, "grad_norm": 0.5016846825049857, "learning_rate": 1.1431033396341391e-05, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.08513687551021576, "step": 2915, "valid_targets_mean": 5517.8, "valid_targets_min": 1160 }, { "epoch": 4.747967479674797, "grad_norm": 0.4895916965759536, "learning_rate": 1.1357829974038703e-05, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.07120572030544281, "step": 2920, "valid_targets_mean": 5064.2, "valid_targets_min": 1144 }, { "epoch": 4.7560975609756095, "grad_norm": 0.5482443932106592, "learning_rate": 1.1284768634936971e-05, "loss": 0.1713, "loss_nan_ranks": 0, "loss_rank_avg": 0.08294594287872314, "step": 2925, "valid_targets_mean": 5197.2, "valid_targets_min": 1551 }, { "epoch": 4.764227642276423, "grad_norm": 0.556353846679473, "learning_rate": 1.1211850580214703e-05, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.10283535718917847, "step": 2930, "valid_targets_mean": 5125.8, "valid_targets_min": 1901 }, { "epoch": 4.772357723577236, "grad_norm": 0.4808233021089258, "learning_rate": 1.1139077008694712e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.11738122254610062, "step": 2935, "valid_targets_mean": 6494.9, "valid_targets_min": 1664 }, { "epoch": 4.780487804878049, "grad_norm": 0.5713770145912805, "learning_rate": 1.1066449116824428e-05, "loss": 0.1587, "loss_nan_ranks": 0, "loss_rank_avg": 0.058336518704891205, "step": 2940, "valid_targets_mean": 2281.0, "valid_targets_min": 168 }, { "epoch": 4.788617886178862, "grad_norm": 0.4478697491677857, "learning_rate": 1.099396809865618e-05, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.10043537616729736, "step": 2945, "valid_targets_mean": 8086.2, "valid_targets_min": 2320 }, { "epoch": 4.796747967479675, "grad_norm": 0.49052761241781395, "learning_rate": 1.0921635145827611e-05, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.0700555294752121, "step": 2950, "valid_targets_mean": 4055.2, "valid_targets_min": 1437 }, { "epoch": 4.804878048780488, "grad_norm": 0.6111681826738994, "learning_rate": 1.0849451447542054e-05, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.081040158867836, "step": 2955, "valid_targets_mean": 3611.6, "valid_targets_min": 783 }, { "epoch": 4.8130081300813, "grad_norm": 0.5902186935174121, "learning_rate": 1.0777418190549018e-05, "loss": 0.1761, "loss_nan_ranks": 0, "loss_rank_avg": 0.13564324378967285, "step": 2960, "valid_targets_mean": 5678.2, "valid_targets_min": 707 }, { "epoch": 4.821138211382114, "grad_norm": 0.5001179792330395, "learning_rate": 1.070553655912463e-05, "loss": 0.1687, "loss_nan_ranks": 0, "loss_rank_avg": 0.04111259803175926, "step": 2965, "valid_targets_mean": 3067.0, "valid_targets_min": 745 }, { "epoch": 4.829268292682927, "grad_norm": 0.4870799940244146, "learning_rate": 1.0633807735052202e-05, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.06709617376327515, "step": 2970, "valid_targets_mean": 4227.9, "valid_targets_min": 733 }, { "epoch": 4.83739837398374, "grad_norm": 0.4339727111450907, "learning_rate": 1.056223289760278e-05, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.0654265433549881, "step": 2975, "valid_targets_mean": 5513.1, "valid_targets_min": 1037 }, { "epoch": 4.845528455284553, "grad_norm": 0.46974193213734666, "learning_rate": 1.0490813223515764e-05, "loss": 0.174, "loss_nan_ranks": 0, "loss_rank_avg": 0.06082771345973015, "step": 2980, "valid_targets_mean": 4017.0, "valid_targets_min": 1644 }, { "epoch": 4.853658536585366, "grad_norm": 0.5525599944295453, "learning_rate": 1.0419549886979582e-05, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.10106134414672852, "step": 2985, "valid_targets_mean": 4674.5, "valid_targets_min": 974 }, { "epoch": 4.861788617886178, "grad_norm": 0.4397832235714203, "learning_rate": 1.0348444059612338e-05, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.05799185484647751, "step": 2990, "valid_targets_mean": 5038.1, "valid_targets_min": 1479 }, { "epoch": 4.869918699186992, "grad_norm": 0.49575459892005325, "learning_rate": 1.0277496910442596e-05, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.07994350790977478, "step": 2995, "valid_targets_mean": 6706.8, "valid_targets_min": 1003 }, { "epoch": 4.878048780487805, "grad_norm": 0.5531889849001992, "learning_rate": 1.0206709605890133e-05, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.058995675295591354, "step": 3000, "valid_targets_mean": 3086.5, "valid_targets_min": 1344 }, { "epoch": 4.886178861788618, "grad_norm": 0.4730444503128787, "learning_rate": 1.0136083309746765e-05, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.06733112782239914, "step": 3005, "valid_targets_mean": 4750.6, "valid_targets_min": 1355 }, { "epoch": 4.894308943089431, "grad_norm": 0.4339111364079381, "learning_rate": 1.006561918315724e-05, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.059047698974609375, "step": 3010, "valid_targets_mean": 5023.9, "valid_targets_min": 1449 }, { "epoch": 4.902439024390244, "grad_norm": 0.4279855746329812, "learning_rate": 9.995318384600112e-06, "loss": 0.1624, "loss_nan_ranks": 0, "loss_rank_avg": 0.09795396775007248, "step": 3015, "valid_targets_mean": 6714.2, "valid_targets_min": 1460 }, { "epoch": 4.9105691056910565, "grad_norm": 0.560210793984083, "learning_rate": 9.92518206986871e-06, "loss": 0.176, "loss_nan_ranks": 0, "loss_rank_avg": 0.11636665463447571, "step": 3020, "valid_targets_mean": 6159.1, "valid_targets_min": 971 }, { "epoch": 4.91869918699187, "grad_norm": 0.5174030242396476, "learning_rate": 9.855211392052139e-06, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.06636689603328705, "step": 3025, "valid_targets_mean": 4745.4, "valid_targets_min": 831 }, { "epoch": 4.926829268292683, "grad_norm": 0.5161039511538914, "learning_rate": 9.78540750151632e-06, "loss": 0.1666, "loss_nan_ranks": 0, "loss_rank_avg": 0.06481475383043289, "step": 3030, "valid_targets_mean": 3857.6, "valid_targets_min": 778 }, { "epoch": 4.934959349593496, "grad_norm": 0.4799392581007463, "learning_rate": 9.715771545885076e-06, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.08936204761266708, "step": 3035, "valid_targets_mean": 5134.8, "valid_targets_min": 1634 }, { "epoch": 4.943089430894309, "grad_norm": 0.5277397274003789, "learning_rate": 9.646304670021263e-06, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.056844696402549744, "step": 3040, "valid_targets_mean": 3186.1, "valid_targets_min": 1271 }, { "epoch": 4.951219512195122, "grad_norm": 0.5192411182730533, "learning_rate": 9.577008016007956e-06, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.09345956891775131, "step": 3045, "valid_targets_mean": 5773.0, "valid_targets_min": 1945 }, { "epoch": 4.959349593495935, "grad_norm": 0.46714907038686426, "learning_rate": 9.50788272312966e-06, "loss": 0.1692, "loss_nan_ranks": 0, "loss_rank_avg": 0.10420192778110504, "step": 3050, "valid_targets_mean": 7552.9, "valid_targets_min": 2637 }, { "epoch": 4.967479674796748, "grad_norm": 0.49116442306059277, "learning_rate": 9.43892992785358e-06, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.046188224107027054, "step": 3055, "valid_targets_mean": 2851.2, "valid_targets_min": 735 }, { "epoch": 4.975609756097561, "grad_norm": 0.5080857505436233, "learning_rate": 9.370150763810966e-06, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.11296803504228592, "step": 3060, "valid_targets_mean": 5853.9, "valid_targets_min": 650 }, { "epoch": 4.983739837398374, "grad_norm": 0.5563044568016549, "learning_rate": 9.301546361778424e-06, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.08238890022039413, "step": 3065, "valid_targets_mean": 4308.8, "valid_targets_min": 1807 }, { "epoch": 4.991869918699187, "grad_norm": 0.4859361498269127, "learning_rate": 9.233117849659367e-06, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.13086149096488953, "step": 3070, "valid_targets_mean": 7301.0, "valid_targets_min": 1202 }, { "epoch": 5.0, "grad_norm": 0.4859147272512682, "learning_rate": 9.164866352465447e-06, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.09017547965049744, "step": 3075, "valid_targets_mean": 6317.8, "valid_targets_min": 1575 }, { "epoch": 5.008130081300813, "grad_norm": 0.49854359536749215, "learning_rate": 9.096792992298089e-06, "loss": 0.1462, "loss_nan_ranks": 0, "loss_rank_avg": 0.058648284524679184, "step": 3080, "valid_targets_mean": 3432.9, "valid_targets_min": 922 }, { "epoch": 5.016260162601626, "grad_norm": 0.5107970270890307, "learning_rate": 9.028898888330005e-06, "loss": 0.1489, "loss_nan_ranks": 0, "loss_rank_avg": 0.07531550526618958, "step": 3085, "valid_targets_mean": 5513.6, "valid_targets_min": 2215 }, { "epoch": 5.024390243902439, "grad_norm": 0.5454600356098418, "learning_rate": 8.961185156786815e-06, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.059423185884952545, "step": 3090, "valid_targets_mean": 4991.8, "valid_targets_min": 982 }, { "epoch": 5.032520325203252, "grad_norm": 0.7173181761174011, "learning_rate": 8.893652910928698e-06, "loss": 0.1433, "loss_nan_ranks": 0, "loss_rank_avg": 0.08933936804533005, "step": 3095, "valid_targets_mean": 3738.2, "valid_targets_min": 1147 }, { "epoch": 5.040650406504065, "grad_norm": 0.626787973324638, "learning_rate": 8.826303261032072e-06, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.1016145721077919, "step": 3100, "valid_targets_mean": 4273.2, "valid_targets_min": 812 }, { "epoch": 5.048780487804878, "grad_norm": 0.4363980337643143, "learning_rate": 8.759137314371378e-06, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.06092683598399162, "step": 3105, "valid_targets_mean": 4570.0, "valid_targets_min": 1267 }, { "epoch": 5.056910569105691, "grad_norm": 0.47598532666763393, "learning_rate": 8.692156175200823e-06, "loss": 0.1417, "loss_nan_ranks": 0, "loss_rank_avg": 0.08653100579977036, "step": 3110, "valid_targets_mean": 7743.2, "valid_targets_min": 1609 }, { "epoch": 5.065040650406504, "grad_norm": 0.5697905541211631, "learning_rate": 8.625360944736262e-06, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.06744492799043655, "step": 3115, "valid_targets_mean": 3678.8, "valid_targets_min": 862 }, { "epoch": 5.073170731707317, "grad_norm": 0.5310652799284886, "learning_rate": 8.558752721137089e-06, "loss": 0.1513, "loss_nan_ranks": 0, "loss_rank_avg": 0.08869394659996033, "step": 3120, "valid_targets_mean": 4928.6, "valid_targets_min": 1058 }, { "epoch": 5.08130081300813, "grad_norm": 0.5037931186801259, "learning_rate": 8.492332599488157e-06, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.12100984901189804, "step": 3125, "valid_targets_mean": 7846.2, "valid_targets_min": 1120 }, { "epoch": 5.0894308943089435, "grad_norm": 0.4762169133202216, "learning_rate": 8.42610167178183e-06, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.06363822519779205, "step": 3130, "valid_targets_mean": 4641.9, "valid_targets_min": 1211 }, { "epoch": 5.097560975609756, "grad_norm": 0.5531751995953906, "learning_rate": 8.360061026899962e-06, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.10041944682598114, "step": 3135, "valid_targets_mean": 5801.6, "valid_targets_min": 967 }, { "epoch": 5.105691056910569, "grad_norm": 0.5773466743368734, "learning_rate": 8.294211750596035e-06, "loss": 0.1441, "loss_nan_ranks": 0, "loss_rank_avg": 0.06968657672405243, "step": 3140, "valid_targets_mean": 3366.9, "valid_targets_min": 798 }, { "epoch": 5.1138211382113825, "grad_norm": 0.5063964799160192, "learning_rate": 8.228554925477306e-06, "loss": 0.1372, "loss_nan_ranks": 0, "loss_rank_avg": 0.05303658917546272, "step": 3145, "valid_targets_mean": 3915.9, "valid_targets_min": 1077 }, { "epoch": 5.121951219512195, "grad_norm": 0.6557565347169084, "learning_rate": 8.163091630987e-06, "loss": 0.1414, "loss_nan_ranks": 0, "loss_rank_avg": 0.0775236189365387, "step": 3150, "valid_targets_mean": 2828.0, "valid_targets_min": 1349 }, { "epoch": 5.130081300813008, "grad_norm": 0.504707094696265, "learning_rate": 8.097822943386563e-06, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.1327846646308899, "step": 3155, "valid_targets_mean": 6904.1, "valid_targets_min": 1017 }, { "epoch": 5.138211382113822, "grad_norm": 0.4974966624143671, "learning_rate": 8.03274993573797e-06, "loss": 0.1364, "loss_nan_ranks": 0, "loss_rank_avg": 0.07157565653324127, "step": 3160, "valid_targets_mean": 5011.9, "valid_targets_min": 993 }, { "epoch": 5.146341463414634, "grad_norm": 0.3671402281895943, "learning_rate": 7.96787367788609e-06, "loss": 0.1463, "loss_nan_ranks": 0, "loss_rank_avg": 0.06661646068096161, "step": 3165, "valid_targets_mean": 8203.4, "valid_targets_min": 1950 }, { "epoch": 5.154471544715447, "grad_norm": 0.44667433334720263, "learning_rate": 7.903195236441086e-06, "loss": 0.137, "loss_nan_ranks": 0, "loss_rank_avg": 0.07493871450424194, "step": 3170, "valid_targets_mean": 6196.5, "valid_targets_min": 1109 }, { "epoch": 5.16260162601626, "grad_norm": 0.49783463906067615, "learning_rate": 7.838715674760874e-06, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.07221659272909164, "step": 3175, "valid_targets_mean": 6492.0, "valid_targets_min": 1710 }, { "epoch": 5.170731707317073, "grad_norm": 0.5372739564428146, "learning_rate": 7.774436052933675e-06, "loss": 0.1527, "loss_nan_ranks": 0, "loss_rank_avg": 0.08551802486181259, "step": 3180, "valid_targets_mean": 4486.5, "valid_targets_min": 1133 }, { "epoch": 5.178861788617886, "grad_norm": 0.4041059491827253, "learning_rate": 7.710357427760541e-06, "loss": 0.1413, "loss_nan_ranks": 0, "loss_rank_avg": 0.05999711528420448, "step": 3185, "valid_targets_mean": 8748.9, "valid_targets_min": 1692 }, { "epoch": 5.186991869918699, "grad_norm": 0.518044448300407, "learning_rate": 7.646480852738008e-06, "loss": 0.1409, "loss_nan_ranks": 0, "loss_rank_avg": 0.08598169684410095, "step": 3190, "valid_targets_mean": 6521.9, "valid_targets_min": 1654 }, { "epoch": 5.195121951219512, "grad_norm": 0.5780827294222305, "learning_rate": 7.5828073780407575e-06, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.08051645755767822, "step": 3195, "valid_targets_mean": 4492.1, "valid_targets_min": 1174 }, { "epoch": 5.203252032520325, "grad_norm": 0.5238635777060622, "learning_rate": 7.51933805050439e-06, "loss": 0.1457, "loss_nan_ranks": 0, "loss_rank_avg": 0.05375855416059494, "step": 3200, "valid_targets_mean": 3988.4, "valid_targets_min": 701 }, { "epoch": 5.211382113821138, "grad_norm": 0.5015015158588826, "learning_rate": 7.45607391360816e-06, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.06788468360900879, "step": 3205, "valid_targets_mean": 5458.2, "valid_targets_min": 1724 }, { "epoch": 5.219512195121951, "grad_norm": 0.4528447860323385, "learning_rate": 7.393016007457858e-06, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.07554462552070618, "step": 3210, "valid_targets_mean": 5808.5, "valid_targets_min": 977 }, { "epoch": 5.227642276422764, "grad_norm": 0.5302870185060073, "learning_rate": 7.3301653687687005e-06, "loss": 0.1587, "loss_nan_ranks": 0, "loss_rank_avg": 0.04706777632236481, "step": 3215, "valid_targets_mean": 3385.8, "valid_targets_min": 1439 }, { "epoch": 5.235772357723577, "grad_norm": 0.5995348899933904, "learning_rate": 7.2675230308482715e-06, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.07221737504005432, "step": 3220, "valid_targets_mean": 3964.5, "valid_targets_min": 1024 }, { "epoch": 5.2439024390243905, "grad_norm": 0.4041689231278984, "learning_rate": 7.205090023579575e-06, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.04537433385848999, "step": 3225, "valid_targets_mean": 5532.2, "valid_targets_min": 1171 }, { "epoch": 5.252032520325203, "grad_norm": 0.48806925485849423, "learning_rate": 7.142867373404054e-06, "loss": 0.1418, "loss_nan_ranks": 0, "loss_rank_avg": 0.1001819372177124, "step": 3230, "valid_targets_mean": 5811.6, "valid_targets_min": 1225 }, { "epoch": 5.260162601626016, "grad_norm": 0.5676587706429211, "learning_rate": 7.080856103304739e-06, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.094810351729393, "step": 3235, "valid_targets_mean": 5457.5, "valid_targets_min": 1081 }, { "epoch": 5.2682926829268295, "grad_norm": 0.589418070163673, "learning_rate": 7.019057232789432e-06, "loss": 0.1409, "loss_nan_ranks": 0, "loss_rank_avg": 0.10773605853319168, "step": 3240, "valid_targets_mean": 4418.9, "valid_targets_min": 573 }, { "epoch": 5.276422764227642, "grad_norm": 0.6257292895524542, "learning_rate": 6.95747177787393e-06, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.10086464881896973, "step": 3245, "valid_targets_mean": 4056.5, "valid_targets_min": 1903 }, { "epoch": 5.284552845528455, "grad_norm": 0.4904374796790561, "learning_rate": 6.896100751065355e-06, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.08876670151948929, "step": 3250, "valid_targets_mean": 5023.5, "valid_targets_min": 1535 }, { "epoch": 5.2926829268292686, "grad_norm": 0.5496914353661247, "learning_rate": 6.834945161345458e-06, "loss": 0.1676, "loss_nan_ranks": 0, "loss_rank_avg": 0.058593012392520905, "step": 3255, "valid_targets_mean": 3781.8, "valid_targets_min": 981 }, { "epoch": 5.300813008130081, "grad_norm": 0.4978181792750339, "learning_rate": 6.7740060141540735e-06, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.055863749235868454, "step": 3260, "valid_targets_mean": 4500.1, "valid_targets_min": 1186 }, { "epoch": 5.308943089430894, "grad_norm": 0.4203568527752614, "learning_rate": 6.713284311372559e-06, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.0628855973482132, "step": 3265, "valid_targets_mean": 7745.5, "valid_targets_min": 1502 }, { "epoch": 5.317073170731708, "grad_norm": 0.663927317547951, "learning_rate": 6.652781051307347e-06, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.04293135553598404, "step": 3270, "valid_targets_mean": 2127.0, "valid_targets_min": 1492 }, { "epoch": 5.32520325203252, "grad_norm": 0.4781729388868269, "learning_rate": 6.592497228673515e-06, "loss": 0.1444, "loss_nan_ranks": 0, "loss_rank_avg": 0.08012019097805023, "step": 3275, "valid_targets_mean": 6378.5, "valid_targets_min": 444 }, { "epoch": 5.333333333333333, "grad_norm": 0.607414251381825, "learning_rate": 6.532433834578449e-06, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.07517934590578079, "step": 3280, "valid_targets_mean": 5569.0, "valid_targets_min": 684 }, { "epoch": 5.341463414634147, "grad_norm": 0.45673248053918214, "learning_rate": 6.472591856505526e-06, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.07896129786968231, "step": 3285, "valid_targets_mean": 8128.4, "valid_targets_min": 1090 }, { "epoch": 5.349593495934959, "grad_norm": 0.5121223481371979, "learning_rate": 6.412972278297893e-06, "loss": 0.141, "loss_nan_ranks": 0, "loss_rank_avg": 0.059703271836042404, "step": 3290, "valid_targets_mean": 3892.6, "valid_targets_min": 220 }, { "epoch": 5.357723577235772, "grad_norm": 0.6849550131287704, "learning_rate": 6.353576080142309e-06, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.09094927459955215, "step": 3295, "valid_targets_mean": 2592.1, "valid_targets_min": 1194 }, { "epoch": 5.365853658536586, "grad_norm": 0.4298070556094885, "learning_rate": 6.294404238552994e-06, "loss": 0.1439, "loss_nan_ranks": 0, "loss_rank_avg": 0.04759322851896286, "step": 3300, "valid_targets_mean": 4864.8, "valid_targets_min": 1912 }, { "epoch": 5.373983739837398, "grad_norm": 0.5148540712843253, "learning_rate": 6.235457726355591e-06, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.08303937315940857, "step": 3305, "valid_targets_mean": 6326.0, "valid_targets_min": 1237 }, { "epoch": 5.382113821138211, "grad_norm": 0.4977120202620715, "learning_rate": 6.176737512671182e-06, "loss": 0.1427, "loss_nan_ranks": 0, "loss_rank_avg": 0.06961072981357574, "step": 3310, "valid_targets_mean": 4249.5, "valid_targets_min": 1883 }, { "epoch": 5.390243902439025, "grad_norm": 0.47882579814516146, "learning_rate": 6.11824456290034e-06, "loss": 0.1353, "loss_nan_ranks": 0, "loss_rank_avg": 0.06477604806423187, "step": 3315, "valid_targets_mean": 5231.5, "valid_targets_min": 1151 }, { "epoch": 5.3983739837398375, "grad_norm": 0.579883922417472, "learning_rate": 6.05997983870727e-06, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.06657819449901581, "step": 3320, "valid_targets_mean": 4098.4, "valid_targets_min": 1209 }, { "epoch": 5.40650406504065, "grad_norm": 0.4740276499842878, "learning_rate": 6.00194429800399e-06, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.06888905167579651, "step": 3325, "valid_targets_mean": 6041.8, "valid_targets_min": 502 }, { "epoch": 5.414634146341464, "grad_norm": 0.6709879863380092, "learning_rate": 5.944138894934582e-06, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.08873364329338074, "step": 3330, "valid_targets_mean": 5908.1, "valid_targets_min": 937 }, { "epoch": 5.4227642276422765, "grad_norm": 0.5985145982762373, "learning_rate": 5.886564579859504e-06, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.09765864908695221, "step": 3335, "valid_targets_mean": 5333.6, "valid_targets_min": 1577 }, { "epoch": 5.430894308943089, "grad_norm": 0.4045576655293279, "learning_rate": 5.829222299339969e-06, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.08612416684627533, "step": 3340, "valid_targets_mean": 7717.9, "valid_targets_min": 1806 }, { "epoch": 5.439024390243903, "grad_norm": 0.6264324432727286, "learning_rate": 5.772112996122403e-06, "loss": 0.1424, "loss_nan_ranks": 0, "loss_rank_avg": 0.08448145538568497, "step": 3345, "valid_targets_mean": 3572.1, "valid_targets_min": 1658 }, { "epoch": 5.4471544715447155, "grad_norm": 0.48969077905949704, "learning_rate": 5.715237609122896e-06, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.10492876172065735, "step": 3350, "valid_targets_mean": 6810.0, "valid_targets_min": 1096 }, { "epoch": 5.455284552845528, "grad_norm": 0.542350082879983, "learning_rate": 5.658597073411816e-06, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.0580582469701767, "step": 3355, "valid_targets_mean": 3644.1, "valid_targets_min": 1053 }, { "epoch": 5.463414634146342, "grad_norm": 0.5109663508257631, "learning_rate": 5.602192320198401e-06, "loss": 0.1457, "loss_nan_ranks": 0, "loss_rank_avg": 0.052927643060684204, "step": 3360, "valid_targets_mean": 4242.1, "valid_targets_min": 554 }, { "epoch": 5.471544715447155, "grad_norm": 0.5108865212838303, "learning_rate": 5.546024276815467e-06, "loss": 0.1336, "loss_nan_ranks": 0, "loss_rank_avg": 0.0898483395576477, "step": 3365, "valid_targets_mean": 6533.8, "valid_targets_min": 728 }, { "epoch": 5.479674796747967, "grad_norm": 0.6216505478797267, "learning_rate": 5.490093866704171e-06, "loss": 0.1616, "loss_nan_ranks": 0, "loss_rank_avg": 0.10169227421283722, "step": 3370, "valid_targets_mean": 4857.0, "valid_targets_min": 1080 }, { "epoch": 5.487804878048781, "grad_norm": 0.5633469634869857, "learning_rate": 5.434402009398798e-06, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.08256097137928009, "step": 3375, "valid_targets_mean": 4313.6, "valid_targets_min": 1563 }, { "epoch": 5.495934959349594, "grad_norm": 0.4152905580329195, "learning_rate": 5.378949620511671e-06, "loss": 0.1475, "loss_nan_ranks": 0, "loss_rank_avg": 0.07723593711853027, "step": 3380, "valid_targets_mean": 9008.1, "valid_targets_min": 3078 }, { "epoch": 5.504065040650406, "grad_norm": 0.5311623735869512, "learning_rate": 5.3237376117180854e-06, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.08768315613269806, "step": 3385, "valid_targets_mean": 4967.6, "valid_targets_min": 1341 }, { "epoch": 5.512195121951219, "grad_norm": 0.568135953677004, "learning_rate": 5.268766890741315e-06, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.08434534072875977, "step": 3390, "valid_targets_mean": 3570.9, "valid_targets_min": 1926 }, { "epoch": 5.520325203252033, "grad_norm": 0.475746460031834, "learning_rate": 5.214038361337719e-06, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.09175962209701538, "step": 3395, "valid_targets_mean": 8532.4, "valid_targets_min": 3389 }, { "epoch": 5.528455284552845, "grad_norm": 0.5085691695146316, "learning_rate": 5.159552923281841e-06, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.06383851170539856, "step": 3400, "valid_targets_mean": 3872.4, "valid_targets_min": 735 }, { "epoch": 5.536585365853659, "grad_norm": 0.6690261410952633, "learning_rate": 5.105311472351639e-06, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.05282168090343475, "step": 3405, "valid_targets_mean": 2115.5, "valid_targets_min": 850 }, { "epoch": 5.544715447154472, "grad_norm": 0.5100659086393543, "learning_rate": 5.051314900313764e-06, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.04734280705451965, "step": 3410, "valid_targets_mean": 3005.0, "valid_targets_min": 529 }, { "epoch": 5.5528455284552845, "grad_norm": 0.49892887750042736, "learning_rate": 4.997564094908878e-06, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.08764363825321198, "step": 3415, "valid_targets_mean": 5742.2, "valid_targets_min": 1868 }, { "epoch": 5.560975609756097, "grad_norm": 0.48648538778638434, "learning_rate": 4.944059939837082e-06, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.0696064680814743, "step": 3420, "valid_targets_mean": 6079.4, "valid_targets_min": 910 }, { "epoch": 5.569105691056911, "grad_norm": 0.5168959826292698, "learning_rate": 4.890803314743371e-06, "loss": 0.1588, "loss_nan_ranks": 0, "loss_rank_avg": 0.05596218630671501, "step": 3425, "valid_targets_mean": 4584.6, "valid_targets_min": 1199 }, { "epoch": 5.5772357723577235, "grad_norm": 0.5503991908963576, "learning_rate": 4.837795095203175e-06, "loss": 0.141, "loss_nan_ranks": 0, "loss_rank_avg": 0.0811515673995018, "step": 3430, "valid_targets_mean": 4608.2, "valid_targets_min": 805 }, { "epoch": 5.585365853658536, "grad_norm": 0.4937547707850458, "learning_rate": 4.785036152707969e-06, "loss": 0.1358, "loss_nan_ranks": 0, "loss_rank_avg": 0.07238927483558655, "step": 3435, "valid_targets_mean": 6213.9, "valid_targets_min": 2005 }, { "epoch": 5.59349593495935, "grad_norm": 0.5477537226170912, "learning_rate": 4.732527354650951e-06, "loss": 0.1567, "loss_nan_ranks": 0, "loss_rank_avg": 0.10932628810405731, "step": 3440, "valid_targets_mean": 7147.6, "valid_targets_min": 2902 }, { "epoch": 5.6016260162601625, "grad_norm": 0.4397249981417704, "learning_rate": 4.68026956431276e-06, "loss": 0.1458, "loss_nan_ranks": 0, "loss_rank_avg": 0.06082093343138695, "step": 3445, "valid_targets_mean": 6207.0, "valid_targets_min": 1971 }, { "epoch": 5.609756097560975, "grad_norm": 0.4460352266841392, "learning_rate": 4.628263640847304e-06, "loss": 0.1358, "loss_nan_ranks": 0, "loss_rank_avg": 0.0991651713848114, "step": 3450, "valid_targets_mean": 7991.2, "valid_targets_min": 835 }, { "epoch": 5.617886178861789, "grad_norm": 0.46332791657614336, "learning_rate": 4.5765104392676205e-06, "loss": 0.1302, "loss_nan_ranks": 0, "loss_rank_avg": 0.07686010748147964, "step": 3455, "valid_targets_mean": 8166.8, "valid_targets_min": 3397 }, { "epoch": 5.626016260162602, "grad_norm": 0.609861782594922, "learning_rate": 4.525010810431825e-06, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.0901678130030632, "step": 3460, "valid_targets_mean": 4795.0, "valid_targets_min": 986 }, { "epoch": 5.634146341463414, "grad_norm": 0.5806616011047664, "learning_rate": 4.4737656010291366e-06, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.04445335268974304, "step": 3465, "valid_targets_mean": 2880.8, "valid_targets_min": 1356 }, { "epoch": 5.642276422764228, "grad_norm": 0.5359946789329091, "learning_rate": 4.422775653565934e-06, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.12036748230457306, "step": 3470, "valid_targets_mean": 6577.9, "valid_targets_min": 779 }, { "epoch": 5.650406504065041, "grad_norm": 0.5429212531785038, "learning_rate": 4.372041806351914e-06, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.09158656001091003, "step": 3475, "valid_targets_mean": 5610.8, "valid_targets_min": 1274 }, { "epoch": 5.658536585365853, "grad_norm": 0.5937266326907074, "learning_rate": 4.321564893486312e-06, "loss": 0.1692, "loss_nan_ranks": 0, "loss_rank_avg": 0.17133484780788422, "step": 3480, "valid_targets_mean": 5507.4, "valid_targets_min": 1032 }, { "epoch": 5.666666666666667, "grad_norm": 0.43760484322305737, "learning_rate": 4.271345744844182e-06, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.07250078022480011, "step": 3485, "valid_targets_mean": 7164.9, "valid_targets_min": 926 }, { "epoch": 5.67479674796748, "grad_norm": 1.0195875786667528, "learning_rate": 4.2213851860627696e-06, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.048584144562482834, "step": 3490, "valid_targets_mean": 2628.4, "valid_targets_min": 1065 }, { "epoch": 5.682926829268292, "grad_norm": 0.4924348871704833, "learning_rate": 4.171684038527914e-06, "loss": 0.1391, "loss_nan_ranks": 0, "loss_rank_avg": 0.06494857370853424, "step": 3495, "valid_targets_mean": 5082.6, "valid_targets_min": 1198 }, { "epoch": 5.691056910569106, "grad_norm": 0.6452555282215298, "learning_rate": 4.12224311936056e-06, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.0747845247387886, "step": 3500, "valid_targets_mean": 3321.0, "valid_targets_min": 1041 }, { "epoch": 5.699186991869919, "grad_norm": 0.5336793890509473, "learning_rate": 4.073063241403316e-06, "loss": 0.1332, "loss_nan_ranks": 0, "loss_rank_avg": 0.07798875868320465, "step": 3505, "valid_targets_mean": 4852.4, "valid_targets_min": 1228 }, { "epoch": 5.7073170731707314, "grad_norm": 0.6185768410415784, "learning_rate": 4.024145213207103e-06, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.1081596165895462, "step": 3510, "valid_targets_mean": 4946.0, "valid_targets_min": 1489 }, { "epoch": 5.715447154471545, "grad_norm": 0.6178884977151816, "learning_rate": 3.975489839017846e-06, "loss": 0.1527, "loss_nan_ranks": 0, "loss_rank_avg": 0.08012266457080841, "step": 3515, "valid_targets_mean": 3635.9, "valid_targets_min": 1167 }, { "epoch": 5.723577235772358, "grad_norm": 0.5165843575579899, "learning_rate": 3.9270979187632516e-06, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.08562658727169037, "step": 3520, "valid_targets_mean": 5898.1, "valid_targets_min": 2167 }, { "epoch": 5.7317073170731705, "grad_norm": 0.5308627260490062, "learning_rate": 3.878970248039678e-06, "loss": 0.1391, "loss_nan_ranks": 0, "loss_rank_avg": 0.057754069566726685, "step": 3525, "valid_targets_mean": 3393.5, "valid_targets_min": 1695 }, { "epoch": 5.739837398373984, "grad_norm": 0.5169969359187669, "learning_rate": 3.831107618099026e-06, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.08548920601606369, "step": 3530, "valid_targets_mean": 6755.8, "valid_targets_min": 1659 }, { "epoch": 5.747967479674797, "grad_norm": 0.4911127509964081, "learning_rate": 3.7835108158357537e-06, "loss": 0.1359, "loss_nan_ranks": 0, "loss_rank_avg": 0.07760560512542725, "step": 3535, "valid_targets_mean": 4701.1, "valid_targets_min": 1200 }, { "epoch": 5.7560975609756095, "grad_norm": 0.6256653476163969, "learning_rate": 3.7361806237739264e-06, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.10821224749088287, "step": 3540, "valid_targets_mean": 4438.8, "valid_targets_min": 1605 }, { "epoch": 5.764227642276423, "grad_norm": 0.6143418161665082, "learning_rate": 3.689117820054351e-06, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.09576346725225449, "step": 3545, "valid_targets_mean": 4500.5, "valid_targets_min": 1088 }, { "epoch": 5.772357723577236, "grad_norm": 0.5053101481674264, "learning_rate": 3.6423231784217918e-06, "loss": 0.1409, "loss_nan_ranks": 0, "loss_rank_avg": 0.06341202557086945, "step": 3550, "valid_targets_mean": 4709.8, "valid_targets_min": 1743 }, { "epoch": 5.780487804878049, "grad_norm": 0.5185945828988379, "learning_rate": 3.595797468212241e-06, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.058721110224723816, "step": 3555, "valid_targets_mean": 4438.8, "valid_targets_min": 431 }, { "epoch": 5.788617886178862, "grad_norm": 0.485826882756074, "learning_rate": 3.549541454340284e-06, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.046945132315158844, "step": 3560, "valid_targets_mean": 3586.6, "valid_targets_min": 810 }, { "epoch": 5.796747967479675, "grad_norm": 0.4795063932843012, "learning_rate": 3.503555897286499e-06, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.07797123491764069, "step": 3565, "valid_targets_mean": 7539.5, "valid_targets_min": 2072 }, { "epoch": 5.804878048780488, "grad_norm": 0.4988624493218227, "learning_rate": 3.4578415530849794e-06, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.06318468600511551, "step": 3570, "valid_targets_mean": 5519.1, "valid_targets_min": 971 }, { "epoch": 5.8130081300813, "grad_norm": 0.5915061462334097, "learning_rate": 3.4123991733108852e-06, "loss": 0.1348, "loss_nan_ranks": 0, "loss_rank_avg": 0.07162193953990936, "step": 3575, "valid_targets_mean": 4290.6, "valid_targets_min": 2837 }, { "epoch": 5.821138211382114, "grad_norm": 0.6339526576145084, "learning_rate": 3.3672295050680946e-06, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.1004466712474823, "step": 3580, "valid_targets_mean": 3266.6, "valid_targets_min": 1135 }, { "epoch": 5.829268292682927, "grad_norm": 0.6144764996603019, "learning_rate": 3.322333290976936e-06, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.047704365104436874, "step": 3585, "valid_targets_mean": 3931.6, "valid_targets_min": 971 }, { "epoch": 5.83739837398374, "grad_norm": 0.6233426593748503, "learning_rate": 3.2777112691619473e-06, "loss": 0.1467, "loss_nan_ranks": 0, "loss_rank_avg": 0.04878469556570053, "step": 3590, "valid_targets_mean": 2275.9, "valid_targets_min": 1493 }, { "epoch": 5.845528455284553, "grad_norm": 0.513146176569118, "learning_rate": 3.233364173239766e-06, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.11057032644748688, "step": 3595, "valid_targets_mean": 7431.9, "valid_targets_min": 3803 }, { "epoch": 5.853658536585366, "grad_norm": 0.39338525950024467, "learning_rate": 3.189292732307052e-06, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.0750330239534378, "step": 3600, "valid_targets_mean": 7109.9, "valid_targets_min": 1844 }, { "epoch": 5.861788617886178, "grad_norm": 0.5491212859348665, "learning_rate": 3.1454976709285124e-06, "loss": 0.1419, "loss_nan_ranks": 0, "loss_rank_avg": 0.09204214811325073, "step": 3605, "valid_targets_mean": 5398.6, "valid_targets_min": 816 }, { "epoch": 5.869918699186992, "grad_norm": 0.44758859530282585, "learning_rate": 3.1019797091249938e-06, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.09642410278320312, "step": 3610, "valid_targets_mean": 5608.8, "valid_targets_min": 1155 }, { "epoch": 5.878048780487805, "grad_norm": 0.492246176203537, "learning_rate": 3.058739562361621e-06, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.06799611449241638, "step": 3615, "valid_targets_mean": 4828.1, "valid_targets_min": 1790 }, { "epoch": 5.886178861788618, "grad_norm": 0.6805281486892042, "learning_rate": 3.015777941536058e-06, "loss": 0.1445, "loss_nan_ranks": 0, "loss_rank_avg": 0.0549367219209671, "step": 3620, "valid_targets_mean": 2295.9, "valid_targets_min": 917 }, { "epoch": 5.894308943089431, "grad_norm": 0.6639345621677888, "learning_rate": 2.973095552966805e-06, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.09857673943042755, "step": 3625, "valid_targets_mean": 4574.8, "valid_targets_min": 1036 }, { "epoch": 5.902439024390244, "grad_norm": 0.6124750331186275, "learning_rate": 2.9306930983816005e-06, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.0993262380361557, "step": 3630, "valid_targets_mean": 4096.4, "valid_targets_min": 1536 }, { "epoch": 5.9105691056910565, "grad_norm": 0.5643588254261337, "learning_rate": 2.8885712749058737e-06, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.13022960722446442, "step": 3635, "valid_targets_mean": 6864.2, "valid_targets_min": 1937 }, { "epoch": 5.91869918699187, "grad_norm": 0.5905977400403103, "learning_rate": 2.8467307750512808e-06, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.11141015589237213, "step": 3640, "valid_targets_mean": 6235.9, "valid_targets_min": 2238 }, { "epoch": 5.926829268292683, "grad_norm": 0.530786441642335, "learning_rate": 2.80517228670433e-06, "loss": 0.1436, "loss_nan_ranks": 0, "loss_rank_avg": 0.05851534754037857, "step": 3645, "valid_targets_mean": 4112.1, "valid_targets_min": 907 }, { "epoch": 5.934959349593496, "grad_norm": 0.4913256912751018, "learning_rate": 2.7638964931150637e-06, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.059017717838287354, "step": 3650, "valid_targets_mean": 3893.6, "valid_targets_min": 707 }, { "epoch": 5.943089430894309, "grad_norm": 0.536687522630536, "learning_rate": 2.7229040728858323e-06, "loss": 0.1379, "loss_nan_ranks": 0, "loss_rank_avg": 0.0714992955327034, "step": 3655, "valid_targets_mean": 4946.5, "valid_targets_min": 1911 }, { "epoch": 5.951219512195122, "grad_norm": 0.5506461888892271, "learning_rate": 2.6821956999601306e-06, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.07032961398363113, "step": 3660, "valid_targets_mean": 5594.8, "valid_targets_min": 1285 }, { "epoch": 5.959349593495935, "grad_norm": 0.6553289921069847, "learning_rate": 2.641772043611521e-06, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.08100451529026031, "step": 3665, "valid_targets_mean": 3261.0, "valid_targets_min": 759 }, { "epoch": 5.967479674796748, "grad_norm": 0.4351322730145396, "learning_rate": 2.6016337684326342e-06, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.06324901431798935, "step": 3670, "valid_targets_mean": 6432.2, "valid_targets_min": 1780 }, { "epoch": 5.975609756097561, "grad_norm": 0.5475367305498099, "learning_rate": 2.5617815343242327e-06, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.05930344760417938, "step": 3675, "valid_targets_mean": 4173.6, "valid_targets_min": 958 }, { "epoch": 5.983739837398374, "grad_norm": 0.44102078305259657, "learning_rate": 2.522215996484374e-06, "loss": 0.167, "loss_nan_ranks": 0, "loss_rank_avg": 0.09785904735326767, "step": 3680, "valid_targets_mean": 7297.8, "valid_targets_min": 1333 }, { "epoch": 5.991869918699187, "grad_norm": 0.5240924440683472, "learning_rate": 2.4829378053976318e-06, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.08522488176822662, "step": 3685, "valid_targets_mean": 4658.1, "valid_targets_min": 770 }, { "epoch": 6.0, "grad_norm": 0.7123764922525749, "learning_rate": 2.4439476068243927e-06, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.09183523058891296, "step": 3690, "valid_targets_mean": 3641.5, "valid_targets_min": 1351 }, { "epoch": 6.008130081300813, "grad_norm": 0.5125951187250442, "learning_rate": 2.4052460417902613e-06, "loss": 0.1268, "loss_nan_ranks": 0, "loss_rank_avg": 0.09160792827606201, "step": 3695, "valid_targets_mean": 6559.5, "valid_targets_min": 673 }, { "epoch": 6.016260162601626, "grad_norm": 0.5255921018708041, "learning_rate": 2.3668337465754985e-06, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.03819496929645538, "step": 3700, "valid_targets_mean": 2973.6, "valid_targets_min": 1301 }, { "epoch": 6.024390243902439, "grad_norm": 0.5991271116563525, "learning_rate": 2.3287113527045823e-06, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.06017238274216652, "step": 3705, "valid_targets_mean": 2995.0, "valid_targets_min": 478 }, { "epoch": 6.032520325203252, "grad_norm": 0.5028295236068805, "learning_rate": 2.2908794869358044e-06, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.09328052401542664, "step": 3710, "valid_targets_mean": 7330.5, "valid_targets_min": 1051 }, { "epoch": 6.040650406504065, "grad_norm": 0.48577732509794, "learning_rate": 2.253338771250977e-06, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.08138886094093323, "step": 3715, "valid_targets_mean": 6913.5, "valid_targets_min": 1350 }, { "epoch": 6.048780487804878, "grad_norm": 0.5607320105097346, "learning_rate": 2.216089822845211e-06, "loss": 0.1335, "loss_nan_ranks": 0, "loss_rank_avg": 0.05849029868841171, "step": 3720, "valid_targets_mean": 3197.2, "valid_targets_min": 1356 }, { "epoch": 6.056910569105691, "grad_norm": 0.4265467163633901, "learning_rate": 2.1791332541167497e-06, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.05778588354587555, "step": 3725, "valid_targets_mean": 7165.9, "valid_targets_min": 2124 }, { "epoch": 6.065040650406504, "grad_norm": 0.4998525125501409, "learning_rate": 2.142469672656935e-06, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.05413878709077835, "step": 3730, "valid_targets_mean": 5275.1, "valid_targets_min": 1558 }, { "epoch": 6.073170731707317, "grad_norm": 0.48601634546744743, "learning_rate": 2.106099681240179e-06, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.09387250244617462, "step": 3735, "valid_targets_mean": 5513.5, "valid_targets_min": 887 }, { "epoch": 6.08130081300813, "grad_norm": 0.49009376407302246, "learning_rate": 2.07002387781408e-06, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.04371977224946022, "step": 3740, "valid_targets_mean": 2684.4, "valid_targets_min": 748 }, { "epoch": 6.0894308943089435, "grad_norm": 0.529756719074617, "learning_rate": 2.0342428554895788e-06, "loss": 0.1316, "loss_nan_ranks": 0, "loss_rank_avg": 0.06981755793094635, "step": 3745, "valid_targets_mean": 6925.4, "valid_targets_min": 1802 }, { "epoch": 6.097560975609756, "grad_norm": 0.4352521155481912, "learning_rate": 1.998757202531223e-06, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.06377846002578735, "step": 3750, "valid_targets_mean": 6639.2, "valid_targets_min": 1671 }, { "epoch": 6.105691056910569, "grad_norm": 0.6759392847299264, "learning_rate": 1.9635675023474764e-06, "loss": 0.1409, "loss_nan_ranks": 0, "loss_rank_avg": 0.10881119966506958, "step": 3755, "valid_targets_mean": 3663.0, "valid_targets_min": 1057 }, { "epoch": 6.1138211382113825, "grad_norm": 0.5911778807260428, "learning_rate": 1.92867433348114e-06, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.1204938068985939, "step": 3760, "valid_targets_mean": 7143.0, "valid_targets_min": 541 }, { "epoch": 6.121951219512195, "grad_norm": 0.5223695837378161, "learning_rate": 1.8940782695998305e-06, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.07732852548360825, "step": 3765, "valid_targets_mean": 7005.0, "valid_targets_min": 1058 }, { "epoch": 6.130081300813008, "grad_norm": 0.5828560978961865, "learning_rate": 1.859779879486565e-06, "loss": 0.1454, "loss_nan_ranks": 0, "loss_rank_avg": 0.08834804594516754, "step": 3770, "valid_targets_mean": 5369.8, "valid_targets_min": 1953 }, { "epoch": 6.138211382113822, "grad_norm": 0.5361855011928899, "learning_rate": 1.8257797270303924e-06, "loss": 0.1454, "loss_nan_ranks": 0, "loss_rank_avg": 0.0897950530052185, "step": 3775, "valid_targets_mean": 5802.2, "valid_targets_min": 965 }, { "epoch": 6.146341463414634, "grad_norm": 0.4839573459279249, "learning_rate": 1.792078371217132e-06, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.06997618824243546, "step": 3780, "valid_targets_mean": 5035.6, "valid_targets_min": 1968 }, { "epoch": 6.154471544715447, "grad_norm": 0.629972769197006, "learning_rate": 1.7586763661201821e-06, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.08012628555297852, "step": 3785, "valid_targets_mean": 3025.5, "valid_targets_min": 1493 }, { "epoch": 6.16260162601626, "grad_norm": 0.474069267594382, "learning_rate": 1.7255742608914095e-06, "loss": 0.1439, "loss_nan_ranks": 0, "loss_rank_avg": 0.06208975240588188, "step": 3790, "valid_targets_mean": 5872.8, "valid_targets_min": 2008 }, { "epoch": 6.170731707317073, "grad_norm": 0.4809531766745778, "learning_rate": 1.6927725997521171e-06, "loss": 0.1344, "loss_nan_ranks": 0, "loss_rank_avg": 0.061438895761966705, "step": 3795, "valid_targets_mean": 5967.9, "valid_targets_min": 836 }, { "epoch": 6.178861788617886, "grad_norm": 0.45267282211135207, "learning_rate": 1.6602719219841135e-06, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.09101088345050812, "step": 3800, "valid_targets_mean": 7909.1, "valid_targets_min": 937 }, { "epoch": 6.186991869918699, "grad_norm": 0.5388804148566072, "learning_rate": 1.6280727619208202e-06, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.05914738029241562, "step": 3805, "valid_targets_mean": 4102.5, "valid_targets_min": 2015 }, { "epoch": 6.195121951219512, "grad_norm": 0.5485002339679745, "learning_rate": 1.5961756489385117e-06, "loss": 0.1391, "loss_nan_ranks": 0, "loss_rank_avg": 0.06488044559955597, "step": 3810, "valid_targets_mean": 4093.6, "valid_targets_min": 612 }, { "epoch": 6.203252032520325, "grad_norm": 0.6060789228357235, "learning_rate": 1.5645811074475915e-06, "loss": 0.1346, "loss_nan_ranks": 0, "loss_rank_avg": 0.05854189395904541, "step": 3815, "valid_targets_mean": 3103.6, "valid_targets_min": 1558 }, { "epoch": 6.211382113821138, "grad_norm": 0.4619822811719695, "learning_rate": 1.533289656883985e-06, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.048693303018808365, "step": 3820, "valid_targets_mean": 3227.4, "valid_targets_min": 1126 }, { "epoch": 6.219512195121951, "grad_norm": 0.5014566562350612, "learning_rate": 1.5023018117005995e-06, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.07048257440328598, "step": 3825, "valid_targets_mean": 6760.8, "valid_targets_min": 1532 }, { "epoch": 6.227642276422764, "grad_norm": 0.5301070173999823, "learning_rate": 1.4716180813588566e-06, "loss": 0.1376, "loss_nan_ranks": 0, "loss_rank_avg": 0.06466139107942581, "step": 3830, "valid_targets_mean": 3930.5, "valid_targets_min": 979 }, { "epoch": 6.235772357723577, "grad_norm": 0.55669387206407, "learning_rate": 1.44123897032032e-06, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.08089330792427063, "step": 3835, "valid_targets_mean": 4741.6, "valid_targets_min": 1071 }, { "epoch": 6.2439024390243905, "grad_norm": 0.4980057098811839, "learning_rate": 1.411164978038404e-06, "loss": 0.1316, "loss_nan_ranks": 0, "loss_rank_avg": 0.07480640709400177, "step": 3840, "valid_targets_mean": 6420.6, "valid_targets_min": 1351 }, { "epoch": 6.252032520325203, "grad_norm": 0.48567479881201847, "learning_rate": 1.3813965989501687e-06, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.07757849991321564, "step": 3845, "valid_targets_mean": 5568.0, "valid_targets_min": 1500 }, { "epoch": 6.260162601626016, "grad_norm": 0.6038613597717304, "learning_rate": 1.3519343224681758e-06, "loss": 0.1376, "loss_nan_ranks": 0, "loss_rank_avg": 0.05287151038646698, "step": 3850, "valid_targets_mean": 3085.2, "valid_targets_min": 1668 }, { "epoch": 6.2682926829268295, "grad_norm": 0.4676572755074319, "learning_rate": 1.3227786329724479e-06, "loss": 0.1438, "loss_nan_ranks": 0, "loss_rank_avg": 0.06467849016189575, "step": 3855, "valid_targets_mean": 7109.8, "valid_targets_min": 1681 }, { "epoch": 6.276422764227642, "grad_norm": 0.5119627189260858, "learning_rate": 1.2939300098025177e-06, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.05341634154319763, "step": 3860, "valid_targets_mean": 3681.2, "valid_targets_min": 603 }, { "epoch": 6.284552845528455, "grad_norm": 0.5609118530581023, "learning_rate": 1.2653889272495223e-06, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.06689933687448502, "step": 3865, "valid_targets_mean": 3262.0, "valid_targets_min": 1597 }, { "epoch": 6.2926829268292686, "grad_norm": 0.6452235400709166, "learning_rate": 1.2371558545484375e-06, "loss": 0.1322, "loss_nan_ranks": 0, "loss_rank_avg": 0.05612143129110336, "step": 3870, "valid_targets_mean": 2529.9, "valid_targets_min": 946 }, { "epoch": 6.300813008130081, "grad_norm": 0.6646309846895969, "learning_rate": 1.2092312558703333e-06, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.10385371744632721, "step": 3875, "valid_targets_mean": 4806.8, "valid_targets_min": 972 }, { "epoch": 6.308943089430894, "grad_norm": 0.43883177294111547, "learning_rate": 1.181615590314762e-06, "loss": 0.1357, "loss_nan_ranks": 0, "loss_rank_avg": 0.06866000592708588, "step": 3880, "valid_targets_mean": 8409.5, "valid_targets_min": 827 }, { "epoch": 6.317073170731708, "grad_norm": 0.5400337744941237, "learning_rate": 1.1543093119021976e-06, "loss": 0.1475, "loss_nan_ranks": 0, "loss_rank_avg": 0.05641719698905945, "step": 3885, "valid_targets_mean": 3760.0, "valid_targets_min": 979 }, { "epoch": 6.32520325203252, "grad_norm": 0.6869017454510746, "learning_rate": 1.1273128695665814e-06, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.07005228102207184, "step": 3890, "valid_targets_mean": 3259.8, "valid_targets_min": 929 }, { "epoch": 6.333333333333333, "grad_norm": 0.5877646145381491, "learning_rate": 1.1006267071479359e-06, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.049145568162202835, "step": 3895, "valid_targets_mean": 2465.6, "valid_targets_min": 644 }, { "epoch": 6.341463414634147, "grad_norm": 0.4822132210234282, "learning_rate": 1.074251263385071e-06, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.07078665494918823, "step": 3900, "valid_targets_mean": 5522.6, "valid_targets_min": 1681 }, { "epoch": 6.349593495934959, "grad_norm": 0.5689782271232432, "learning_rate": 1.0481869719083647e-06, "loss": 0.145, "loss_nan_ranks": 0, "loss_rank_avg": 0.04569226875901222, "step": 3905, "valid_targets_mean": 3140.6, "valid_targets_min": 998 }, { "epoch": 6.357723577235772, "grad_norm": 0.4138881875099752, "learning_rate": 1.022434261232641e-06, "loss": 0.1265, "loss_nan_ranks": 0, "loss_rank_avg": 0.045029543340206146, "step": 3910, "valid_targets_mean": 7257.1, "valid_targets_min": 1349 }, { "epoch": 6.365853658536586, "grad_norm": 0.45628440702603473, "learning_rate": 9.969935547501208e-07, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.07180604338645935, "step": 3915, "valid_targets_mean": 6870.4, "valid_targets_min": 1190 }, { "epoch": 6.373983739837398, "grad_norm": 0.5661858360921957, "learning_rate": 9.718652707234667e-07, "loss": 0.1329, "loss_nan_ranks": 0, "loss_rank_avg": 0.0554160550236702, "step": 3920, "valid_targets_mean": 4203.9, "valid_targets_min": 360 }, { "epoch": 6.382113821138211, "grad_norm": 0.4866834728523311, "learning_rate": 9.47049822278896e-07, "loss": 0.1367, "loss_nan_ranks": 0, "loss_rank_avg": 0.08370758593082428, "step": 3925, "valid_targets_mean": 7344.5, "valid_targets_min": 2113 }, { "epoch": 6.390243902439025, "grad_norm": 0.5879680171481766, "learning_rate": 9.225476173993941e-07, "loss": 0.1422, "loss_nan_ranks": 0, "loss_rank_avg": 0.05219414085149765, "step": 3930, "valid_targets_mean": 2731.0, "valid_targets_min": 862 }, { "epoch": 6.3983739837398375, "grad_norm": 0.6125432746278001, "learning_rate": 8.983590589180125e-07, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.07979313284158707, "step": 3935, "valid_targets_mean": 3850.1, "valid_targets_min": 1271 }, { "epoch": 6.40650406504065, "grad_norm": 0.5378493409154269, "learning_rate": 8.744845445112337e-07, "loss": 0.1376, "loss_nan_ranks": 0, "loss_rank_avg": 0.0704009160399437, "step": 3940, "valid_targets_mean": 4573.4, "valid_targets_min": 1459 }, { "epoch": 6.414634146341464, "grad_norm": 0.49988189892518614, "learning_rate": 8.50924466692451e-07, "loss": 0.1414, "loss_nan_ranks": 0, "loss_rank_avg": 0.05998336151242256, "step": 3945, "valid_targets_mean": 4343.2, "valid_targets_min": 1346 }, { "epoch": 6.4227642276422765, "grad_norm": 0.47818008070317997, "learning_rate": 8.276792128054967e-07, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.06701447069644928, "step": 3950, "valid_targets_mean": 6133.1, "valid_targets_min": 734 }, { "epoch": 6.430894308943089, "grad_norm": 0.5823763883113064, "learning_rate": 8.047491650182815e-07, "loss": 0.1385, "loss_nan_ranks": 0, "loss_rank_avg": 0.0805363804101944, "step": 3955, "valid_targets_mean": 4293.2, "valid_targets_min": 840 }, { "epoch": 6.439024390243903, "grad_norm": 0.42979185701439304, "learning_rate": 7.821347003165125e-07, "loss": 0.1395, "loss_nan_ranks": 0, "loss_rank_avg": 0.07834421843290329, "step": 3960, "valid_targets_mean": 8628.5, "valid_targets_min": 2240 }, { "epoch": 6.4471544715447155, "grad_norm": 0.7579165515450033, "learning_rate": 7.598361904974982e-07, "loss": 0.1322, "loss_nan_ranks": 0, "loss_rank_avg": 0.08511120826005936, "step": 3965, "valid_targets_mean": 2386.4, "valid_targets_min": 810 }, { "epoch": 6.455284552845528, "grad_norm": 0.4460991570733875, "learning_rate": 7.378540021640313e-07, "loss": 0.1373, "loss_nan_ranks": 0, "loss_rank_avg": 0.04093274101614952, "step": 3970, "valid_targets_mean": 3864.4, "valid_targets_min": 1250 }, { "epoch": 6.463414634146342, "grad_norm": 0.48481029732724185, "learning_rate": 7.161884967183552e-07, "loss": 0.1344, "loss_nan_ranks": 0, "loss_rank_avg": 0.06909462809562683, "step": 3975, "valid_targets_mean": 5614.2, "valid_targets_min": 1116 }, { "epoch": 6.471544715447155, "grad_norm": 0.46376076172514147, "learning_rate": 6.948400303562386e-07, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.048643216490745544, "step": 3980, "valid_targets_mean": 3914.6, "valid_targets_min": 1289 }, { "epoch": 6.479674796747967, "grad_norm": 0.6206279837594318, "learning_rate": 6.738089540611059e-07, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.05547118932008743, "step": 3985, "valid_targets_mean": 2721.2, "valid_targets_min": 1149 }, { "epoch": 6.487804878048781, "grad_norm": 0.5184236921242481, "learning_rate": 6.530956135982713e-07, "loss": 0.1316, "loss_nan_ranks": 0, "loss_rank_avg": 0.06311732530593872, "step": 3990, "valid_targets_mean": 4710.1, "valid_targets_min": 919 }, { "epoch": 6.495934959349594, "grad_norm": 0.4768554900383388, "learning_rate": 6.327003495092565e-07, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.06617482751607895, "step": 3995, "valid_targets_mean": 5106.1, "valid_targets_min": 1003 }, { "epoch": 6.504065040650406, "grad_norm": 0.4743940396358253, "learning_rate": 6.126234971061861e-07, "loss": 0.1343, "loss_nan_ranks": 0, "loss_rank_avg": 0.0865192711353302, "step": 4000, "valid_targets_mean": 8140.4, "valid_targets_min": 1437 }, { "epoch": 6.512195121951219, "grad_norm": 0.5736904558956544, "learning_rate": 5.928653864662815e-07, "loss": 0.1283, "loss_nan_ranks": 0, "loss_rank_avg": 0.0700342208147049, "step": 4005, "valid_targets_mean": 7398.9, "valid_targets_min": 2092 }, { "epoch": 6.520325203252033, "grad_norm": 0.5725691985725135, "learning_rate": 5.734263424264242e-07, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.05735783651471138, "step": 4010, "valid_targets_mean": 3289.0, "valid_targets_min": 1358 }, { "epoch": 6.528455284552845, "grad_norm": 0.5081434910962875, "learning_rate": 5.543066845778345e-07, "loss": 0.1377, "loss_nan_ranks": 0, "loss_rank_avg": 0.0788717046380043, "step": 4015, "valid_targets_mean": 5680.4, "valid_targets_min": 1660 }, { "epoch": 6.536585365853659, "grad_norm": 0.4838819599909031, "learning_rate": 5.355067272607928e-07, "loss": 0.1402, "loss_nan_ranks": 0, "loss_rank_avg": 0.07935932278633118, "step": 4020, "valid_targets_mean": 5819.2, "valid_targets_min": 1032 }, { "epoch": 6.544715447154472, "grad_norm": 0.464037313182742, "learning_rate": 5.170267795594886e-07, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.09259124845266342, "step": 4025, "valid_targets_mean": 10793.4, "valid_targets_min": 2508 }, { "epoch": 6.5528455284552845, "grad_norm": 0.5586258416927378, "learning_rate": 4.988671452969329e-07, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.057701949030160904, "step": 4030, "valid_targets_mean": 4107.9, "valid_targets_min": 456 }, { "epoch": 6.560975609756097, "grad_norm": 0.4939958155467588, "learning_rate": 4.810281230299674e-07, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.0794210284948349, "step": 4035, "valid_targets_mean": 6762.2, "valid_targets_min": 1740 }, { "epoch": 6.569105691056911, "grad_norm": 0.5341037134579636, "learning_rate": 4.6351000604434537e-07, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.07311007380485535, "step": 4040, "valid_targets_mean": 5182.4, "valid_targets_min": 1765 }, { "epoch": 6.5772357723577235, "grad_norm": 0.5912301404194484, "learning_rate": 4.463130823499273e-07, "loss": 0.1428, "loss_nan_ranks": 0, "loss_rank_avg": 0.059849344193935394, "step": 4045, "valid_targets_mean": 3271.9, "valid_targets_min": 1359 }, { "epoch": 6.585365853658536, "grad_norm": 0.5056447034085019, "learning_rate": 4.2943763467592436e-07, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.1126769632101059, "step": 4050, "valid_targets_mean": 7062.9, "valid_targets_min": 1388 }, { "epoch": 6.59349593495935, "grad_norm": 0.6145348678862775, "learning_rate": 4.12883940466271e-07, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.08739953488111496, "step": 4055, "valid_targets_mean": 5414.8, "valid_targets_min": 1257 }, { "epoch": 6.6016260162601625, "grad_norm": 0.4804777492198502, "learning_rate": 3.9665227187505097e-07, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.08290360867977142, "step": 4060, "valid_targets_mean": 7208.0, "valid_targets_min": 2560 }, { "epoch": 6.609756097560975, "grad_norm": 0.5574166118518863, "learning_rate": 3.8074289576202295e-07, "loss": 0.1404, "loss_nan_ranks": 0, "loss_rank_avg": 0.0751386508345604, "step": 4065, "valid_targets_mean": 3869.2, "valid_targets_min": 181 }, { "epoch": 6.617886178861789, "grad_norm": 0.5970083675443173, "learning_rate": 3.6515607368824203e-07, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.06374109536409378, "step": 4070, "valid_targets_mean": 2811.4, "valid_targets_min": 588 }, { "epoch": 6.626016260162602, "grad_norm": 0.45025626837485694, "learning_rate": 3.498920619117474e-07, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.0788019597530365, "step": 4075, "valid_targets_mean": 5441.9, "valid_targets_min": 926 }, { "epoch": 6.634146341463414, "grad_norm": 0.6562690543794055, "learning_rate": 3.3495111138336147e-07, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.0719897598028183, "step": 4080, "valid_targets_mean": 3231.2, "valid_targets_min": 1237 }, { "epoch": 6.642276422764228, "grad_norm": 0.6175575954289109, "learning_rate": 3.203334677425529e-07, "loss": 0.1445, "loss_nan_ranks": 0, "loss_rank_avg": 0.08788205683231354, "step": 4085, "valid_targets_mean": 3920.8, "valid_targets_min": 1831 }, { "epoch": 6.650406504065041, "grad_norm": 0.46032067090434414, "learning_rate": 3.060393713134091e-07, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.05151630565524101, "step": 4090, "valid_targets_mean": 4635.9, "valid_targets_min": 1944 }, { "epoch": 6.658536585365853, "grad_norm": 0.6777596078038732, "learning_rate": 2.920690571006768e-07, "loss": 0.1329, "loss_nan_ranks": 0, "loss_rank_avg": 0.07666124403476715, "step": 4095, "valid_targets_mean": 3438.9, "valid_targets_min": 735 }, { "epoch": 6.666666666666667, "grad_norm": 0.5028120819216886, "learning_rate": 2.784227547858964e-07, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.04650210589170456, "step": 4100, "valid_targets_mean": 4073.6, "valid_targets_min": 792 }, { "epoch": 6.67479674796748, "grad_norm": 0.6470682484314884, "learning_rate": 2.651006887236385e-07, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.07603412866592407, "step": 4105, "valid_targets_mean": 3719.8, "valid_targets_min": 963 }, { "epoch": 6.682926829268292, "grad_norm": 0.3881852697738965, "learning_rate": 2.52103077937802e-07, "loss": 0.1237, "loss_nan_ranks": 0, "loss_rank_avg": 0.050025589764118195, "step": 4110, "valid_targets_mean": 7249.2, "valid_targets_min": 1435 }, { "epoch": 6.691056910569106, "grad_norm": 0.4778383612041256, "learning_rate": 2.394301361180218e-07, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.08101027458906174, "step": 4115, "valid_targets_mean": 6453.9, "valid_targets_min": 2403 }, { "epoch": 6.699186991869919, "grad_norm": 0.5599821459547166, "learning_rate": 2.2708207161615147e-07, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.09059727191925049, "step": 4120, "valid_targets_mean": 5527.4, "valid_targets_min": 904 }, { "epoch": 6.7073170731707314, "grad_norm": 0.5107814718189087, "learning_rate": 2.150590874428371e-07, "loss": 0.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.05344102531671524, "step": 4125, "valid_targets_mean": 3575.5, "valid_targets_min": 829 }, { "epoch": 6.715447154471545, "grad_norm": 0.44330650995397963, "learning_rate": 2.0336138126417994e-07, "loss": 0.1467, "loss_nan_ranks": 0, "loss_rank_avg": 0.05584095045924187, "step": 4130, "valid_targets_mean": 5482.6, "valid_targets_min": 942 }, { "epoch": 6.723577235772358, "grad_norm": 0.5119468559996024, "learning_rate": 1.9198914539849455e-07, "loss": 0.1337, "loss_nan_ranks": 0, "loss_rank_avg": 0.07401560246944427, "step": 4135, "valid_targets_mean": 7082.9, "valid_targets_min": 691 }, { "epoch": 6.7317073170731705, "grad_norm": 0.5249108227392534, "learning_rate": 1.8094256681313593e-07, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.0827220231294632, "step": 4140, "valid_targets_mean": 5094.2, "valid_targets_min": 719 }, { "epoch": 6.739837398373984, "grad_norm": 0.4495364105204827, "learning_rate": 1.702218271214262e-07, "loss": 0.1377, "loss_nan_ranks": 0, "loss_rank_avg": 0.1008179783821106, "step": 4145, "valid_targets_mean": 6540.8, "valid_targets_min": 1350 }, { "epoch": 6.747967479674797, "grad_norm": 0.6030073637414436, "learning_rate": 1.598271025796816e-07, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.05886147543787956, "step": 4150, "valid_targets_mean": 3254.4, "valid_targets_min": 885 }, { "epoch": 6.7560975609756095, "grad_norm": 0.5871020155634131, "learning_rate": 1.4975856408429912e-07, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.09096332639455795, "step": 4155, "valid_targets_mean": 5843.1, "valid_targets_min": 1355 }, { "epoch": 6.764227642276423, "grad_norm": 0.46246696208880583, "learning_rate": 1.4001637716895445e-07, "loss": 0.1441, "loss_nan_ranks": 0, "loss_rank_avg": 0.046735212206840515, "step": 4160, "valid_targets_mean": 4893.9, "valid_targets_min": 1704 }, { "epoch": 6.772357723577236, "grad_norm": 0.4694362534443668, "learning_rate": 1.3060070200188179e-07, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.07222121953964233, "step": 4165, "valid_targets_mean": 6710.2, "valid_targets_min": 1205 }, { "epoch": 6.780487804878049, "grad_norm": 0.4947694554035908, "learning_rate": 1.215116933832361e-07, "loss": 0.1288, "loss_nan_ranks": 0, "loss_rank_avg": 0.06739296019077301, "step": 4170, "valid_targets_mean": 4189.8, "valid_targets_min": 1452 }, { "epoch": 6.788617886178862, "grad_norm": 0.5225895943348434, "learning_rate": 1.1274950074255053e-07, "loss": 0.1264, "loss_nan_ranks": 0, "loss_rank_avg": 0.062162332236766815, "step": 4175, "valid_targets_mean": 4134.5, "valid_targets_min": 1576 }, { "epoch": 6.796747967479675, "grad_norm": 0.4640767809543489, "learning_rate": 1.0431426813628298e-07, "loss": 0.1445, "loss_nan_ranks": 0, "loss_rank_avg": 0.05863991379737854, "step": 4180, "valid_targets_mean": 4159.4, "valid_targets_min": 1530 }, { "epoch": 6.804878048780488, "grad_norm": 0.5113628508634667, "learning_rate": 9.62061342454379e-08, "loss": 0.1417, "loss_nan_ranks": 0, "loss_rank_avg": 0.05690145492553711, "step": 4185, "valid_targets_mean": 5318.1, "valid_targets_min": 1401 }, { "epoch": 6.8130081300813, "grad_norm": 0.5272021984897712, "learning_rate": 8.842523237329925e-08, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.07422936707735062, "step": 4190, "valid_targets_mean": 4156.2, "valid_targets_min": 1188 }, { "epoch": 6.821138211382114, "grad_norm": 0.5070110218380924, "learning_rate": 8.097169044322561e-08, "loss": 0.1353, "loss_nan_ranks": 0, "loss_rank_avg": 0.07301990687847137, "step": 4195, "valid_targets_mean": 6095.6, "valid_targets_min": 1064 }, { "epoch": 6.829268292682927, "grad_norm": 0.5135907171507096, "learning_rate": 7.38456309965585e-08, "loss": 0.1467, "loss_nan_ranks": 0, "loss_rank_avg": 0.08123864233493805, "step": 4200, "valid_targets_mean": 6417.5, "valid_targets_min": 1919 }, { "epoch": 6.83739837398374, "grad_norm": 0.5134073522886069, "learning_rate": 6.7047171190604e-08, "loss": 0.1382, "loss_nan_ranks": 0, "loss_rank_avg": 0.08525604754686356, "step": 4205, "valid_targets_mean": 6880.0, "valid_targets_min": 1722 }, { "epoch": 6.845528455284553, "grad_norm": 0.5709205723526362, "learning_rate": 6.057642279669874e-08, "loss": 0.1403, "loss_nan_ranks": 0, "loss_rank_avg": 0.07911784946918488, "step": 4210, "valid_targets_mean": 5972.6, "valid_targets_min": 1329 }, { "epoch": 6.853658536585366, "grad_norm": 0.5907167020531751, "learning_rate": 5.4433492198386895e-08, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.07390086352825165, "step": 4215, "valid_targets_mean": 5442.9, "valid_targets_min": 1270 }, { "epoch": 6.861788617886178, "grad_norm": 0.5367609462420859, "learning_rate": 4.861848038965722e-08, "loss": 0.1436, "loss_nan_ranks": 0, "loss_rank_avg": 0.08721356093883514, "step": 4220, "valid_targets_mean": 5648.6, "valid_targets_min": 1930 }, { "epoch": 6.869918699186992, "grad_norm": 0.4807256951021462, "learning_rate": 4.313148297328873e-08, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.05554955452680588, "step": 4225, "valid_targets_mean": 4789.0, "valid_targets_min": 484 }, { "epoch": 6.878048780487805, "grad_norm": 0.48597528746316876, "learning_rate": 3.797259015928534e-08, "loss": 0.1293, "loss_nan_ranks": 0, "loss_rank_avg": 0.08914779871702194, "step": 4230, "valid_targets_mean": 7303.0, "valid_targets_min": 1005 }, { "epoch": 6.886178861788618, "grad_norm": 0.6424700552312324, "learning_rate": 3.314188676338148e-08, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.07850663363933563, "step": 4235, "valid_targets_mean": 4603.0, "valid_targets_min": 1167 }, { "epoch": 6.894308943089431, "grad_norm": 0.6000297335645017, "learning_rate": 2.863945220565434e-08, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.05064990371465683, "step": 4240, "valid_targets_mean": 2443.1, "valid_targets_min": 1117 }, { "epoch": 6.902439024390244, "grad_norm": 0.8593534803222749, "learning_rate": 2.4465360509211555e-08, "loss": 0.1346, "loss_nan_ranks": 0, "loss_rank_avg": 0.05758367478847504, "step": 4245, "valid_targets_mean": 4781.9, "valid_targets_min": 627 }, { "epoch": 6.9105691056910565, "grad_norm": 0.4766491724568221, "learning_rate": 2.0619680298983313e-08, "loss": 0.1339, "loss_nan_ranks": 0, "loss_rank_avg": 0.09008824825286865, "step": 4250, "valid_targets_mean": 6260.6, "valid_targets_min": 1378 }, { "epoch": 6.91869918699187, "grad_norm": 0.5745428938529575, "learning_rate": 1.7102474800592128e-08, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.06578895449638367, "step": 4255, "valid_targets_mean": 4985.1, "valid_targets_min": 2101 }, { "epoch": 6.926829268292683, "grad_norm": 0.505947880091739, "learning_rate": 1.3913801839307017e-08, "loss": 0.1382, "loss_nan_ranks": 0, "loss_rank_avg": 0.06309238076210022, "step": 4260, "valid_targets_mean": 3601.9, "valid_targets_min": 1374 }, { "epoch": 6.934959349593496, "grad_norm": 0.4862231953156758, "learning_rate": 1.105371383909759e-08, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.08454480767250061, "step": 4265, "valid_targets_mean": 5506.6, "valid_targets_min": 1091 }, { "epoch": 6.943089430894309, "grad_norm": 0.6257612208316857, "learning_rate": 8.522257821770296e-09, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.056995876133441925, "step": 4270, "valid_targets_mean": 2835.4, "valid_targets_min": 1005 }, { "epoch": 6.951219512195122, "grad_norm": 0.49445438205373704, "learning_rate": 6.319475406200148e-09, "loss": 0.1429, "loss_nan_ranks": 0, "loss_rank_avg": 0.058740273118019104, "step": 4275, "valid_targets_mean": 5342.2, "valid_targets_min": 1527 }, { "epoch": 6.959349593495935, "grad_norm": 0.47126210521609696, "learning_rate": 4.445402807637944e-09, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.07837090641260147, "step": 4280, "valid_targets_mean": 6361.8, "valid_targets_min": 2564 }, { "epoch": 6.967479674796748, "grad_norm": 0.521579117805132, "learning_rate": 2.9000708371240695e-09, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.09207534790039062, "step": 4285, "valid_targets_mean": 5779.9, "valid_targets_min": 1122 }, { "epoch": 6.975609756097561, "grad_norm": 0.5972935543752566, "learning_rate": 1.6835049009755745e-09, "loss": 0.1302, "loss_nan_ranks": 0, "loss_rank_avg": 0.040843117982149124, "step": 4290, "valid_targets_mean": 2254.1, "valid_targets_min": 972 }, { "epoch": 6.983739837398374, "grad_norm": 0.43801218688294546, "learning_rate": 7.9572500036873e-10, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.045577868819236755, "step": 4295, "valid_targets_mean": 4745.5, "valid_targets_min": 570 }, { "epoch": 6.991869918699187, "grad_norm": 0.6040499813695474, "learning_rate": 2.367457310170629e-10, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.05143870413303375, "step": 4300, "valid_targets_mean": 2775.6, "valid_targets_min": 933 }, { "epoch": 7.0, "grad_norm": 0.5643379353921059, "learning_rate": 6.5762829204452095e-12, "loss": 0.134, "loss_nan_ranks": 0, "loss_rank_avg": 0.08443116396665573, "step": 4305, "valid_targets_mean": 4994.4, "valid_targets_min": 1365 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.08443116396665573, "step": 4305, "total_flos": 1.4965206994208686e+18, "train_loss": 0.19276038985634514, "train_runtime": 135959.8594, "train_samples_per_second": 0.506, "train_steps_per_second": 0.032, "valid_targets_mean": 4994.4, "valid_targets_min": 1365 } ], "logging_steps": 5, "max_steps": 4305, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 200, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1.4965206994208686e+18, "train_batch_size": 1, "trial_name": null, "trial_params": null }