{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 6.999053926206244, "eval_steps": 500, "global_step": 3702, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.00946073793755913, "grad_norm": 13.292386854280902, "learning_rate": 4.3126684636118604e-07, "loss": 0.6679, "loss_nan_ranks": 0, "loss_rank_avg": 0.3716040849685669, "step": 5, "valid_targets_mean": 5111.2, "valid_targets_min": 2497 }, { "epoch": 0.01892147587511826, "grad_norm": 12.976120695301127, "learning_rate": 9.703504043126686e-07, "loss": 0.6941, "loss_nan_ranks": 0, "loss_rank_avg": 0.35731813311576843, "step": 10, "valid_targets_mean": 6041.9, "valid_targets_min": 2037 }, { "epoch": 0.02838221381267739, "grad_norm": 10.94543088614748, "learning_rate": 1.509433962264151e-06, "loss": 0.6462, "loss_nan_ranks": 0, "loss_rank_avg": 0.3353500962257385, "step": 15, "valid_targets_mean": 7048.9, "valid_targets_min": 4111 }, { "epoch": 0.03784295175023652, "grad_norm": 6.852368736442926, "learning_rate": 2.0485175202156334e-06, "loss": 0.6181, "loss_nan_ranks": 0, "loss_rank_avg": 0.3063059449195862, "step": 20, "valid_targets_mean": 5856.1, "valid_targets_min": 1539 }, { "epoch": 0.04730368968779565, "grad_norm": 5.3977018080734664, "learning_rate": 2.587601078167116e-06, "loss": 0.5614, "loss_nan_ranks": 0, "loss_rank_avg": 0.2615411579608917, "step": 25, "valid_targets_mean": 5350.4, "valid_targets_min": 3761 }, { "epoch": 0.05676442762535478, "grad_norm": 5.111568881695973, "learning_rate": 3.126684636118599e-06, "loss": 0.5349, "loss_nan_ranks": 0, "loss_rank_avg": 0.26117661595344543, "step": 30, "valid_targets_mean": 5490.1, "valid_targets_min": 3061 }, { "epoch": 0.06622516556291391, "grad_norm": 2.365906594146852, "learning_rate": 3.665768194070081e-06, "loss": 0.4884, "loss_nan_ranks": 0, "loss_rank_avg": 0.2334306240081787, "step": 35, "valid_targets_mean": 4899.1, "valid_targets_min": 3363 }, { "epoch": 0.07568590350047304, "grad_norm": 1.5154295873967274, "learning_rate": 4.204851752021563e-06, "loss": 0.4499, "loss_nan_ranks": 0, "loss_rank_avg": 0.2000514566898346, "step": 40, "valid_targets_mean": 6593.0, "valid_targets_min": 4641 }, { "epoch": 0.08514664143803216, "grad_norm": 1.0580075894605687, "learning_rate": 4.7439353099730466e-06, "loss": 0.4271, "loss_nan_ranks": 0, "loss_rank_avg": 0.20875361561775208, "step": 45, "valid_targets_mean": 5423.5, "valid_targets_min": 2180 }, { "epoch": 0.0946073793755913, "grad_norm": 0.8888840325402044, "learning_rate": 5.283018867924529e-06, "loss": 0.405, "loss_nan_ranks": 0, "loss_rank_avg": 0.1873297393321991, "step": 50, "valid_targets_mean": 4690.0, "valid_targets_min": 2271 }, { "epoch": 0.10406811731315042, "grad_norm": 0.8025966922773096, "learning_rate": 5.822102425876012e-06, "loss": 0.4054, "loss_nan_ranks": 0, "loss_rank_avg": 0.1847410500049591, "step": 55, "valid_targets_mean": 4564.8, "valid_targets_min": 2231 }, { "epoch": 0.11352885525070956, "grad_norm": 0.6830098620481699, "learning_rate": 6.3611859838274934e-06, "loss": 0.3772, "loss_nan_ranks": 0, "loss_rank_avg": 0.2122303694486618, "step": 60, "valid_targets_mean": 5382.4, "valid_targets_min": 3694 }, { "epoch": 0.12298959318826869, "grad_norm": 0.6468269510795552, "learning_rate": 6.9002695417789766e-06, "loss": 0.3941, "loss_nan_ranks": 0, "loss_rank_avg": 0.21036577224731445, "step": 65, "valid_targets_mean": 5506.9, "valid_targets_min": 2545 }, { "epoch": 0.13245033112582782, "grad_norm": 0.7269588227001985, "learning_rate": 7.439353099730459e-06, "loss": 0.3786, "loss_nan_ranks": 0, "loss_rank_avg": 0.2026107907295227, "step": 70, "valid_targets_mean": 4666.8, "valid_targets_min": 802 }, { "epoch": 0.14191106906338694, "grad_norm": 0.5464115365342573, "learning_rate": 7.978436657681942e-06, "loss": 0.386, "loss_nan_ranks": 0, "loss_rank_avg": 0.2121516317129135, "step": 75, "valid_targets_mean": 6398.2, "valid_targets_min": 3254 }, { "epoch": 0.15137180700094607, "grad_norm": 0.4679041488767007, "learning_rate": 8.517520215633423e-06, "loss": 0.3615, "loss_nan_ranks": 0, "loss_rank_avg": 0.17857977747917175, "step": 80, "valid_targets_mean": 7090.0, "valid_targets_min": 5052 }, { "epoch": 0.1608325449385052, "grad_norm": 0.5071840524513592, "learning_rate": 9.056603773584907e-06, "loss": 0.3474, "loss_nan_ranks": 0, "loss_rank_avg": 0.16061782836914062, "step": 85, "valid_targets_mean": 5421.2, "valid_targets_min": 4155 }, { "epoch": 0.17029328287606432, "grad_norm": 0.48784327498178953, "learning_rate": 9.595687331536388e-06, "loss": 0.3496, "loss_nan_ranks": 0, "loss_rank_avg": 0.17591124773025513, "step": 90, "valid_targets_mean": 6018.5, "valid_targets_min": 3622 }, { "epoch": 0.17975402081362346, "grad_norm": 0.581900644799806, "learning_rate": 1.0134770889487871e-05, "loss": 0.3459, "loss_nan_ranks": 0, "loss_rank_avg": 0.16716624796390533, "step": 95, "valid_targets_mean": 5178.4, "valid_targets_min": 2243 }, { "epoch": 0.1892147587511826, "grad_norm": 0.5846177681039163, "learning_rate": 1.0673854447439354e-05, "loss": 0.3315, "loss_nan_ranks": 0, "loss_rank_avg": 0.15679748356342316, "step": 100, "valid_targets_mean": 4752.1, "valid_targets_min": 2315 }, { "epoch": 0.1986754966887417, "grad_norm": 0.4995428447108845, "learning_rate": 1.1212938005390836e-05, "loss": 0.3175, "loss_nan_ranks": 0, "loss_rank_avg": 0.1597537100315094, "step": 105, "valid_targets_mean": 5816.5, "valid_targets_min": 4068 }, { "epoch": 0.20813623462630085, "grad_norm": 0.4479628789945412, "learning_rate": 1.1752021563342319e-05, "loss": 0.315, "loss_nan_ranks": 0, "loss_rank_avg": 0.13424637913703918, "step": 110, "valid_targets_mean": 6035.2, "valid_targets_min": 2868 }, { "epoch": 0.21759697256385999, "grad_norm": 0.4837864823725436, "learning_rate": 1.2291105121293802e-05, "loss": 0.314, "loss_nan_ranks": 0, "loss_rank_avg": 0.145084410905838, "step": 115, "valid_targets_mean": 5793.4, "valid_targets_min": 1596 }, { "epoch": 0.22705771050141912, "grad_norm": 0.44889049614325, "learning_rate": 1.2830188679245283e-05, "loss": 0.3122, "loss_nan_ranks": 0, "loss_rank_avg": 0.16734957695007324, "step": 120, "valid_targets_mean": 7349.1, "valid_targets_min": 5043 }, { "epoch": 0.23651844843897823, "grad_norm": 0.5223670515741717, "learning_rate": 1.3369272237196767e-05, "loss": 0.3124, "loss_nan_ranks": 0, "loss_rank_avg": 0.16438248753547668, "step": 125, "valid_targets_mean": 6178.2, "valid_targets_min": 3920 }, { "epoch": 0.24597918637653737, "grad_norm": 0.5321194979031634, "learning_rate": 1.390835579514825e-05, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.16952776908874512, "step": 130, "valid_targets_mean": 5167.1, "valid_targets_min": 2006 }, { "epoch": 0.2554399243140965, "grad_norm": 0.4835554531647342, "learning_rate": 1.4447439353099733e-05, "loss": 0.2976, "loss_nan_ranks": 0, "loss_rank_avg": 0.16980065405368805, "step": 135, "valid_targets_mean": 7014.2, "valid_targets_min": 4174 }, { "epoch": 0.26490066225165565, "grad_norm": 0.5105644710675021, "learning_rate": 1.4986522911051213e-05, "loss": 0.3204, "loss_nan_ranks": 0, "loss_rank_avg": 0.1570666879415512, "step": 140, "valid_targets_mean": 5961.8, "valid_targets_min": 3944 }, { "epoch": 0.27436140018921473, "grad_norm": 0.5169522126281623, "learning_rate": 1.5525606469002698e-05, "loss": 0.3139, "loss_nan_ranks": 0, "loss_rank_avg": 0.141907200217247, "step": 145, "valid_targets_mean": 4846.5, "valid_targets_min": 770 }, { "epoch": 0.28382213812677387, "grad_norm": 0.5685567387490885, "learning_rate": 1.606469002695418e-05, "loss": 0.2948, "loss_nan_ranks": 0, "loss_rank_avg": 0.16263222694396973, "step": 150, "valid_targets_mean": 5686.2, "valid_targets_min": 1786 }, { "epoch": 0.293282876064333, "grad_norm": 0.5517286923292966, "learning_rate": 1.6603773584905664e-05, "loss": 0.3139, "loss_nan_ranks": 0, "loss_rank_avg": 0.16692663729190826, "step": 155, "valid_targets_mean": 7328.5, "valid_targets_min": 3874 }, { "epoch": 0.30274361400189215, "grad_norm": 0.5473844718628933, "learning_rate": 1.7142857142857142e-05, "loss": 0.3036, "loss_nan_ranks": 0, "loss_rank_avg": 0.14560210704803467, "step": 160, "valid_targets_mean": 5436.2, "valid_targets_min": 2790 }, { "epoch": 0.3122043519394513, "grad_norm": 0.5176673018224341, "learning_rate": 1.7681940700808627e-05, "loss": 0.2961, "loss_nan_ranks": 0, "loss_rank_avg": 0.1517486870288849, "step": 165, "valid_targets_mean": 6114.5, "valid_targets_min": 3759 }, { "epoch": 0.3216650898770104, "grad_norm": 0.5490412433918316, "learning_rate": 1.8221024258760108e-05, "loss": 0.2951, "loss_nan_ranks": 0, "loss_rank_avg": 0.16231662034988403, "step": 170, "valid_targets_mean": 5257.4, "valid_targets_min": 1685 }, { "epoch": 0.33112582781456956, "grad_norm": 0.6410599828811149, "learning_rate": 1.8760107816711593e-05, "loss": 0.2955, "loss_nan_ranks": 0, "loss_rank_avg": 0.1378370225429535, "step": 175, "valid_targets_mean": 5678.0, "valid_targets_min": 1733 }, { "epoch": 0.34058656575212864, "grad_norm": 0.5033919157641096, "learning_rate": 1.9299191374663074e-05, "loss": 0.3137, "loss_nan_ranks": 0, "loss_rank_avg": 0.1563076674938202, "step": 180, "valid_targets_mean": 6886.4, "valid_targets_min": 5241 }, { "epoch": 0.3500473036896878, "grad_norm": 0.5392935569955783, "learning_rate": 1.9838274932614556e-05, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.14293016493320465, "step": 185, "valid_targets_mean": 5918.0, "valid_targets_min": 2193 }, { "epoch": 0.3595080416272469, "grad_norm": 0.6472564298900539, "learning_rate": 2.037735849056604e-05, "loss": 0.2987, "loss_nan_ranks": 0, "loss_rank_avg": 0.15237551927566528, "step": 190, "valid_targets_mean": 4608.6, "valid_targets_min": 2221 }, { "epoch": 0.36896877956480606, "grad_norm": 0.523153782721405, "learning_rate": 2.0916442048517522e-05, "loss": 0.294, "loss_nan_ranks": 0, "loss_rank_avg": 0.1513247787952423, "step": 195, "valid_targets_mean": 5764.5, "valid_targets_min": 2296 }, { "epoch": 0.3784295175023652, "grad_norm": 0.469616501289577, "learning_rate": 2.1455525606469007e-05, "loss": 0.2792, "loss_nan_ranks": 0, "loss_rank_avg": 0.1403075009584427, "step": 200, "valid_targets_mean": 6505.8, "valid_targets_min": 4664 }, { "epoch": 0.38789025543992434, "grad_norm": 0.5985188869226783, "learning_rate": 2.199460916442049e-05, "loss": 0.2952, "loss_nan_ranks": 0, "loss_rank_avg": 0.14567717909812927, "step": 205, "valid_targets_mean": 4861.4, "valid_targets_min": 1942 }, { "epoch": 0.3973509933774834, "grad_norm": 0.5326077341773564, "learning_rate": 2.253369272237197e-05, "loss": 0.3083, "loss_nan_ranks": 0, "loss_rank_avg": 0.1557682603597641, "step": 210, "valid_targets_mean": 5819.1, "valid_targets_min": 2582 }, { "epoch": 0.40681173131504256, "grad_norm": 0.5326693796335378, "learning_rate": 2.307277628032345e-05, "loss": 0.2832, "loss_nan_ranks": 0, "loss_rank_avg": 0.14654016494750977, "step": 215, "valid_targets_mean": 5031.5, "valid_targets_min": 2136 }, { "epoch": 0.4162724692526017, "grad_norm": 0.5314292194307515, "learning_rate": 2.3611859838274933e-05, "loss": 0.2803, "loss_nan_ranks": 0, "loss_rank_avg": 0.14354923367500305, "step": 220, "valid_targets_mean": 6880.5, "valid_targets_min": 4200 }, { "epoch": 0.42573320719016083, "grad_norm": 0.6305540146764549, "learning_rate": 2.4150943396226418e-05, "loss": 0.3098, "loss_nan_ranks": 0, "loss_rank_avg": 0.1796898990869522, "step": 225, "valid_targets_mean": 6977.6, "valid_targets_min": 4666 }, { "epoch": 0.43519394512771997, "grad_norm": 0.5230649535123192, "learning_rate": 2.46900269541779e-05, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.11889778077602386, "step": 230, "valid_targets_mean": 4415.1, "valid_targets_min": 1499 }, { "epoch": 0.4446546830652791, "grad_norm": 0.4766065436527936, "learning_rate": 2.5229110512129384e-05, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.1293986439704895, "step": 235, "valid_targets_mean": 6849.5, "valid_targets_min": 3405 }, { "epoch": 0.45411542100283825, "grad_norm": 0.48511924294158426, "learning_rate": 2.5768194070080865e-05, "loss": 0.2755, "loss_nan_ranks": 0, "loss_rank_avg": 0.14730864763259888, "step": 240, "valid_targets_mean": 6809.1, "valid_targets_min": 4854 }, { "epoch": 0.46357615894039733, "grad_norm": 0.5187932119629264, "learning_rate": 2.6307277628032347e-05, "loss": 0.2674, "loss_nan_ranks": 0, "loss_rank_avg": 0.18547989428043365, "step": 245, "valid_targets_mean": 5634.8, "valid_targets_min": 1005 }, { "epoch": 0.47303689687795647, "grad_norm": 0.5491633455944653, "learning_rate": 2.684636118598383e-05, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.1189369261264801, "step": 250, "valid_targets_mean": 4453.9, "valid_targets_min": 2453 }, { "epoch": 0.4824976348155156, "grad_norm": 0.5668350991526823, "learning_rate": 2.7385444743935313e-05, "loss": 0.2703, "loss_nan_ranks": 0, "loss_rank_avg": 0.14132535457611084, "step": 255, "valid_targets_mean": 5330.2, "valid_targets_min": 4411 }, { "epoch": 0.49195837275307475, "grad_norm": 0.6537132489951805, "learning_rate": 2.7924528301886794e-05, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.14046913385391235, "step": 260, "valid_targets_mean": 4396.1, "valid_targets_min": 2557 }, { "epoch": 0.5014191106906338, "grad_norm": 0.539558133701292, "learning_rate": 2.8463611859838276e-05, "loss": 0.2727, "loss_nan_ranks": 0, "loss_rank_avg": 0.12411429733037949, "step": 265, "valid_targets_mean": 4548.0, "valid_targets_min": 1822 }, { "epoch": 0.510879848628193, "grad_norm": 0.6355091138525413, "learning_rate": 2.9002695417789757e-05, "loss": 0.2786, "loss_nan_ranks": 0, "loss_rank_avg": 0.13668765127658844, "step": 270, "valid_targets_mean": 4930.8, "valid_targets_min": 2156 }, { "epoch": 0.5203405865657521, "grad_norm": 0.6045780561492375, "learning_rate": 2.9541778975741242e-05, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.15746136009693146, "step": 275, "valid_targets_mean": 4315.5, "valid_targets_min": 953 }, { "epoch": 0.5298013245033113, "grad_norm": 0.517544515682634, "learning_rate": 3.0080862533692724e-05, "loss": 0.2698, "loss_nan_ranks": 0, "loss_rank_avg": 0.13427172601222992, "step": 280, "valid_targets_mean": 6005.6, "valid_targets_min": 4778 }, { "epoch": 0.5392620624408704, "grad_norm": 0.5242395110498128, "learning_rate": 3.061994609164421e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.17519372701644897, "step": 285, "valid_targets_mean": 6570.9, "valid_targets_min": 1759 }, { "epoch": 0.5487228003784295, "grad_norm": 0.5371360158794343, "learning_rate": 3.115902964959569e-05, "loss": 0.2632, "loss_nan_ranks": 0, "loss_rank_avg": 0.12191037833690643, "step": 290, "valid_targets_mean": 5542.8, "valid_targets_min": 2077 }, { "epoch": 0.5581835383159887, "grad_norm": 0.4852881118368173, "learning_rate": 3.169811320754717e-05, "loss": 0.2718, "loss_nan_ranks": 0, "loss_rank_avg": 0.14533182978630066, "step": 295, "valid_targets_mean": 6815.5, "valid_targets_min": 5442 }, { "epoch": 0.5676442762535477, "grad_norm": 0.5631185669619292, "learning_rate": 3.223719676549865e-05, "loss": 0.261, "loss_nan_ranks": 0, "loss_rank_avg": 0.16672319173812866, "step": 300, "valid_targets_mean": 6902.6, "valid_targets_min": 2676 }, { "epoch": 0.5771050141911069, "grad_norm": 0.5415919755101368, "learning_rate": 3.2776280323450134e-05, "loss": 0.2718, "loss_nan_ranks": 0, "loss_rank_avg": 0.13607017695903778, "step": 305, "valid_targets_mean": 5954.1, "valid_targets_min": 2974 }, { "epoch": 0.586565752128666, "grad_norm": 0.543397988361979, "learning_rate": 3.3315363881401616e-05, "loss": 0.2567, "loss_nan_ranks": 0, "loss_rank_avg": 0.17378760874271393, "step": 310, "valid_targets_mean": 6095.9, "valid_targets_min": 863 }, { "epoch": 0.5960264900662252, "grad_norm": 0.49985231481941134, "learning_rate": 3.3854447439353104e-05, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.11618228256702423, "step": 315, "valid_targets_mean": 6216.5, "valid_targets_min": 3483 }, { "epoch": 0.6054872280037843, "grad_norm": 0.46620526718099603, "learning_rate": 3.4393530997304585e-05, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.10228373855352402, "step": 320, "valid_targets_mean": 6214.8, "valid_targets_min": 4465 }, { "epoch": 0.6149479659413434, "grad_norm": 0.47078096185272866, "learning_rate": 3.493261455525607e-05, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.14976316690444946, "step": 325, "valid_targets_mean": 5927.4, "valid_targets_min": 1832 }, { "epoch": 0.6244087038789026, "grad_norm": 0.4726439579386601, "learning_rate": 3.547169811320755e-05, "loss": 0.2559, "loss_nan_ranks": 0, "loss_rank_avg": 0.11369471251964569, "step": 330, "valid_targets_mean": 6614.4, "valid_targets_min": 3123 }, { "epoch": 0.6338694418164617, "grad_norm": 0.5320768196095412, "learning_rate": 3.6010781671159037e-05, "loss": 0.2505, "loss_nan_ranks": 0, "loss_rank_avg": 0.1185142993927002, "step": 335, "valid_targets_mean": 5876.6, "valid_targets_min": 3191 }, { "epoch": 0.6433301797540208, "grad_norm": 0.575530878563886, "learning_rate": 3.654986522911052e-05, "loss": 0.2669, "loss_nan_ranks": 0, "loss_rank_avg": 0.1460418999195099, "step": 340, "valid_targets_mean": 5636.5, "valid_targets_min": 2726 }, { "epoch": 0.6527909176915799, "grad_norm": 0.5147665527633908, "learning_rate": 3.708894878706199e-05, "loss": 0.2557, "loss_nan_ranks": 0, "loss_rank_avg": 0.1212029904127121, "step": 345, "valid_targets_mean": 5861.5, "valid_targets_min": 2541 }, { "epoch": 0.6622516556291391, "grad_norm": 0.5595903582250489, "learning_rate": 3.762803234501348e-05, "loss": 0.2786, "loss_nan_ranks": 0, "loss_rank_avg": 0.16101306676864624, "step": 350, "valid_targets_mean": 6207.0, "valid_targets_min": 2967 }, { "epoch": 0.6717123935666982, "grad_norm": 0.5018111369885371, "learning_rate": 3.816711590296496e-05, "loss": 0.276, "loss_nan_ranks": 0, "loss_rank_avg": 0.10931664705276489, "step": 355, "valid_targets_mean": 4495.9, "valid_targets_min": 3049 }, { "epoch": 0.6811731315042573, "grad_norm": 0.5359690061267144, "learning_rate": 3.8706199460916444e-05, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.11740469187498093, "step": 360, "valid_targets_mean": 5280.0, "valid_targets_min": 1868 }, { "epoch": 0.6906338694418165, "grad_norm": 0.5193656060152103, "learning_rate": 3.9245283018867925e-05, "loss": 0.2627, "loss_nan_ranks": 0, "loss_rank_avg": 0.13573291897773743, "step": 365, "valid_targets_mean": 6098.8, "valid_targets_min": 3118 }, { "epoch": 0.7000946073793756, "grad_norm": 0.49067627735159125, "learning_rate": 3.9784366576819413e-05, "loss": 0.2548, "loss_nan_ranks": 0, "loss_rank_avg": 0.13638558983802795, "step": 370, "valid_targets_mean": 6597.8, "valid_targets_min": 4328 }, { "epoch": 0.7095553453169348, "grad_norm": 0.4717473773346668, "learning_rate": 3.999991999226427e-05, "loss": 0.2605, "loss_nan_ranks": 0, "loss_rank_avg": 0.10433489084243774, "step": 375, "valid_targets_mean": 6252.5, "valid_targets_min": 3697 }, { "epoch": 0.7190160832544938, "grad_norm": 0.5221922736723413, "learning_rate": 3.9999431058419585e-05, "loss": 0.2661, "loss_nan_ranks": 0, "loss_rank_avg": 0.10979779809713364, "step": 380, "valid_targets_mean": 5049.9, "valid_targets_min": 1939 }, { "epoch": 0.7284768211920529, "grad_norm": 0.4484218939396918, "learning_rate": 3.999849765032536e-05, "loss": 0.2544, "loss_nan_ranks": 0, "loss_rank_avg": 0.11232994496822357, "step": 385, "valid_targets_mean": 6655.4, "valid_targets_min": 980 }, { "epoch": 0.7379375591296121, "grad_norm": 0.5274283464918212, "learning_rate": 3.999711978872596e-05, "loss": 0.2503, "loss_nan_ranks": 0, "loss_rank_avg": 0.14474813640117645, "step": 390, "valid_targets_mean": 6887.2, "valid_targets_min": 4247 }, { "epoch": 0.7473982970671712, "grad_norm": 0.5017473030214095, "learning_rate": 3.9995297504243475e-05, "loss": 0.2553, "loss_nan_ranks": 0, "loss_rank_avg": 0.12366019934415817, "step": 395, "valid_targets_mean": 5045.4, "valid_targets_min": 1967 }, { "epoch": 0.7568590350047304, "grad_norm": 0.4797605012842134, "learning_rate": 3.9993030837376985e-05, "loss": 0.2556, "loss_nan_ranks": 0, "loss_rank_avg": 0.12161791324615479, "step": 400, "valid_targets_mean": 5767.5, "valid_targets_min": 3755 }, { "epoch": 0.7663197729422895, "grad_norm": 0.5591748230420274, "learning_rate": 3.999031983850166e-05, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.13065151870250702, "step": 405, "valid_targets_mean": 4916.5, "valid_targets_min": 2663 }, { "epoch": 0.7757805108798487, "grad_norm": 0.5768281800754327, "learning_rate": 3.9987164567867677e-05, "loss": 0.2495, "loss_nan_ranks": 0, "loss_rank_avg": 0.12214967608451843, "step": 410, "valid_targets_mean": 6337.4, "valid_targets_min": 4123 }, { "epoch": 0.7852412488174078, "grad_norm": 0.565949691954824, "learning_rate": 3.998356509559886e-05, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.17523278295993805, "step": 415, "valid_targets_mean": 7005.5, "valid_targets_min": 2171 }, { "epoch": 0.7947019867549668, "grad_norm": 0.5329664506953494, "learning_rate": 3.997952150169114e-05, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.13902133703231812, "step": 420, "valid_targets_mean": 5315.2, "valid_targets_min": 1666 }, { "epoch": 0.804162724692526, "grad_norm": 0.43499678564104083, "learning_rate": 3.997503387601071e-05, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.10180394351482391, "step": 425, "valid_targets_mean": 6322.8, "valid_targets_min": 4931 }, { "epoch": 0.8136234626300851, "grad_norm": 0.5283450256927239, "learning_rate": 3.9970102318292136e-05, "loss": 0.2636, "loss_nan_ranks": 0, "loss_rank_avg": 0.12599720060825348, "step": 430, "valid_targets_mean": 4579.4, "valid_targets_min": 1802 }, { "epoch": 0.8230842005676443, "grad_norm": 0.5213620926766653, "learning_rate": 3.996472693813604e-05, "loss": 0.2549, "loss_nan_ranks": 0, "loss_rank_avg": 0.10283877700567245, "step": 435, "valid_targets_mean": 5204.2, "valid_targets_min": 1539 }, { "epoch": 0.8325449385052034, "grad_norm": 0.5538525613580271, "learning_rate": 3.995890785500673e-05, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.17035773396492004, "step": 440, "valid_targets_mean": 5642.4, "valid_targets_min": 1934 }, { "epoch": 0.8420056764427626, "grad_norm": 0.5952043541599361, "learning_rate": 3.995264519822952e-05, "loss": 0.242, "loss_nan_ranks": 0, "loss_rank_avg": 0.12181451171636581, "step": 445, "valid_targets_mean": 6117.1, "valid_targets_min": 4919 }, { "epoch": 0.8514664143803217, "grad_norm": 0.6436408548808031, "learning_rate": 3.994593910698784e-05, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.11498317122459412, "step": 450, "valid_targets_mean": 4079.9, "valid_targets_min": 1209 }, { "epoch": 0.8609271523178808, "grad_norm": 0.5717709103219628, "learning_rate": 3.9938789730320184e-05, "loss": 0.2546, "loss_nan_ranks": 0, "loss_rank_avg": 0.12665092945098877, "step": 455, "valid_targets_mean": 5659.0, "valid_targets_min": 2717 }, { "epoch": 0.8703878902554399, "grad_norm": 0.5017091918547645, "learning_rate": 3.993119722711676e-05, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.11396554857492447, "step": 460, "valid_targets_mean": 5425.6, "valid_targets_min": 1864 }, { "epoch": 0.879848628192999, "grad_norm": 0.49964492415668416, "learning_rate": 3.9923161766115975e-05, "loss": 0.2463, "loss_nan_ranks": 0, "loss_rank_avg": 0.14272227883338928, "step": 465, "valid_targets_mean": 5635.0, "valid_targets_min": 2072 }, { "epoch": 0.8893093661305582, "grad_norm": 0.47619622508106707, "learning_rate": 3.991468352590069e-05, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.10488211363554001, "step": 470, "valid_targets_mean": 6403.9, "valid_targets_min": 4611 }, { "epoch": 0.8987701040681173, "grad_norm": 0.5493491032822436, "learning_rate": 3.990576269489424e-05, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.14750590920448303, "step": 475, "valid_targets_mean": 6374.0, "valid_targets_min": 3082 }, { "epoch": 0.9082308420056765, "grad_norm": 0.4929437751955924, "learning_rate": 3.9896399471356234e-05, "loss": 0.2475, "loss_nan_ranks": 0, "loss_rank_avg": 0.10722912847995758, "step": 480, "valid_targets_mean": 5189.4, "valid_targets_min": 1142 }, { "epoch": 0.9176915799432356, "grad_norm": 0.521230777881251, "learning_rate": 3.9886594063378185e-05, "loss": 0.2409, "loss_nan_ranks": 0, "loss_rank_avg": 0.12368421256542206, "step": 485, "valid_targets_mean": 7125.4, "valid_targets_min": 5267 }, { "epoch": 0.9271523178807947, "grad_norm": 0.501801100355575, "learning_rate": 3.987634668887887e-05, "loss": 0.2506, "loss_nan_ranks": 0, "loss_rank_avg": 0.1744682639837265, "step": 490, "valid_targets_mean": 6161.8, "valid_targets_min": 2821 }, { "epoch": 0.9366130558183539, "grad_norm": 0.565532137296215, "learning_rate": 3.986565757559945e-05, "loss": 0.2551, "loss_nan_ranks": 0, "loss_rank_avg": 0.11137732863426208, "step": 495, "valid_targets_mean": 5410.9, "valid_targets_min": 2383 }, { "epoch": 0.9460737937559129, "grad_norm": 0.4739992359384424, "learning_rate": 3.985452696109849e-05, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.12591904401779175, "step": 500, "valid_targets_mean": 5950.1, "valid_targets_min": 4596 }, { "epoch": 0.9555345316934721, "grad_norm": 0.4916133738725745, "learning_rate": 3.984295509274659e-05, "loss": 0.2455, "loss_nan_ranks": 0, "loss_rank_avg": 0.12242468446493149, "step": 505, "valid_targets_mean": 6121.0, "valid_targets_min": 3563 }, { "epoch": 0.9649952696310312, "grad_norm": 1.3514558105735277, "learning_rate": 3.983094222772094e-05, "loss": 0.2592, "loss_nan_ranks": 0, "loss_rank_avg": 0.14152546226978302, "step": 510, "valid_targets_mean": 5866.8, "valid_targets_min": 2482 }, { "epoch": 0.9744560075685903, "grad_norm": 0.47290691029164367, "learning_rate": 3.981848863299959e-05, "loss": 0.2541, "loss_nan_ranks": 0, "loss_rank_avg": 0.1114603728055954, "step": 515, "valid_targets_mean": 6109.9, "valid_targets_min": 3956 }, { "epoch": 0.9839167455061495, "grad_norm": 0.6155174685504273, "learning_rate": 3.9805594585355536e-05, "loss": 0.2472, "loss_nan_ranks": 0, "loss_rank_avg": 0.13362428545951843, "step": 520, "valid_targets_mean": 4292.6, "valid_targets_min": 1739 }, { "epoch": 0.9933774834437086, "grad_norm": 0.47493615981359083, "learning_rate": 3.9792260371350526e-05, "loss": 0.2472, "loss_nan_ranks": 0, "loss_rank_avg": 0.09970583021640778, "step": 525, "valid_targets_mean": 5427.1, "valid_targets_min": 2479 }, { "epoch": 1.0018921475875118, "grad_norm": 0.5624585903547664, "learning_rate": 3.977848628732872e-05, "loss": 0.2447, "loss_nan_ranks": 0, "loss_rank_avg": 0.11141172051429749, "step": 530, "valid_targets_mean": 4299.5, "valid_targets_min": 1091 }, { "epoch": 1.0113528855250709, "grad_norm": 0.5499877032447721, "learning_rate": 3.976427263941013e-05, "loss": 0.2268, "loss_nan_ranks": 0, "loss_rank_avg": 0.10701591521501541, "step": 535, "valid_targets_mean": 4795.1, "valid_targets_min": 920 }, { "epoch": 1.0208136234626302, "grad_norm": 0.4838371795926738, "learning_rate": 3.9749619743483754e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.12711255252361298, "step": 540, "valid_targets_mean": 6530.5, "valid_targets_min": 4416 }, { "epoch": 1.0302743614001892, "grad_norm": 0.5169768860706256, "learning_rate": 3.9734527925200594e-05, "loss": 0.2268, "loss_nan_ranks": 0, "loss_rank_avg": 0.11072207987308502, "step": 545, "valid_targets_mean": 5097.2, "valid_targets_min": 3049 }, { "epoch": 1.0397350993377483, "grad_norm": 0.4926699291142721, "learning_rate": 3.9718997519966444e-05, "loss": 0.244, "loss_nan_ranks": 0, "loss_rank_avg": 0.12459664046764374, "step": 550, "valid_targets_mean": 5628.1, "valid_targets_min": 2771 }, { "epoch": 1.0491958372753074, "grad_norm": 0.4966980686685516, "learning_rate": 3.970302887293437e-05, "loss": 0.2361, "loss_nan_ranks": 0, "loss_rank_avg": 0.11457451432943344, "step": 555, "valid_targets_mean": 5203.2, "valid_targets_min": 3449 }, { "epoch": 1.0586565752128667, "grad_norm": 0.5305519729560744, "learning_rate": 3.968662233899708e-05, "loss": 0.24, "loss_nan_ranks": 0, "loss_rank_avg": 0.12242069840431213, "step": 560, "valid_targets_mean": 5241.4, "valid_targets_min": 2249 }, { "epoch": 1.0681173131504258, "grad_norm": 0.5240554490130925, "learning_rate": 3.966977828277905e-05, "loss": 0.2398, "loss_nan_ranks": 0, "loss_rank_avg": 0.1389508992433548, "step": 565, "valid_targets_mean": 5881.6, "valid_targets_min": 2174 }, { "epoch": 1.0775780510879849, "grad_norm": 0.5289561091662918, "learning_rate": 3.96524970786284e-05, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.11946485936641693, "step": 570, "valid_targets_mean": 5437.6, "valid_targets_min": 3626 }, { "epoch": 1.087038789025544, "grad_norm": 0.5405317266225187, "learning_rate": 3.963477911060855e-05, "loss": 0.2445, "loss_nan_ranks": 0, "loss_rank_avg": 0.11820094287395477, "step": 575, "valid_targets_mean": 5014.4, "valid_targets_min": 2052 }, { "epoch": 1.096499526963103, "grad_norm": 0.500712987964929, "learning_rate": 3.961662477248973e-05, "loss": 0.2201, "loss_nan_ranks": 0, "loss_rank_avg": 0.09292806684970856, "step": 580, "valid_targets_mean": 5671.1, "valid_targets_min": 3119 }, { "epoch": 1.1059602649006623, "grad_norm": 0.5638466017332864, "learning_rate": 3.959803446774022e-05, "loss": 0.2526, "loss_nan_ranks": 0, "loss_rank_avg": 0.1443258821964264, "step": 585, "valid_targets_mean": 5097.2, "valid_targets_min": 1365 }, { "epoch": 1.1154210028382214, "grad_norm": 0.4867201503195808, "learning_rate": 3.957900860951736e-05, "loss": 0.2368, "loss_nan_ranks": 0, "loss_rank_avg": 0.13219431042671204, "step": 590, "valid_targets_mean": 6045.9, "valid_targets_min": 2643 }, { "epoch": 1.1248817407757805, "grad_norm": 0.4757816321592032, "learning_rate": 3.9559547620658366e-05, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.10074618458747864, "step": 595, "valid_targets_mean": 5344.8, "valid_targets_min": 2280 }, { "epoch": 1.1343424787133396, "grad_norm": 0.6128758775517067, "learning_rate": 3.9539651933670977e-05, "loss": 0.2495, "loss_nan_ranks": 0, "loss_rank_avg": 0.1107979565858841, "step": 600, "valid_targets_mean": 3639.5, "valid_targets_min": 467 }, { "epoch": 1.1438032166508987, "grad_norm": 0.5121856535536162, "learning_rate": 3.9519321990723796e-05, "loss": 0.2303, "loss_nan_ranks": 0, "loss_rank_avg": 0.11904571950435638, "step": 605, "valid_targets_mean": 6200.5, "valid_targets_min": 2171 }, { "epoch": 1.153263954588458, "grad_norm": 0.4762180442392512, "learning_rate": 3.949855824363647e-05, "loss": 0.2393, "loss_nan_ranks": 0, "loss_rank_avg": 0.115460604429245, "step": 610, "valid_targets_mean": 5414.8, "valid_targets_min": 835 }, { "epoch": 1.162724692526017, "grad_norm": 0.4836410961268961, "learning_rate": 3.94773611538697e-05, "loss": 0.238, "loss_nan_ranks": 0, "loss_rank_avg": 0.1263769567012787, "step": 615, "valid_targets_mean": 5787.6, "valid_targets_min": 1293 }, { "epoch": 1.1721854304635762, "grad_norm": 0.48420895744183057, "learning_rate": 3.945573119251489e-05, "loss": 0.2321, "loss_nan_ranks": 0, "loss_rank_avg": 0.12540149688720703, "step": 620, "valid_targets_mean": 5621.6, "valid_targets_min": 3937 }, { "epoch": 1.1816461684011352, "grad_norm": 0.5668323089533568, "learning_rate": 3.9433668840283756e-05, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.11952169239521027, "step": 625, "valid_targets_mean": 5713.2, "valid_targets_min": 182 }, { "epoch": 1.1911069063386943, "grad_norm": 0.5079376916359959, "learning_rate": 3.9411174587497636e-05, "loss": 0.2362, "loss_nan_ranks": 0, "loss_rank_avg": 0.10352667421102524, "step": 630, "valid_targets_mean": 5267.4, "valid_targets_min": 3874 }, { "epoch": 1.2005676442762536, "grad_norm": 0.44993465294635854, "learning_rate": 3.938824893407655e-05, "loss": 0.2375, "loss_nan_ranks": 0, "loss_rank_avg": 0.09414789080619812, "step": 635, "valid_targets_mean": 5855.6, "valid_targets_min": 3171 }, { "epoch": 1.2100283822138127, "grad_norm": 0.4266804320387502, "learning_rate": 3.9364892389528116e-05, "loss": 0.2248, "loss_nan_ranks": 0, "loss_rank_avg": 0.09374960511922836, "step": 640, "valid_targets_mean": 6662.6, "valid_targets_min": 4858 }, { "epoch": 1.2194891201513718, "grad_norm": 0.4894876148798196, "learning_rate": 3.9341105472936234e-05, "loss": 0.2279, "loss_nan_ranks": 0, "loss_rank_avg": 0.11348379403352737, "step": 645, "valid_targets_mean": 5026.5, "valid_targets_min": 2383 }, { "epoch": 1.2289498580889309, "grad_norm": 0.4861141591545541, "learning_rate": 3.9316888712949546e-05, "loss": 0.2323, "loss_nan_ranks": 0, "loss_rank_avg": 0.10222115367650986, "step": 650, "valid_targets_mean": 4663.4, "valid_targets_min": 501 }, { "epoch": 1.23841059602649, "grad_norm": 0.5580509660668194, "learning_rate": 3.9292242647769664e-05, "loss": 0.2276, "loss_nan_ranks": 0, "loss_rank_avg": 0.10276462882757187, "step": 655, "valid_targets_mean": 5688.8, "valid_targets_min": 2494 }, { "epoch": 1.2478713339640493, "grad_norm": 0.5600748404923863, "learning_rate": 3.926716782513924e-05, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.12437956780195236, "step": 660, "valid_targets_mean": 5957.5, "valid_targets_min": 1816 }, { "epoch": 1.2573320719016083, "grad_norm": 0.48680567022663485, "learning_rate": 3.924166480232977e-05, "loss": 0.2305, "loss_nan_ranks": 0, "loss_rank_avg": 0.10580234229564667, "step": 665, "valid_targets_mean": 4815.4, "valid_targets_min": 2054 }, { "epoch": 1.2667928098391674, "grad_norm": 0.5012312020890741, "learning_rate": 3.921573414612923e-05, "loss": 0.2365, "loss_nan_ranks": 0, "loss_rank_avg": 0.10871803760528564, "step": 670, "valid_targets_mean": 5644.4, "valid_targets_min": 3270 }, { "epoch": 1.2762535477767265, "grad_norm": 0.6526213288816137, "learning_rate": 3.918937643282946e-05, "loss": 0.2507, "loss_nan_ranks": 0, "loss_rank_avg": 0.13784456253051758, "step": 675, "valid_targets_mean": 4337.4, "valid_targets_min": 1461 }, { "epoch": 1.2857142857142856, "grad_norm": 0.45243111873658154, "learning_rate": 3.9162592248213364e-05, "loss": 0.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.09919239580631256, "step": 680, "valid_targets_mean": 5475.1, "valid_targets_min": 1303 }, { "epoch": 1.295175023651845, "grad_norm": 0.46993510603366306, "learning_rate": 3.913538218754189e-05, "loss": 0.2431, "loss_nan_ranks": 0, "loss_rank_avg": 0.11857247352600098, "step": 685, "valid_targets_mean": 5503.6, "valid_targets_min": 2736 }, { "epoch": 1.304635761589404, "grad_norm": 0.5288647977319975, "learning_rate": 3.9107746855540815e-05, "loss": 0.2259, "loss_nan_ranks": 0, "loss_rank_avg": 0.10459893196821213, "step": 690, "valid_targets_mean": 4416.6, "valid_targets_min": 1457 }, { "epoch": 1.314096499526963, "grad_norm": 0.47853397074365556, "learning_rate": 3.907968686638728e-05, "loss": 0.2262, "loss_nan_ranks": 0, "loss_rank_avg": 0.11762518435716629, "step": 695, "valid_targets_mean": 5999.4, "valid_targets_min": 1795 }, { "epoch": 1.3235572374645224, "grad_norm": 0.4653678345529489, "learning_rate": 3.9051202843696154e-05, "loss": 0.2288, "loss_nan_ranks": 0, "loss_rank_avg": 0.11448341608047485, "step": 700, "valid_targets_mean": 5763.0, "valid_targets_min": 1931 }, { "epoch": 1.3330179754020814, "grad_norm": 0.4855084018479891, "learning_rate": 3.902229542050617e-05, "loss": 0.2338, "loss_nan_ranks": 0, "loss_rank_avg": 0.11349400877952576, "step": 705, "valid_targets_mean": 4518.6, "valid_targets_min": 2050 }, { "epoch": 1.3424787133396405, "grad_norm": 0.5064849346903338, "learning_rate": 3.899296523926588e-05, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.12586739659309387, "step": 710, "valid_targets_mean": 5059.2, "valid_targets_min": 2228 }, { "epoch": 1.3519394512771996, "grad_norm": 0.5683940427049139, "learning_rate": 3.896321295181932e-05, "loss": 0.2389, "loss_nan_ranks": 0, "loss_rank_avg": 0.11889487504959106, "step": 715, "valid_targets_mean": 5142.8, "valid_targets_min": 2903 }, { "epoch": 1.3614001892147587, "grad_norm": 0.5067048884888564, "learning_rate": 3.8933039219391604e-05, "loss": 0.2316, "loss_nan_ranks": 0, "loss_rank_avg": 0.09034863114356995, "step": 720, "valid_targets_mean": 4853.4, "valid_targets_min": 1109 }, { "epoch": 1.370860927152318, "grad_norm": 0.5713266940700944, "learning_rate": 3.890244471257415e-05, "loss": 0.223, "loss_nan_ranks": 0, "loss_rank_avg": 0.10502117872238159, "step": 725, "valid_targets_mean": 6282.2, "valid_targets_min": 2621 }, { "epoch": 1.380321665089877, "grad_norm": 0.47167945802336014, "learning_rate": 3.8871430111309817e-05, "loss": 0.2246, "loss_nan_ranks": 0, "loss_rank_avg": 0.10523657500743866, "step": 730, "valid_targets_mean": 5265.6, "valid_targets_min": 1669 }, { "epoch": 1.3897824030274362, "grad_norm": 0.4972267194987453, "learning_rate": 3.883999610487782e-05, "loss": 0.2133, "loss_nan_ranks": 0, "loss_rank_avg": 0.11264175176620483, "step": 735, "valid_targets_mean": 5413.1, "valid_targets_min": 1752 }, { "epoch": 1.3992431409649952, "grad_norm": 0.4857236391537851, "learning_rate": 3.880814339187832e-05, "loss": 0.2522, "loss_nan_ranks": 0, "loss_rank_avg": 0.1228969469666481, "step": 740, "valid_targets_mean": 6460.1, "valid_targets_min": 2751 }, { "epoch": 1.4087038789025543, "grad_norm": 0.47731532767819274, "learning_rate": 3.877587268021701e-05, "loss": 0.2279, "loss_nan_ranks": 0, "loss_rank_avg": 0.1144258975982666, "step": 745, "valid_targets_mean": 6142.0, "valid_targets_min": 3992 }, { "epoch": 1.4181646168401136, "grad_norm": 0.45393688275595756, "learning_rate": 3.874318468708931e-05, "loss": 0.2323, "loss_nan_ranks": 0, "loss_rank_avg": 0.09872148185968399, "step": 750, "valid_targets_mean": 5503.8, "valid_targets_min": 2060 }, { "epoch": 1.4276253547776727, "grad_norm": 0.5303507483697673, "learning_rate": 3.871008013896444e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.10745839029550552, "step": 755, "valid_targets_mean": 5164.8, "valid_targets_min": 1538 }, { "epoch": 1.4370860927152318, "grad_norm": 0.461682203378725, "learning_rate": 3.8676559771569294e-05, "loss": 0.23, "loss_nan_ranks": 0, "loss_rank_avg": 0.11055511236190796, "step": 760, "valid_targets_mean": 6175.9, "valid_targets_min": 3847 }, { "epoch": 1.4465468306527909, "grad_norm": 0.4296391460871339, "learning_rate": 3.864262432987206e-05, "loss": 0.2337, "loss_nan_ranks": 0, "loss_rank_avg": 0.09028683602809906, "step": 765, "valid_targets_mean": 5604.2, "valid_targets_min": 3031 }, { "epoch": 1.45600756859035, "grad_norm": 0.4667109187535618, "learning_rate": 3.860827456806571e-05, "loss": 0.2406, "loss_nan_ranks": 0, "loss_rank_avg": 0.12354136258363724, "step": 770, "valid_targets_mean": 5927.1, "valid_targets_min": 3111 }, { "epoch": 1.4654683065279093, "grad_norm": 0.4716805812736505, "learning_rate": 3.857351124955118e-05, "loss": 0.2385, "loss_nan_ranks": 0, "loss_rank_avg": 0.10110399127006531, "step": 775, "valid_targets_mean": 5077.1, "valid_targets_min": 1075 }, { "epoch": 1.4749290444654684, "grad_norm": 0.4722294808263683, "learning_rate": 3.853833514692044e-05, "loss": 0.2391, "loss_nan_ranks": 0, "loss_rank_avg": 0.10581814497709274, "step": 780, "valid_targets_mean": 5985.8, "valid_targets_min": 1757 }, { "epoch": 1.4843897824030274, "grad_norm": 0.46649393641526554, "learning_rate": 3.850274704193932e-05, "loss": 0.229, "loss_nan_ranks": 0, "loss_rank_avg": 0.10153012722730637, "step": 785, "valid_targets_mean": 6183.6, "valid_targets_min": 2006 }, { "epoch": 1.4938505203405865, "grad_norm": 0.4773875252367172, "learning_rate": 3.846674772553014e-05, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.12223786860704422, "step": 790, "valid_targets_mean": 6154.8, "valid_targets_min": 5044 }, { "epoch": 1.5033112582781456, "grad_norm": 0.4748127013380771, "learning_rate": 3.843033799775411e-05, "loss": 0.2245, "loss_nan_ranks": 0, "loss_rank_avg": 0.093946173787117, "step": 795, "valid_targets_mean": 6119.9, "valid_targets_min": 3720 }, { "epoch": 1.512771996215705, "grad_norm": 0.467050356933497, "learning_rate": 3.839351866779358e-05, "loss": 0.2385, "loss_nan_ranks": 0, "loss_rank_avg": 0.10543806850910187, "step": 800, "valid_targets_mean": 6435.6, "valid_targets_min": 5034 }, { "epoch": 1.522232734153264, "grad_norm": 0.43867305636821574, "learning_rate": 3.835629055393401e-05, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.11679120361804962, "step": 805, "valid_targets_mean": 6308.0, "valid_targets_min": 3711 }, { "epoch": 1.531693472090823, "grad_norm": 0.48079409142806057, "learning_rate": 3.8318654483545865e-05, "loss": 0.2225, "loss_nan_ranks": 0, "loss_rank_avg": 0.12533718347549438, "step": 810, "valid_targets_mean": 6162.1, "valid_targets_min": 3455 }, { "epoch": 1.5411542100283824, "grad_norm": 0.41889792201675763, "learning_rate": 3.828061129306612e-05, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.10481228679418564, "step": 815, "valid_targets_mean": 6216.2, "valid_targets_min": 3346 }, { "epoch": 1.5506149479659412, "grad_norm": 0.4955138763469212, "learning_rate": 3.824216182797976e-05, "loss": 0.2332, "loss_nan_ranks": 0, "loss_rank_avg": 0.11373977363109589, "step": 820, "valid_targets_mean": 5359.9, "valid_targets_min": 2126 }, { "epoch": 1.5600756859035005, "grad_norm": 0.4872548119969948, "learning_rate": 3.8203306942800956e-05, "loss": 0.2274, "loss_nan_ranks": 0, "loss_rank_avg": 0.10969603061676025, "step": 825, "valid_targets_mean": 4700.9, "valid_targets_min": 1915 }, { "epoch": 1.5695364238410596, "grad_norm": 0.47970332008609884, "learning_rate": 3.8164047501054064e-05, "loss": 0.2256, "loss_nan_ranks": 0, "loss_rank_avg": 0.10819444060325623, "step": 830, "valid_targets_mean": 5609.9, "valid_targets_min": 3566 }, { "epoch": 1.5789971617786187, "grad_norm": 0.580079095541343, "learning_rate": 3.8124384375254454e-05, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.10750003904104233, "step": 835, "valid_targets_mean": 5338.2, "valid_targets_min": 571 }, { "epoch": 1.588457899716178, "grad_norm": 0.5673488057662988, "learning_rate": 3.808431844688911e-05, "loss": 0.2199, "loss_nan_ranks": 0, "loss_rank_avg": 0.11036446690559387, "step": 840, "valid_targets_mean": 5426.0, "valid_targets_min": 2462 }, { "epoch": 1.5979186376537369, "grad_norm": 0.42103950384674316, "learning_rate": 3.8043850606397026e-05, "loss": 0.2307, "loss_nan_ranks": 0, "loss_rank_avg": 0.09853754937648773, "step": 845, "valid_targets_mean": 6793.1, "valid_targets_min": 4564 }, { "epoch": 1.6073793755912962, "grad_norm": 0.4776716012442452, "learning_rate": 3.800298175314943e-05, "loss": 0.2288, "loss_nan_ranks": 0, "loss_rank_avg": 0.10229594260454178, "step": 850, "valid_targets_mean": 4796.5, "valid_targets_min": 869 }, { "epoch": 1.6168401135288553, "grad_norm": 0.4784444842339034, "learning_rate": 3.796171279542983e-05, "loss": 0.2184, "loss_nan_ranks": 0, "loss_rank_avg": 0.12016277015209198, "step": 855, "valid_targets_mean": 5666.8, "valid_targets_min": 4213 }, { "epoch": 1.6263008514664143, "grad_norm": 0.514714610117917, "learning_rate": 3.792004465041374e-05, "loss": 0.2262, "loss_nan_ranks": 0, "loss_rank_avg": 0.10403918474912643, "step": 860, "valid_targets_mean": 5254.9, "valid_targets_min": 3210 }, { "epoch": 1.6357615894039736, "grad_norm": 0.5112000027216482, "learning_rate": 3.787797824414839e-05, "loss": 0.2305, "loss_nan_ranks": 0, "loss_rank_avg": 0.10923796147108078, "step": 865, "valid_targets_mean": 4763.4, "valid_targets_min": 2980 }, { "epoch": 1.6452223273415325, "grad_norm": 0.4787828716925675, "learning_rate": 3.7835514511532106e-05, "loss": 0.22, "loss_nan_ranks": 0, "loss_rank_avg": 0.11811286211013794, "step": 870, "valid_targets_mean": 6723.4, "valid_targets_min": 2899 }, { "epoch": 1.6546830652790918, "grad_norm": 0.4851598879974133, "learning_rate": 3.779265439629349e-05, "loss": 0.2224, "loss_nan_ranks": 0, "loss_rank_avg": 0.12126254290342331, "step": 875, "valid_targets_mean": 5780.9, "valid_targets_min": 4520 }, { "epoch": 1.664143803216651, "grad_norm": 0.4742437333915908, "learning_rate": 3.774939885097054e-05, "loss": 0.2419, "loss_nan_ranks": 0, "loss_rank_avg": 0.11021271347999573, "step": 880, "valid_targets_mean": 4854.0, "valid_targets_min": 2821 }, { "epoch": 1.67360454115421, "grad_norm": 0.4960836751821523, "learning_rate": 3.7705748836889394e-05, "loss": 0.2342, "loss_nan_ranks": 0, "loss_rank_avg": 0.13386490941047668, "step": 885, "valid_targets_mean": 6546.0, "valid_targets_min": 1321 }, { "epoch": 1.6830652790917693, "grad_norm": 0.4036549231565226, "learning_rate": 3.7661705324143015e-05, "loss": 0.2093, "loss_nan_ranks": 0, "loss_rank_avg": 0.08332087099552155, "step": 890, "valid_targets_mean": 6718.4, "valid_targets_min": 2034 }, { "epoch": 1.6925260170293281, "grad_norm": 0.49131023862826795, "learning_rate": 3.761726929156961e-05, "loss": 0.2264, "loss_nan_ranks": 0, "loss_rank_avg": 0.11716383695602417, "step": 895, "valid_targets_mean": 6500.2, "valid_targets_min": 3450 }, { "epoch": 1.7019867549668874, "grad_norm": 0.45414353126458956, "learning_rate": 3.757244172673089e-05, "loss": 0.2248, "loss_nan_ranks": 0, "loss_rank_avg": 0.11022776365280151, "step": 900, "valid_targets_mean": 6545.5, "valid_targets_min": 5104 }, { "epoch": 1.7114474929044465, "grad_norm": 0.4665861040208616, "learning_rate": 3.75272236258901e-05, "loss": 0.2205, "loss_nan_ranks": 0, "loss_rank_avg": 0.10109938681125641, "step": 905, "valid_targets_mean": 5423.8, "valid_targets_min": 2046 }, { "epoch": 1.7209082308420056, "grad_norm": 0.5390908507043201, "learning_rate": 3.74816159939899e-05, "loss": 0.2157, "loss_nan_ranks": 0, "loss_rank_avg": 0.11916151642799377, "step": 910, "valid_targets_mean": 5598.9, "valid_targets_min": 3342 }, { "epoch": 1.730368968779565, "grad_norm": 0.4802137890384671, "learning_rate": 3.743561984463002e-05, "loss": 0.2465, "loss_nan_ranks": 0, "loss_rank_avg": 0.20065706968307495, "step": 915, "valid_targets_mean": 4943.9, "valid_targets_min": 1064 }, { "epoch": 1.7398297067171238, "grad_norm": 0.4905362325837713, "learning_rate": 3.738923620004475e-05, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.107704758644104, "step": 920, "valid_targets_mean": 5806.9, "valid_targets_min": 4816 }, { "epoch": 1.749290444654683, "grad_norm": 0.4581079118093888, "learning_rate": 3.734246609108018e-05, "loss": 0.2262, "loss_nan_ranks": 0, "loss_rank_avg": 0.09412605315446854, "step": 925, "valid_targets_mean": 4781.8, "valid_targets_min": 449 }, { "epoch": 1.7587511825922422, "grad_norm": 0.45771521539019777, "learning_rate": 3.729531055717135e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.08951415121555328, "step": 930, "valid_targets_mean": 5657.9, "valid_targets_min": 4066 }, { "epoch": 1.7682119205298013, "grad_norm": 0.4219395696573571, "learning_rate": 3.724777064631909e-05, "loss": 0.2196, "loss_nan_ranks": 0, "loss_rank_avg": 0.10585498809814453, "step": 935, "valid_targets_mean": 6137.9, "valid_targets_min": 1896 }, { "epoch": 1.7776726584673606, "grad_norm": 0.4750153042604821, "learning_rate": 3.719984741506676e-05, "loss": 0.2285, "loss_nan_ranks": 0, "loss_rank_avg": 0.1056283712387085, "step": 940, "valid_targets_mean": 6157.4, "valid_targets_min": 4827 }, { "epoch": 1.7871333964049196, "grad_norm": 0.5007065871315426, "learning_rate": 3.7151541928476775e-05, "loss": 0.2253, "loss_nan_ranks": 0, "loss_rank_avg": 0.11300000548362732, "step": 945, "valid_targets_mean": 6049.8, "valid_targets_min": 1787 }, { "epoch": 1.7965941343424787, "grad_norm": 0.4556642995476161, "learning_rate": 3.710285526010693e-05, "loss": 0.2235, "loss_nan_ranks": 0, "loss_rank_avg": 0.10112877935171127, "step": 950, "valid_targets_mean": 5844.6, "valid_targets_min": 1902 }, { "epoch": 1.8060548722800378, "grad_norm": 0.4695420382110502, "learning_rate": 3.705378849198651e-05, "loss": 0.2233, "loss_nan_ranks": 0, "loss_rank_avg": 0.09273075312376022, "step": 955, "valid_targets_mean": 5799.4, "valid_targets_min": 3405 }, { "epoch": 1.8155156102175969, "grad_norm": 0.4582464273228831, "learning_rate": 3.700434271459229e-05, "loss": 0.2233, "loss_nan_ranks": 0, "loss_rank_avg": 0.11421730369329453, "step": 960, "valid_targets_mean": 6082.0, "valid_targets_min": 2838 }, { "epoch": 1.8249763481551562, "grad_norm": 0.45724998496227603, "learning_rate": 3.6954519026824265e-05, "loss": 0.2307, "loss_nan_ranks": 0, "loss_rank_avg": 0.11946368962526321, "step": 965, "valid_targets_mean": 6126.4, "valid_targets_min": 3686 }, { "epoch": 1.8344370860927153, "grad_norm": 0.42553397621822625, "learning_rate": 3.6904318535981254e-05, "loss": 0.2112, "loss_nan_ranks": 0, "loss_rank_avg": 0.09127740561962128, "step": 970, "valid_targets_mean": 6550.4, "valid_targets_min": 4443 }, { "epoch": 1.8438978240302744, "grad_norm": 0.5055145067804998, "learning_rate": 3.6853742357736265e-05, "loss": 0.2236, "loss_nan_ranks": 0, "loss_rank_avg": 0.13003841042518616, "step": 975, "valid_targets_mean": 6482.6, "valid_targets_min": 3467 }, { "epoch": 1.8533585619678334, "grad_norm": 0.46511645025886095, "learning_rate": 3.6802791616111716e-05, "loss": 0.222, "loss_nan_ranks": 0, "loss_rank_avg": 0.1227150559425354, "step": 980, "valid_targets_mean": 6854.8, "valid_targets_min": 3556 }, { "epoch": 1.8628192999053925, "grad_norm": 0.5656028012040354, "learning_rate": 3.6751467443454455e-05, "loss": 0.2172, "loss_nan_ranks": 0, "loss_rank_avg": 0.10680273920297623, "step": 985, "valid_targets_mean": 5882.6, "valid_targets_min": 3572 }, { "epoch": 1.8722800378429518, "grad_norm": 0.6508509853322608, "learning_rate": 3.6699770980410586e-05, "loss": 0.2344, "loss_nan_ranks": 0, "loss_rank_avg": 0.1327436864376068, "step": 990, "valid_targets_mean": 5812.0, "valid_targets_min": 2484 }, { "epoch": 1.881740775780511, "grad_norm": 0.5305852714830951, "learning_rate": 3.664770337590011e-05, "loss": 0.2163, "loss_nan_ranks": 0, "loss_rank_avg": 0.0990646705031395, "step": 995, "valid_targets_mean": 5233.1, "valid_targets_min": 1906 }, { "epoch": 1.89120151371807, "grad_norm": 0.5306949827252334, "learning_rate": 3.659526578709144e-05, "loss": 0.2245, "loss_nan_ranks": 0, "loss_rank_avg": 0.13009144365787506, "step": 1000, "valid_targets_mean": 4655.4, "valid_targets_min": 2019 }, { "epoch": 1.9006622516556293, "grad_norm": 0.46674719483256766, "learning_rate": 3.654245937937561e-05, "loss": 0.2197, "loss_nan_ranks": 0, "loss_rank_avg": 0.11824624240398407, "step": 1005, "valid_targets_mean": 6255.9, "valid_targets_min": 3204 }, { "epoch": 1.9101229895931882, "grad_norm": 0.47173335317739623, "learning_rate": 3.6489285326340424e-05, "loss": 0.222, "loss_nan_ranks": 0, "loss_rank_avg": 0.1149347722530365, "step": 1010, "valid_targets_mean": 5612.1, "valid_targets_min": 3308 }, { "epoch": 1.9195837275307475, "grad_norm": 0.416058820987745, "learning_rate": 3.6435744809744376e-05, "loss": 0.2358, "loss_nan_ranks": 0, "loss_rank_avg": 0.10606338828802109, "step": 1015, "valid_targets_mean": 6607.4, "valid_targets_min": 1916 }, { "epoch": 1.9290444654683065, "grad_norm": 0.4694345655227754, "learning_rate": 3.638183901949036e-05, "loss": 0.22, "loss_nan_ranks": 0, "loss_rank_avg": 0.1187274232506752, "step": 1020, "valid_targets_mean": 5897.4, "valid_targets_min": 3745 }, { "epoch": 1.9385052034058656, "grad_norm": 0.47018658031073185, "learning_rate": 3.6327569153599236e-05, "loss": 0.2334, "loss_nan_ranks": 0, "loss_rank_avg": 0.12189055234193802, "step": 1025, "valid_targets_mean": 5487.2, "valid_targets_min": 1457 }, { "epoch": 1.947965941343425, "grad_norm": 0.5101801225439047, "learning_rate": 3.62729364181832e-05, "loss": 0.2116, "loss_nan_ranks": 0, "loss_rank_avg": 0.09667861461639404, "step": 1030, "valid_targets_mean": 4755.6, "valid_targets_min": 1412 }, { "epoch": 1.9574266792809838, "grad_norm": 0.45299632084357455, "learning_rate": 3.6217942027419025e-05, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.12895835936069489, "step": 1035, "valid_targets_mean": 7236.1, "valid_targets_min": 4546 }, { "epoch": 1.966887417218543, "grad_norm": 0.6043045119332607, "learning_rate": 3.616258720352097e-05, "loss": 0.2233, "loss_nan_ranks": 0, "loss_rank_avg": 0.12101536989212036, "step": 1040, "valid_targets_mean": 6235.6, "valid_targets_min": 4103 }, { "epoch": 1.9763481551561022, "grad_norm": 0.4657858161318268, "learning_rate": 3.6106873176713764e-05, "loss": 0.2199, "loss_nan_ranks": 0, "loss_rank_avg": 0.1308978646993637, "step": 1045, "valid_targets_mean": 6750.4, "valid_targets_min": 4365 }, { "epoch": 1.9858088930936613, "grad_norm": 0.4339354389433891, "learning_rate": 3.60508011852051e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.08882288634777069, "step": 1050, "valid_targets_mean": 4971.6, "valid_targets_min": 1957 }, { "epoch": 1.9952696310312206, "grad_norm": 0.4452210444563202, "learning_rate": 3.5994372475158276e-05, "loss": 0.2179, "loss_nan_ranks": 0, "loss_rank_avg": 0.09936431050300598, "step": 1055, "valid_targets_mean": 6430.6, "valid_targets_min": 5264 }, { "epoch": 2.0037842951750235, "grad_norm": 0.4902441128877412, "learning_rate": 3.593758830066438e-05, "loss": 0.2372, "loss_nan_ranks": 0, "loss_rank_avg": 0.12074028700590134, "step": 1060, "valid_targets_mean": 5225.4, "valid_targets_min": 2454 }, { "epoch": 2.013245033112583, "grad_norm": 0.5026112447798428, "learning_rate": 3.5880449923714484e-05, "loss": 0.2168, "loss_nan_ranks": 0, "loss_rank_avg": 0.10387119650840759, "step": 1065, "valid_targets_mean": 5289.6, "valid_targets_min": 2424 }, { "epoch": 2.0227057710501417, "grad_norm": 0.4750712293258598, "learning_rate": 3.582295861417158e-05, "loss": 0.2055, "loss_nan_ranks": 0, "loss_rank_avg": 0.08582209795713425, "step": 1070, "valid_targets_mean": 6166.4, "valid_targets_min": 3853 }, { "epoch": 2.032166508987701, "grad_norm": 0.5282966500285186, "learning_rate": 3.576511564974233e-05, "loss": 0.2082, "loss_nan_ranks": 0, "loss_rank_avg": 0.09549730271100998, "step": 1075, "valid_targets_mean": 5699.4, "valid_targets_min": 3149 }, { "epoch": 2.0416272469252603, "grad_norm": 0.4390532347283631, "learning_rate": 3.5706922315948726e-05, "loss": 0.207, "loss_nan_ranks": 0, "loss_rank_avg": 0.09387944638729095, "step": 1080, "valid_targets_mean": 6100.9, "valid_targets_min": 1599 }, { "epoch": 2.051087984862819, "grad_norm": 0.46546608867761813, "learning_rate": 3.5648379906099474e-05, "loss": 0.2087, "loss_nan_ranks": 0, "loss_rank_avg": 0.11074842512607574, "step": 1085, "valid_targets_mean": 5845.8, "valid_targets_min": 4153 }, { "epoch": 2.0605487228003785, "grad_norm": 0.81977637281519, "learning_rate": 3.558948972126127e-05, "loss": 0.2097, "loss_nan_ranks": 0, "loss_rank_avg": 0.10561281442642212, "step": 1090, "valid_targets_mean": 7041.9, "valid_targets_min": 4457 }, { "epoch": 2.0700094607379373, "grad_norm": 0.4202717416437528, "learning_rate": 3.5530253070229886e-05, "loss": 0.193, "loss_nan_ranks": 0, "loss_rank_avg": 0.10468418896198273, "step": 1095, "valid_targets_mean": 7051.8, "valid_targets_min": 5570 }, { "epoch": 2.0794701986754967, "grad_norm": 0.4337227095105579, "learning_rate": 3.547067126950106e-05, "loss": 0.194, "loss_nan_ranks": 0, "loss_rank_avg": 0.1010643020272255, "step": 1100, "valid_targets_mean": 6779.9, "valid_targets_min": 4810 }, { "epoch": 2.088930936613056, "grad_norm": 0.4925480521020738, "learning_rate": 3.541074564324129e-05, "loss": 0.203, "loss_nan_ranks": 0, "loss_rank_avg": 0.12354034930467606, "step": 1105, "valid_targets_mean": 6516.4, "valid_targets_min": 2833 }, { "epoch": 2.098391674550615, "grad_norm": 0.42636976344945043, "learning_rate": 3.5350477523258334e-05, "loss": 0.2014, "loss_nan_ranks": 0, "loss_rank_avg": 0.10801876336336136, "step": 1110, "valid_targets_mean": 6759.4, "valid_targets_min": 2643 }, { "epoch": 2.107852412488174, "grad_norm": 0.42517617143639164, "learning_rate": 3.528986824897167e-05, "loss": 0.2049, "loss_nan_ranks": 0, "loss_rank_avg": 0.08121705800294876, "step": 1115, "valid_targets_mean": 5760.4, "valid_targets_min": 2593 }, { "epoch": 2.1173131504257334, "grad_norm": 0.5312337215642596, "learning_rate": 3.522891916738269e-05, "loss": 0.2087, "loss_nan_ranks": 0, "loss_rank_avg": 0.08871275186538696, "step": 1120, "valid_targets_mean": 4302.4, "valid_targets_min": 1285 }, { "epoch": 2.1267738883632923, "grad_norm": 0.4692448326166772, "learning_rate": 3.516763163304481e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.10534701496362686, "step": 1125, "valid_targets_mean": 5519.6, "valid_targets_min": 2362 }, { "epoch": 2.1362346263008516, "grad_norm": 0.4268146337366665, "learning_rate": 3.5106007008033306e-05, "loss": 0.2108, "loss_nan_ranks": 0, "loss_rank_avg": 0.11514265835285187, "step": 1130, "valid_targets_mean": 7479.1, "valid_targets_min": 1440 }, { "epoch": 2.1456953642384105, "grad_norm": 0.49100296123591713, "learning_rate": 3.50440466619151e-05, "loss": 0.214, "loss_nan_ranks": 0, "loss_rank_avg": 0.08796236664056778, "step": 1135, "valid_targets_mean": 5922.1, "valid_targets_min": 3934 }, { "epoch": 2.1551561021759698, "grad_norm": 0.5216092308914664, "learning_rate": 3.498175197171827e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.10339146107435226, "step": 1140, "valid_targets_mean": 5577.0, "valid_targets_min": 1475 }, { "epoch": 2.164616840113529, "grad_norm": 0.42621845398225777, "learning_rate": 3.491912432190147e-05, "loss": 0.2057, "loss_nan_ranks": 0, "loss_rank_avg": 0.10287053883075714, "step": 1145, "valid_targets_mean": 6644.6, "valid_targets_min": 4517 }, { "epoch": 2.174077578051088, "grad_norm": 0.49466569394221804, "learning_rate": 3.485616510432321e-05, "loss": 0.2046, "loss_nan_ranks": 0, "loss_rank_avg": 0.12411276996135712, "step": 1150, "valid_targets_mean": 5787.5, "valid_targets_min": 4705 }, { "epoch": 2.1835383159886472, "grad_norm": 0.4788842052660544, "learning_rate": 3.479287571821082e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.09818103909492493, "step": 1155, "valid_targets_mean": 5502.1, "valid_targets_min": 2850 }, { "epoch": 2.192999053926206, "grad_norm": 0.4760444243683465, "learning_rate": 3.4729257570129436e-05, "loss": 0.2026, "loss_nan_ranks": 0, "loss_rank_avg": 0.10555780678987503, "step": 1160, "valid_targets_mean": 5504.0, "valid_targets_min": 2222 }, { "epoch": 2.2024597918637654, "grad_norm": 0.5175946771783035, "learning_rate": 3.466531207395072e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.11507289856672287, "step": 1165, "valid_targets_mean": 4728.1, "valid_targets_min": 1177 }, { "epoch": 2.2119205298013247, "grad_norm": 0.5117776327063412, "learning_rate": 3.46010406508214e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.11044911295175552, "step": 1170, "valid_targets_mean": 4711.1, "valid_targets_min": 2573 }, { "epoch": 2.2213812677388836, "grad_norm": 0.5590952933682073, "learning_rate": 3.453644472913176e-05, "loss": 0.2087, "loss_nan_ranks": 0, "loss_rank_avg": 0.10522548109292984, "step": 1175, "valid_targets_mean": 4766.1, "valid_targets_min": 1915 }, { "epoch": 2.230842005676443, "grad_norm": 0.5025362223001963, "learning_rate": 3.4471525744483826e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.10610745847225189, "step": 1180, "valid_targets_mean": 6096.0, "valid_targets_min": 4585 }, { "epoch": 2.2403027436140017, "grad_norm": 0.4645208598899087, "learning_rate": 3.440628513965947e-05, "loss": 0.1906, "loss_nan_ranks": 0, "loss_rank_avg": 0.08891929686069489, "step": 1185, "valid_targets_mean": 4895.5, "valid_targets_min": 1524 }, { "epoch": 2.249763481551561, "grad_norm": 0.6318891734380099, "learning_rate": 3.4340724364588405e-05, "loss": 0.197, "loss_nan_ranks": 0, "loss_rank_avg": 0.08534630388021469, "step": 1190, "valid_targets_mean": 4529.2, "valid_targets_min": 1166 }, { "epoch": 2.2592242194891203, "grad_norm": 0.44200205332456727, "learning_rate": 3.4274844876315885e-05, "loss": 0.2075, "loss_nan_ranks": 0, "loss_rank_avg": 0.09655225276947021, "step": 1195, "valid_targets_mean": 6800.4, "valid_targets_min": 3424 }, { "epoch": 2.268684957426679, "grad_norm": 0.4615805475383118, "learning_rate": 3.4208648138970366e-05, "loss": 0.2098, "loss_nan_ranks": 0, "loss_rank_avg": 0.09694427251815796, "step": 1200, "valid_targets_mean": 5259.1, "valid_targets_min": 3358 }, { "epoch": 2.2781456953642385, "grad_norm": 0.4050381330325965, "learning_rate": 3.4142135623730954e-05, "loss": 0.215, "loss_nan_ranks": 0, "loss_rank_avg": 0.10238818824291229, "step": 1205, "valid_targets_mean": 7746.4, "valid_targets_min": 3172 }, { "epoch": 2.2876064333017974, "grad_norm": 0.47392587771674227, "learning_rate": 3.407530880879472e-05, "loss": 0.2024, "loss_nan_ranks": 0, "loss_rank_avg": 0.09218434244394302, "step": 1210, "valid_targets_mean": 4792.6, "valid_targets_min": 1795 }, { "epoch": 2.2970671712393567, "grad_norm": 0.5019723788934695, "learning_rate": 3.400816917934383e-05, "loss": 0.1957, "loss_nan_ranks": 0, "loss_rank_avg": 0.11557125300168991, "step": 1215, "valid_targets_mean": 6118.2, "valid_targets_min": 2081 }, { "epoch": 2.306527909176916, "grad_norm": 0.4341351471127814, "learning_rate": 3.394071822751255e-05, "loss": 0.2154, "loss_nan_ranks": 0, "loss_rank_avg": 0.11432911455631256, "step": 1220, "valid_targets_mean": 7413.2, "valid_targets_min": 5062 }, { "epoch": 2.315988647114475, "grad_norm": 0.48447458616548483, "learning_rate": 3.3872957452354085e-05, "loss": 0.1974, "loss_nan_ranks": 0, "loss_rank_avg": 0.10207293927669525, "step": 1225, "valid_targets_mean": 5568.5, "valid_targets_min": 2966 }, { "epoch": 2.325449385052034, "grad_norm": 0.49502495306040073, "learning_rate": 3.380488835980726e-05, "loss": 0.2041, "loss_nan_ranks": 0, "loss_rank_avg": 0.1068793311715126, "step": 1230, "valid_targets_mean": 5244.4, "valid_targets_min": 3183 }, { "epoch": 2.334910122989593, "grad_norm": 0.472235805272251, "learning_rate": 3.373651246266306e-05, "loss": 0.2023, "loss_nan_ranks": 0, "loss_rank_avg": 0.10191547870635986, "step": 1235, "valid_targets_mean": 6612.2, "valid_targets_min": 4516 }, { "epoch": 2.3443708609271523, "grad_norm": 0.4651068349442188, "learning_rate": 3.366783128053097e-05, "loss": 0.1952, "loss_nan_ranks": 0, "loss_rank_avg": 0.08761796355247498, "step": 1240, "valid_targets_mean": 4062.6, "valid_targets_min": 1091 }, { "epoch": 2.3538315988647116, "grad_norm": 0.44567297458048116, "learning_rate": 3.359884633980528e-05, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.08401072025299072, "step": 1245, "valid_targets_mean": 5205.4, "valid_targets_min": 1799 }, { "epoch": 2.3632923368022705, "grad_norm": 0.5648360804071922, "learning_rate": 3.352955917363108e-05, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.12823820114135742, "step": 1250, "valid_targets_mean": 5323.9, "valid_targets_min": 2926 }, { "epoch": 2.3727530747398298, "grad_norm": 0.39813339146433463, "learning_rate": 3.345997132187022e-05, "loss": 0.1942, "loss_nan_ranks": 0, "loss_rank_avg": 0.09695559740066528, "step": 1255, "valid_targets_mean": 7675.4, "valid_targets_min": 2773 }, { "epoch": 2.3822138126773886, "grad_norm": 0.4375240114279496, "learning_rate": 3.339008433106713e-05, "loss": 0.1924, "loss_nan_ranks": 0, "loss_rank_avg": 0.08221010863780975, "step": 1260, "valid_targets_mean": 6793.2, "valid_targets_min": 3433 }, { "epoch": 2.391674550614948, "grad_norm": 0.46728845602150615, "learning_rate": 3.331989975441437e-05, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.1225174069404602, "step": 1265, "valid_targets_mean": 6902.6, "valid_targets_min": 4716 }, { "epoch": 2.4011352885525072, "grad_norm": 0.4907015096558724, "learning_rate": 3.324941915171817e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.1086108461022377, "step": 1270, "valid_targets_mean": 5772.2, "valid_targets_min": 4619 }, { "epoch": 2.410596026490066, "grad_norm": 0.5288905896743813, "learning_rate": 3.3178644089363726e-05, "loss": 0.2047, "loss_nan_ranks": 0, "loss_rank_avg": 0.0829245075583458, "step": 1275, "valid_targets_mean": 4927.6, "valid_targets_min": 1720 }, { "epoch": 2.4200567644276254, "grad_norm": 0.4616750373070165, "learning_rate": 3.310757614028043e-05, "loss": 0.2008, "loss_nan_ranks": 0, "loss_rank_avg": 0.10950164496898651, "step": 1280, "valid_targets_mean": 5469.9, "valid_targets_min": 2366 }, { "epoch": 2.4295175023651847, "grad_norm": 0.48785513225115845, "learning_rate": 3.303621688390688e-05, "loss": 0.2016, "loss_nan_ranks": 0, "loss_rank_avg": 0.10254321247339249, "step": 1285, "valid_targets_mean": 4784.5, "valid_targets_min": 1528 }, { "epoch": 2.4389782403027436, "grad_norm": 0.47006830003545064, "learning_rate": 3.2964567906155775e-05, "loss": 0.2105, "loss_nan_ranks": 0, "loss_rank_avg": 0.10443936288356781, "step": 1290, "valid_targets_mean": 5922.1, "valid_targets_min": 4665 }, { "epoch": 2.448438978240303, "grad_norm": 0.5303981405733078, "learning_rate": 3.28926307993787e-05, "loss": 0.2089, "loss_nan_ranks": 0, "loss_rank_avg": 0.10440479218959808, "step": 1295, "valid_targets_mean": 4983.1, "valid_targets_min": 1544 }, { "epoch": 2.4578997161778617, "grad_norm": 0.41697399320560447, "learning_rate": 3.282040716233073e-05, "loss": 0.1965, "loss_nan_ranks": 0, "loss_rank_avg": 0.11425549536943436, "step": 1300, "valid_targets_mean": 7874.9, "valid_targets_min": 3015 }, { "epoch": 2.467360454115421, "grad_norm": 0.4637165828897811, "learning_rate": 3.274789860013484e-05, "loss": 0.2033, "loss_nan_ranks": 0, "loss_rank_avg": 0.10167668759822845, "step": 1305, "valid_targets_mean": 5048.4, "valid_targets_min": 4028 }, { "epoch": 2.47682119205298, "grad_norm": 0.45904308662548016, "learning_rate": 3.267510672424633e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.10144510865211487, "step": 1310, "valid_targets_mean": 5632.4, "valid_targets_min": 1561 }, { "epoch": 2.486281929990539, "grad_norm": 0.5117482006460289, "learning_rate": 3.260203315241693e-05, "loss": 0.2167, "loss_nan_ranks": 0, "loss_rank_avg": 0.11750157177448273, "step": 1315, "valid_targets_mean": 5832.9, "valid_targets_min": 2221 }, { "epoch": 2.4957426679280985, "grad_norm": 0.4821146207280302, "learning_rate": 3.25286795086589e-05, "loss": 0.1974, "loss_nan_ranks": 0, "loss_rank_avg": 0.10111722350120544, "step": 1320, "valid_targets_mean": 6177.2, "valid_targets_min": 4508 }, { "epoch": 2.5052034058656574, "grad_norm": 0.4703343391187789, "learning_rate": 3.245504742320889e-05, "loss": 0.2076, "loss_nan_ranks": 0, "loss_rank_avg": 0.111258864402771, "step": 1325, "valid_targets_mean": 6082.4, "valid_targets_min": 1854 }, { "epoch": 2.5146641438032167, "grad_norm": 0.4096048017619596, "learning_rate": 3.238113853249176e-05, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.09202168136835098, "step": 1330, "valid_targets_mean": 6705.9, "valid_targets_min": 5581 }, { "epoch": 2.524124881740776, "grad_norm": 0.4794504102641663, "learning_rate": 3.230695447908416e-05, "loss": 0.2132, "loss_nan_ranks": 0, "loss_rank_avg": 0.12047106772661209, "step": 1335, "valid_targets_mean": 6179.9, "valid_targets_min": 1678 }, { "epoch": 2.533585619678335, "grad_norm": 0.42853949355775744, "learning_rate": 3.223249691167808e-05, "loss": 0.2056, "loss_nan_ranks": 0, "loss_rank_avg": 0.09987708181142807, "step": 1340, "valid_targets_mean": 6150.5, "valid_targets_min": 2052 }, { "epoch": 2.543046357615894, "grad_norm": 0.45038054848136166, "learning_rate": 3.215776748504415e-05, "loss": 0.1952, "loss_nan_ranks": 0, "loss_rank_avg": 0.09696616977453232, "step": 1345, "valid_targets_mean": 5926.5, "valid_targets_min": 4793 }, { "epoch": 2.552507095553453, "grad_norm": 0.46275515871952516, "learning_rate": 3.208276785999491e-05, "loss": 0.1982, "loss_nan_ranks": 0, "loss_rank_avg": 0.09807568788528442, "step": 1350, "valid_targets_mean": 5176.4, "valid_targets_min": 3229 }, { "epoch": 2.5619678334910123, "grad_norm": 0.5405973660041345, "learning_rate": 3.200749970334788e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.11471271514892578, "step": 1355, "valid_targets_mean": 6159.6, "valid_targets_min": 2018 }, { "epoch": 2.571428571428571, "grad_norm": 0.6206982063058315, "learning_rate": 3.193196468788852e-05, "loss": 0.212, "loss_nan_ranks": 0, "loss_rank_avg": 0.11576743423938751, "step": 1360, "valid_targets_mean": 4677.5, "valid_targets_min": 1588 }, { "epoch": 2.5808893093661305, "grad_norm": 0.4509216554262047, "learning_rate": 3.1856164492333045e-05, "loss": 0.1953, "loss_nan_ranks": 0, "loss_rank_avg": 0.09978030622005463, "step": 1365, "valid_targets_mean": 6171.2, "valid_targets_min": 4374 }, { "epoch": 2.59035004730369, "grad_norm": 0.5022130091375908, "learning_rate": 3.178010080129114e-05, "loss": 0.2109, "loss_nan_ranks": 0, "loss_rank_avg": 0.11894027888774872, "step": 1370, "valid_targets_mean": 4665.2, "valid_targets_min": 2530 }, { "epoch": 2.5998107852412486, "grad_norm": 0.49048450775706764, "learning_rate": 3.1703775305228476e-05, "loss": 0.213, "loss_nan_ranks": 0, "loss_rank_avg": 0.12461340427398682, "step": 1375, "valid_targets_mean": 5434.1, "valid_targets_min": 2890 }, { "epoch": 2.609271523178808, "grad_norm": 0.4352184740333695, "learning_rate": 3.16271897004292e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.0782010406255722, "step": 1380, "valid_targets_mean": 5664.6, "valid_targets_min": 3486 }, { "epoch": 2.6187322611163673, "grad_norm": 0.548234031499346, "learning_rate": 3.1550345688958186e-05, "loss": 0.2031, "loss_nan_ranks": 0, "loss_rank_avg": 0.12204037606716156, "step": 1385, "valid_targets_mean": 4753.4, "valid_targets_min": 2308 }, { "epoch": 2.628192999053926, "grad_norm": 0.4695384861258868, "learning_rate": 3.147324497862323e-05, "loss": 0.2069, "loss_nan_ranks": 0, "loss_rank_avg": 0.09967264533042908, "step": 1390, "valid_targets_mean": 5173.1, "valid_targets_min": 2358 }, { "epoch": 2.6376537369914854, "grad_norm": 0.4704020408844116, "learning_rate": 3.139588928293711e-05, "loss": 0.2016, "loss_nan_ranks": 0, "loss_rank_avg": 0.12265658378601074, "step": 1395, "valid_targets_mean": 6174.9, "valid_targets_min": 2043 }, { "epoch": 2.6471144749290447, "grad_norm": 0.5094346857161342, "learning_rate": 3.131828032107945e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.08958130329847336, "step": 1400, "valid_targets_mean": 4513.2, "valid_targets_min": 2441 }, { "epoch": 2.6565752128666036, "grad_norm": 0.4335492269233461, "learning_rate": 3.124041981785859e-05, "loss": 0.2038, "loss_nan_ranks": 0, "loss_rank_avg": 0.10349221527576447, "step": 1405, "valid_targets_mean": 6694.0, "valid_targets_min": 4944 }, { "epoch": 2.666035950804163, "grad_norm": 0.48204121851722115, "learning_rate": 3.1162309503673176e-05, "loss": 0.213, "loss_nan_ranks": 0, "loss_rank_avg": 0.1139221042394638, "step": 1410, "valid_targets_mean": 6066.9, "valid_targets_min": 3755 }, { "epoch": 2.6754966887417218, "grad_norm": 0.5313576753857829, "learning_rate": 3.108395111447376e-05, "loss": 0.1993, "loss_nan_ranks": 0, "loss_rank_avg": 0.10339981317520142, "step": 1415, "valid_targets_mean": 5164.8, "valid_targets_min": 3608 }, { "epoch": 2.684957426679281, "grad_norm": 0.4992222498448238, "learning_rate": 3.1005346391724195e-05, "loss": 0.2098, "loss_nan_ranks": 0, "loss_rank_avg": 0.11738509684801102, "step": 1420, "valid_targets_mean": 5114.2, "valid_targets_min": 1631 }, { "epoch": 2.69441816461684, "grad_norm": 0.46001559873179254, "learning_rate": 3.092649708236293e-05, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.0868842750787735, "step": 1425, "valid_targets_mean": 5085.1, "valid_targets_min": 3443 }, { "epoch": 2.703878902554399, "grad_norm": 0.4496410745031232, "learning_rate": 3.08474049387642e-05, "loss": 0.1993, "loss_nan_ranks": 0, "loss_rank_avg": 0.07558328658342361, "step": 1430, "valid_targets_mean": 5919.5, "valid_targets_min": 2787 }, { "epoch": 2.7133396404919585, "grad_norm": 0.42890955889144455, "learning_rate": 3.076807171869907e-05, "loss": 0.2074, "loss_nan_ranks": 0, "loss_rank_avg": 0.09730438888072968, "step": 1435, "valid_targets_mean": 6386.8, "valid_targets_min": 4754 }, { "epoch": 2.7228003784295174, "grad_norm": 0.5252335037883175, "learning_rate": 3.068849918529635e-05, "loss": 0.1999, "loss_nan_ranks": 0, "loss_rank_avg": 0.11477208137512207, "step": 1440, "valid_targets_mean": 6028.5, "valid_targets_min": 2391 }, { "epoch": 2.7322611163670767, "grad_norm": 0.4705003773792761, "learning_rate": 3.060868910700348e-05, "loss": 0.2136, "loss_nan_ranks": 0, "loss_rank_avg": 0.1162232756614685, "step": 1445, "valid_targets_mean": 5627.2, "valid_targets_min": 2560 }, { "epoch": 2.741721854304636, "grad_norm": 0.4885389985755956, "learning_rate": 3.052864325754712e-05, "loss": 0.209, "loss_nan_ranks": 0, "loss_rank_avg": 0.10556751489639282, "step": 1450, "valid_targets_mean": 5362.4, "valid_targets_min": 807 }, { "epoch": 2.751182592242195, "grad_norm": 0.4311091763286013, "learning_rate": 3.0448363415893838e-05, "loss": 0.1933, "loss_nan_ranks": 0, "loss_rank_avg": 0.09206240624189377, "step": 1455, "valid_targets_mean": 6032.2, "valid_targets_min": 3468 }, { "epoch": 2.760643330179754, "grad_norm": 0.5188781789839139, "learning_rate": 3.0367851366210507e-05, "loss": 0.1991, "loss_nan_ranks": 0, "loss_rank_avg": 0.1059696152806282, "step": 1460, "valid_targets_mean": 5727.2, "valid_targets_min": 2454 }, { "epoch": 2.770104068117313, "grad_norm": 0.44581971955569505, "learning_rate": 3.028710889782466e-05, "loss": 0.2051, "loss_nan_ranks": 0, "loss_rank_avg": 0.0931185930967331, "step": 1465, "valid_targets_mean": 6201.0, "valid_targets_min": 2649 }, { "epoch": 2.7795648060548723, "grad_norm": 0.5236206344540041, "learning_rate": 3.020613780518476e-05, "loss": 0.213, "loss_nan_ranks": 0, "loss_rank_avg": 0.10026657581329346, "step": 1470, "valid_targets_mean": 3980.8, "valid_targets_min": 2704 }, { "epoch": 2.789025543992431, "grad_norm": 0.47947188557970327, "learning_rate": 3.0124939887820264e-05, "loss": 0.2018, "loss_nan_ranks": 0, "loss_rank_avg": 0.0977272316813469, "step": 1475, "valid_targets_mean": 5940.4, "valid_targets_min": 1596 }, { "epoch": 2.7984862819299905, "grad_norm": 0.5143786896824261, "learning_rate": 3.0043516950301695e-05, "loss": 0.2022, "loss_nan_ranks": 0, "loss_rank_avg": 0.10160660743713379, "step": 1480, "valid_targets_mean": 4532.6, "valid_targets_min": 1334 }, { "epoch": 2.80794701986755, "grad_norm": 0.5672714165027751, "learning_rate": 2.996187080220047e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.10727030038833618, "step": 1485, "valid_targets_mean": 5066.0, "valid_targets_min": 3600 }, { "epoch": 2.8174077578051087, "grad_norm": 0.4306113138051286, "learning_rate": 2.9880003258048723e-05, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.08836518228054047, "step": 1490, "valid_targets_mean": 5612.1, "valid_targets_min": 2974 }, { "epoch": 2.826868495742668, "grad_norm": 0.45476672936562934, "learning_rate": 2.9797916137298988e-05, "loss": 0.1933, "loss_nan_ranks": 0, "loss_rank_avg": 0.10338494181632996, "step": 1495, "valid_targets_mean": 5809.8, "valid_targets_min": 4592 }, { "epoch": 2.8363292336802273, "grad_norm": 0.5113296216520785, "learning_rate": 2.9715611264283723e-05, "loss": 0.215, "loss_nan_ranks": 0, "loss_rank_avg": 0.1314087212085724, "step": 1500, "valid_targets_mean": 5553.6, "valid_targets_min": 3370 }, { "epoch": 2.845789971617786, "grad_norm": 0.4672791860190598, "learning_rate": 2.96330904681748e-05, "loss": 0.2123, "loss_nan_ranks": 0, "loss_rank_avg": 0.10095086693763733, "step": 1505, "valid_targets_mean": 6344.9, "valid_targets_min": 2582 }, { "epoch": 2.8552507095553454, "grad_norm": 0.46439688017624076, "learning_rate": 2.955035558294283e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.09525062888860703, "step": 1510, "valid_targets_mean": 5109.4, "valid_targets_min": 2243 }, { "epoch": 2.8647114474929043, "grad_norm": 0.5570784090311692, "learning_rate": 2.946740844731643e-05, "loss": 0.2044, "loss_nan_ranks": 0, "loss_rank_avg": 0.10325586795806885, "step": 1515, "valid_targets_mean": 6684.5, "valid_targets_min": 3214 }, { "epoch": 2.8741721854304636, "grad_norm": 0.5490977740057562, "learning_rate": 2.9384250904741328e-05, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.13034790754318237, "step": 1520, "valid_targets_mean": 6380.8, "valid_targets_min": 3437 }, { "epoch": 2.8836329233680225, "grad_norm": 0.43561915051047767, "learning_rate": 2.9300884803339412e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.11554377526044846, "step": 1525, "valid_targets_mean": 7014.2, "valid_targets_min": 1085 }, { "epoch": 2.8930936613055818, "grad_norm": 0.46308857342667414, "learning_rate": 2.921731199586766e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.11941996216773987, "step": 1530, "valid_targets_mean": 6537.1, "valid_targets_min": 5272 }, { "epoch": 2.902554399243141, "grad_norm": 0.494911072684399, "learning_rate": 2.9133534339676954e-05, "loss": 0.2127, "loss_nan_ranks": 0, "loss_rank_avg": 0.11458069831132889, "step": 1535, "valid_targets_mean": 5210.6, "valid_targets_min": 1040 }, { "epoch": 2.9120151371807, "grad_norm": 0.4565372967082708, "learning_rate": 2.904955369667079e-05, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.1161235123872757, "step": 1540, "valid_targets_mean": 6230.1, "valid_targets_min": 3877 }, { "epoch": 2.9214758751182592, "grad_norm": 0.5257513036521178, "learning_rate": 2.896537193326394e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.07970878481864929, "step": 1545, "valid_targets_mean": 6027.5, "valid_targets_min": 1539 }, { "epoch": 2.9309366130558185, "grad_norm": 0.45864182955167, "learning_rate": 2.8880990920340934e-05, "loss": 0.2112, "loss_nan_ranks": 0, "loss_rank_avg": 0.09612005203962326, "step": 1550, "valid_targets_mean": 6322.1, "valid_targets_min": 2915 }, { "epoch": 2.9403973509933774, "grad_norm": 0.5623643431157161, "learning_rate": 2.879641253321447e-05, "loss": 0.222, "loss_nan_ranks": 0, "loss_rank_avg": 0.10082189738750458, "step": 1555, "valid_targets_mean": 5255.1, "valid_targets_min": 3086 }, { "epoch": 2.9498580889309367, "grad_norm": 0.419930873720357, "learning_rate": 2.8711638651583797e-05, "loss": 0.2144, "loss_nan_ranks": 0, "loss_rank_avg": 0.09671846032142639, "step": 1560, "valid_targets_mean": 6054.9, "valid_targets_min": 4136 }, { "epoch": 2.959318826868496, "grad_norm": 0.49967856491339036, "learning_rate": 2.862667115949287e-05, "loss": 0.1979, "loss_nan_ranks": 0, "loss_rank_avg": 0.09958822280168533, "step": 1565, "valid_targets_mean": 5343.4, "valid_targets_min": 3509 }, { "epoch": 2.968779564806055, "grad_norm": 0.4934284890500926, "learning_rate": 2.8541511945288523e-05, "loss": 0.1931, "loss_nan_ranks": 0, "loss_rank_avg": 0.09759525954723358, "step": 1570, "valid_targets_mean": 4621.4, "valid_targets_min": 926 }, { "epoch": 2.9782403027436137, "grad_norm": 0.48690869973678, "learning_rate": 2.8456162901578487e-05, "loss": 0.2099, "loss_nan_ranks": 0, "loss_rank_avg": 0.11360782384872437, "step": 1575, "valid_targets_mean": 6146.0, "valid_targets_min": 4705 }, { "epoch": 2.987701040681173, "grad_norm": 0.4432563490002925, "learning_rate": 2.837062592518933e-05, "loss": 0.2009, "loss_nan_ranks": 0, "loss_rank_avg": 0.09611258655786514, "step": 1580, "valid_targets_mean": 6504.1, "valid_targets_min": 3859 }, { "epoch": 2.9971617786187323, "grad_norm": 0.4504000335980572, "learning_rate": 2.82849029171243e-05, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.0998939573764801, "step": 1585, "valid_targets_mean": 5823.0, "valid_targets_min": 2563 }, { "epoch": 3.0056764427625353, "grad_norm": 0.42152223908884334, "learning_rate": 2.8198995782521077e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.09116984158754349, "step": 1590, "valid_targets_mean": 5818.8, "valid_targets_min": 2488 }, { "epoch": 3.0151371807000946, "grad_norm": 0.4506184282378153, "learning_rate": 2.8112906430609422e-05, "loss": 0.1913, "loss_nan_ranks": 0, "loss_rank_avg": 0.08673819899559021, "step": 1595, "valid_targets_mean": 6112.6, "valid_targets_min": 802 }, { "epoch": 3.024597918637654, "grad_norm": 0.4670333283993799, "learning_rate": 2.8026636774668783e-05, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.09848645329475403, "step": 1600, "valid_targets_mean": 5506.5, "valid_targets_min": 1044 }, { "epoch": 3.034058656575213, "grad_norm": 0.47281036714970165, "learning_rate": 2.794018873198572e-05, "loss": 0.1868, "loss_nan_ranks": 0, "loss_rank_avg": 0.08072401583194733, "step": 1605, "valid_targets_mean": 5369.8, "valid_targets_min": 3436 }, { "epoch": 3.043519394512772, "grad_norm": 0.5353102435511196, "learning_rate": 2.7853564223811335e-05, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.12510089576244354, "step": 1610, "valid_targets_mean": 6217.0, "valid_targets_min": 1687 }, { "epoch": 3.052980132450331, "grad_norm": 0.45973494835215695, "learning_rate": 2.776676517531856e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.09097345173358917, "step": 1615, "valid_targets_mean": 5983.0, "valid_targets_min": 3373 }, { "epoch": 3.0624408703878903, "grad_norm": 0.4445904803046461, "learning_rate": 2.7679793515559353e-05, "loss": 0.186, "loss_nan_ranks": 0, "loss_rank_avg": 0.09214864671230316, "step": 1620, "valid_targets_mean": 6430.4, "valid_targets_min": 3760 }, { "epoch": 3.0719016083254496, "grad_norm": 0.45328388544245035, "learning_rate": 2.759265117742188e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.08195392042398453, "step": 1625, "valid_targets_mean": 6079.6, "valid_targets_min": 1854 }, { "epoch": 3.0813623462630084, "grad_norm": 0.4690831711406225, "learning_rate": 2.7505340097587488e-05, "loss": 0.1961, "loss_nan_ranks": 0, "loss_rank_avg": 0.07273884117603302, "step": 1630, "valid_targets_mean": 4507.9, "valid_targets_min": 1597 }, { "epoch": 3.0908230842005677, "grad_norm": 0.4982006186841341, "learning_rate": 2.741786221648771e-05, "loss": 0.1907, "loss_nan_ranks": 0, "loss_rank_avg": 0.09364055097103119, "step": 1635, "valid_targets_mean": 5213.9, "valid_targets_min": 2643 }, { "epoch": 3.1002838221381266, "grad_norm": 0.46695428152371093, "learning_rate": 2.7330219478261138e-05, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.09143832325935364, "step": 1640, "valid_targets_mean": 5311.4, "valid_targets_min": 3182 }, { "epoch": 3.109744560075686, "grad_norm": 0.49109477671766877, "learning_rate": 2.724241383071019e-05, "loss": 0.1809, "loss_nan_ranks": 0, "loss_rank_avg": 0.10723137855529785, "step": 1645, "valid_targets_mean": 5124.5, "valid_targets_min": 2652 }, { "epoch": 3.119205298013245, "grad_norm": 0.5290442016673559, "learning_rate": 2.7154447225257842e-05, "loss": 0.1987, "loss_nan_ranks": 0, "loss_rank_avg": 0.09807565808296204, "step": 1650, "valid_targets_mean": 5157.8, "valid_targets_min": 3662 }, { "epoch": 3.128666035950804, "grad_norm": 0.48302398328264, "learning_rate": 2.706632161690426e-05, "loss": 0.1799, "loss_nan_ranks": 0, "loss_rank_avg": 0.09389762580394745, "step": 1655, "valid_targets_mean": 5592.8, "valid_targets_min": 1365 }, { "epoch": 3.1381267738883634, "grad_norm": 0.5462595291125024, "learning_rate": 2.697803896418334e-05, "loss": 0.1736, "loss_nan_ranks": 0, "loss_rank_avg": 0.10734741389751434, "step": 1660, "valid_targets_mean": 7472.8, "valid_targets_min": 4511 }, { "epoch": 3.1475875118259222, "grad_norm": 0.45299896030231057, "learning_rate": 2.688960122911918e-05, "loss": 0.1897, "loss_nan_ranks": 0, "loss_rank_avg": 0.08676080405712128, "step": 1665, "valid_targets_mean": 5139.8, "valid_targets_min": 1530 }, { "epoch": 3.1570482497634815, "grad_norm": 0.46794779615343984, "learning_rate": 2.6801010377182498e-05, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.08032511174678802, "step": 1670, "valid_targets_mean": 5465.9, "valid_targets_min": 3171 }, { "epoch": 3.166508987701041, "grad_norm": 0.4856091599422471, "learning_rate": 2.6712268377246913e-05, "loss": 0.1922, "loss_nan_ranks": 0, "loss_rank_avg": 0.0756412222981453, "step": 1675, "valid_targets_mean": 5436.9, "valid_targets_min": 627 }, { "epoch": 3.1759697256385997, "grad_norm": 0.47735489114418606, "learning_rate": 2.6623377201545232e-05, "loss": 0.1931, "loss_nan_ranks": 0, "loss_rank_avg": 0.09691169857978821, "step": 1680, "valid_targets_mean": 5656.2, "valid_targets_min": 2768 }, { "epoch": 3.185430463576159, "grad_norm": 0.648435722014724, "learning_rate": 2.6534338825625577e-05, "loss": 0.1871, "loss_nan_ranks": 0, "loss_rank_avg": 0.10382549464702606, "step": 1685, "valid_targets_mean": 4963.2, "valid_targets_min": 2124 }, { "epoch": 3.194891201513718, "grad_norm": 0.4544568017139005, "learning_rate": 2.644515522830751e-05, "loss": 0.1816, "loss_nan_ranks": 0, "loss_rank_avg": 0.10306219756603241, "step": 1690, "valid_targets_mean": 6162.6, "valid_targets_min": 3162 }, { "epoch": 3.204351939451277, "grad_norm": 0.4291214030564758, "learning_rate": 2.6355828391638036e-05, "loss": 0.1868, "loss_nan_ranks": 0, "loss_rank_avg": 0.09292907267808914, "step": 1695, "valid_targets_mean": 5851.0, "valid_targets_min": 2481 }, { "epoch": 3.2138126773888365, "grad_norm": 0.45738947684126524, "learning_rate": 2.6266360300847563e-05, "loss": 0.1822, "loss_nan_ranks": 0, "loss_rank_avg": 0.1131470575928688, "step": 1700, "valid_targets_mean": 6184.0, "valid_targets_min": 4281 }, { "epoch": 3.2232734153263953, "grad_norm": 0.47467928987027785, "learning_rate": 2.6176752944305783e-05, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.08909299969673157, "step": 1705, "valid_targets_mean": 6111.5, "valid_targets_min": 1841 }, { "epoch": 3.2327341532639546, "grad_norm": 0.5220218655815788, "learning_rate": 2.6087008313477466e-05, "loss": 0.1914, "loss_nan_ranks": 0, "loss_rank_avg": 0.10415120422840118, "step": 1710, "valid_targets_mean": 5395.8, "valid_targets_min": 2458 }, { "epoch": 3.242194891201514, "grad_norm": 0.4495107583419274, "learning_rate": 2.5997128402878233e-05, "loss": 0.1863, "loss_nan_ranks": 0, "loss_rank_avg": 0.09865536540746689, "step": 1715, "valid_targets_mean": 6275.6, "valid_targets_min": 869 }, { "epoch": 3.251655629139073, "grad_norm": 0.49558805488934193, "learning_rate": 2.5907115210030197e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.09733089804649353, "step": 1720, "valid_targets_mean": 5592.8, "valid_targets_min": 2553 }, { "epoch": 3.261116367076632, "grad_norm": 0.4876674508910489, "learning_rate": 2.5816970735417578e-05, "loss": 0.1883, "loss_nan_ranks": 0, "loss_rank_avg": 0.07756301015615463, "step": 1725, "valid_targets_mean": 5107.4, "valid_targets_min": 767 }, { "epoch": 3.270577105014191, "grad_norm": 0.46350530049832817, "learning_rate": 2.5726696982442258e-05, "loss": 0.1823, "loss_nan_ranks": 0, "loss_rank_avg": 0.10111121833324432, "step": 1730, "valid_targets_mean": 7226.6, "valid_targets_min": 1849 }, { "epoch": 3.2800378429517503, "grad_norm": 0.47528950500021455, "learning_rate": 2.5636295957379233e-05, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.09195686876773834, "step": 1735, "valid_targets_mean": 4867.9, "valid_targets_min": 3253 }, { "epoch": 3.289498580889309, "grad_norm": 0.40763971058722337, "learning_rate": 2.554576966933205e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.07847525179386139, "step": 1740, "valid_targets_mean": 6001.9, "valid_targets_min": 3797 }, { "epoch": 3.2989593188268684, "grad_norm": 0.5034722798936512, "learning_rate": 2.5455120130188135e-05, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.08941084891557693, "step": 1745, "valid_targets_mean": 5322.4, "valid_targets_min": 2052 }, { "epoch": 3.3084200567644277, "grad_norm": 0.5247106920229991, "learning_rate": 2.5364349354574088e-05, "loss": 0.1962, "loss_nan_ranks": 0, "loss_rank_avg": 0.1243121474981308, "step": 1750, "valid_targets_mean": 6789.8, "valid_targets_min": 4550 }, { "epoch": 3.3178807947019866, "grad_norm": 0.4698194956877122, "learning_rate": 2.527345935981093e-05, "loss": 0.1881, "loss_nan_ranks": 0, "loss_rank_avg": 0.07875726372003555, "step": 1755, "valid_targets_mean": 4845.9, "valid_targets_min": 3364 }, { "epoch": 3.327341532639546, "grad_norm": 0.48545938207903017, "learning_rate": 2.5182452165869228e-05, "loss": 0.1872, "loss_nan_ranks": 0, "loss_rank_avg": 0.10978685319423676, "step": 1760, "valid_targets_mean": 4839.4, "valid_targets_min": 2004 }, { "epoch": 3.336802270577105, "grad_norm": 0.5109977977924978, "learning_rate": 2.5091329795324216e-05, "loss": 0.1923, "loss_nan_ranks": 0, "loss_rank_avg": 0.12365156412124634, "step": 1765, "valid_targets_mean": 5637.5, "valid_targets_min": 1829 }, { "epoch": 3.346263008514664, "grad_norm": 0.4419123564130073, "learning_rate": 2.500009427331088e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.07800058275461197, "step": 1770, "valid_targets_mean": 5704.9, "valid_targets_min": 3640 }, { "epoch": 3.3557237464522234, "grad_norm": 0.45652225709926536, "learning_rate": 2.4908747627478907e-05, "loss": 0.175, "loss_nan_ranks": 0, "loss_rank_avg": 0.08916126191616058, "step": 1775, "valid_targets_mean": 5361.8, "valid_targets_min": 1670 }, { "epoch": 3.3651844843897822, "grad_norm": 0.4662575708880977, "learning_rate": 2.481729188794764e-05, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.08234363794326782, "step": 1780, "valid_targets_mean": 5800.2, "valid_targets_min": 3387 }, { "epoch": 3.3746452223273415, "grad_norm": 0.46065275741497946, "learning_rate": 2.472572908726096e-05, "loss": 0.1782, "loss_nan_ranks": 0, "loss_rank_avg": 0.09126449376344681, "step": 1785, "valid_targets_mean": 6144.8, "valid_targets_min": 3222 }, { "epoch": 3.384105960264901, "grad_norm": 0.47805331428588804, "learning_rate": 2.4634061260342107e-05, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.09208405017852783, "step": 1790, "valid_targets_mean": 5238.8, "valid_targets_min": 3058 }, { "epoch": 3.3935666982024597, "grad_norm": 0.4669551990683149, "learning_rate": 2.4542290444448474e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.09105228632688522, "step": 1795, "valid_targets_mean": 5250.6, "valid_targets_min": 1781 }, { "epoch": 3.403027436140019, "grad_norm": 0.4590860719695206, "learning_rate": 2.445041867912629e-05, "loss": 0.1873, "loss_nan_ranks": 0, "loss_rank_avg": 0.09819218516349792, "step": 1800, "valid_targets_mean": 6047.4, "valid_targets_min": 4673 }, { "epoch": 3.412488174077578, "grad_norm": 0.4362989208375527, "learning_rate": 2.4358448006165345e-05, "loss": 0.1818, "loss_nan_ranks": 0, "loss_rank_avg": 0.08421623706817627, "step": 1805, "valid_targets_mean": 6545.9, "valid_targets_min": 4508 }, { "epoch": 3.421948912015137, "grad_norm": 0.48268909107786695, "learning_rate": 2.4266380469553586e-05, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.08917456865310669, "step": 1810, "valid_targets_mean": 5196.9, "valid_targets_min": 3762 }, { "epoch": 3.4314096499526965, "grad_norm": 0.4149350257700459, "learning_rate": 2.4174218115431664e-05, "loss": 0.1764, "loss_nan_ranks": 0, "loss_rank_avg": 0.07774756103754044, "step": 1815, "valid_targets_mean": 4807.4, "valid_targets_min": 981 }, { "epoch": 3.4408703878902553, "grad_norm": 0.45130542433765514, "learning_rate": 2.408196299204751e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.09889756143093109, "step": 1820, "valid_targets_mean": 7054.2, "valid_targets_min": 4049 }, { "epoch": 3.4503311258278146, "grad_norm": 0.4989612810684145, "learning_rate": 2.3989617149710795e-05, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.0977402999997139, "step": 1825, "valid_targets_mean": 5030.0, "valid_targets_min": 1329 }, { "epoch": 3.4597918637653735, "grad_norm": 0.42867511962488714, "learning_rate": 2.3897182640747336e-05, "loss": 0.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.08124013245105743, "step": 1830, "valid_targets_mean": 5519.9, "valid_targets_min": 3561 }, { "epoch": 3.469252601702933, "grad_norm": 0.4419227173372084, "learning_rate": 2.3804661519453532e-05, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.07726781070232391, "step": 1835, "valid_targets_mean": 5114.1, "valid_targets_min": 2530 }, { "epoch": 3.478713339640492, "grad_norm": 0.4542904237834484, "learning_rate": 2.3712055842050676e-05, "loss": 0.1983, "loss_nan_ranks": 0, "loss_rank_avg": 0.11132301390171051, "step": 1840, "valid_targets_mean": 6203.1, "valid_targets_min": 3088 }, { "epoch": 3.488174077578051, "grad_norm": 0.5030994582312769, "learning_rate": 2.3619367666639256e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.09856734424829483, "step": 1845, "valid_targets_mean": 4904.2, "valid_targets_min": 2168 }, { "epoch": 3.4976348155156103, "grad_norm": 0.4591629662594089, "learning_rate": 2.3526599053153235e-05, "loss": 0.1897, "loss_nan_ranks": 0, "loss_rank_avg": 0.10106822848320007, "step": 1850, "valid_targets_mean": 5359.8, "valid_targets_min": 1166 }, { "epoch": 3.507095553453169, "grad_norm": 0.4555316025566089, "learning_rate": 2.3433752063314254e-05, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.0851808488368988, "step": 1855, "valid_targets_mean": 5974.2, "valid_targets_min": 1865 }, { "epoch": 3.5165562913907285, "grad_norm": 0.5024235368504653, "learning_rate": 2.3340828760585827e-05, "loss": 0.1855, "loss_nan_ranks": 0, "loss_rank_avg": 0.08733783662319183, "step": 1860, "valid_targets_mean": 5503.6, "valid_targets_min": 1538 }, { "epoch": 3.5260170293282878, "grad_norm": 0.4567600934191136, "learning_rate": 2.3247831210127454e-05, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.08546096086502075, "step": 1865, "valid_targets_mean": 5547.2, "valid_targets_min": 3440 }, { "epoch": 3.5354777672658466, "grad_norm": 0.4245415652272897, "learning_rate": 2.3154761478748752e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.08123698830604553, "step": 1870, "valid_targets_mean": 6187.4, "valid_targets_min": 2815 }, { "epoch": 3.544938505203406, "grad_norm": 0.4365000880114343, "learning_rate": 2.3061621634863524e-05, "loss": 0.1861, "loss_nan_ranks": 0, "loss_rank_avg": 0.10243307054042816, "step": 1875, "valid_targets_mean": 6236.2, "valid_targets_min": 2980 }, { "epoch": 3.5543992431409652, "grad_norm": 0.3915829839381538, "learning_rate": 2.296841374844375e-05, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.07283614575862885, "step": 1880, "valid_targets_mean": 6081.2, "valid_targets_min": 4115 }, { "epoch": 3.563859981078524, "grad_norm": 0.529852157820633, "learning_rate": 2.287513989097364e-05, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.07238370925188065, "step": 1885, "valid_targets_mean": 3611.2, "valid_targets_min": 1075 }, { "epoch": 3.5733207190160834, "grad_norm": 0.4293563741817337, "learning_rate": 2.2781802135403537e-05, "loss": 0.1872, "loss_nan_ranks": 0, "loss_rank_avg": 0.11047909408807755, "step": 1890, "valid_targets_mean": 7641.8, "valid_targets_min": 5269 }, { "epoch": 3.5827814569536423, "grad_norm": 0.47152119543132176, "learning_rate": 2.2688402556103906e-05, "loss": 0.1967, "loss_nan_ranks": 0, "loss_rank_avg": 0.09570799767971039, "step": 1895, "valid_targets_mean": 5092.1, "valid_targets_min": 2448 }, { "epoch": 3.5922421948912016, "grad_norm": 0.45350737772342575, "learning_rate": 2.2594943228819202e-05, "loss": 0.1862, "loss_nan_ranks": 0, "loss_rank_avg": 0.08095633238554001, "step": 1900, "valid_targets_mean": 5481.2, "valid_targets_min": 1967 }, { "epoch": 3.6017029328287604, "grad_norm": 0.4755232122518845, "learning_rate": 2.2501426230621703e-05, "loss": 0.183, "loss_nan_ranks": 0, "loss_rank_avg": 0.10834428668022156, "step": 1905, "valid_targets_mean": 5960.0, "valid_targets_min": 1879 }, { "epoch": 3.6111636707663197, "grad_norm": 0.45128717519347217, "learning_rate": 2.240785363986543e-05, "loss": 0.1919, "loss_nan_ranks": 0, "loss_rank_avg": 0.09623943269252777, "step": 1910, "valid_targets_mean": 5373.8, "valid_targets_min": 1537 }, { "epoch": 3.620624408703879, "grad_norm": 0.4387093767351713, "learning_rate": 2.2314227536139893e-05, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.09231283515691757, "step": 1915, "valid_targets_mean": 6112.9, "valid_targets_min": 4051 }, { "epoch": 3.630085146641438, "grad_norm": 0.4402931522259467, "learning_rate": 2.2220550000223886e-05, "loss": 0.1924, "loss_nan_ranks": 0, "loss_rank_avg": 0.0882110446691513, "step": 1920, "valid_targets_mean": 6283.5, "valid_targets_min": 1538 }, { "epoch": 3.639545884578997, "grad_norm": 0.5398531884274245, "learning_rate": 2.212682311403926e-05, "loss": 0.1909, "loss_nan_ranks": 0, "loss_rank_avg": 0.10761941969394684, "step": 1925, "valid_targets_mean": 4044.2, "valid_targets_min": 1596 }, { "epoch": 3.6490066225165565, "grad_norm": 0.4565238432681483, "learning_rate": 2.2033048960604648e-05, "loss": 0.1862, "loss_nan_ranks": 0, "loss_rank_avg": 0.09304339438676834, "step": 1930, "valid_targets_mean": 6390.2, "valid_targets_min": 4754 }, { "epoch": 3.6584673604541154, "grad_norm": 0.44850280991108504, "learning_rate": 2.1939229623989146e-05, "loss": 0.1906, "loss_nan_ranks": 0, "loss_rank_avg": 0.11164131760597229, "step": 1935, "valid_targets_mean": 6644.2, "valid_targets_min": 1349 }, { "epoch": 3.6679280983916747, "grad_norm": 0.4640262426777603, "learning_rate": 2.184536718926604e-05, "loss": 0.192, "loss_nan_ranks": 0, "loss_rank_avg": 0.09215334802865982, "step": 1940, "valid_targets_mean": 5631.9, "valid_targets_min": 3043 }, { "epoch": 3.6773888363292335, "grad_norm": 0.46824021321893416, "learning_rate": 2.1751463742466437e-05, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.0910329818725586, "step": 1945, "valid_targets_mean": 5201.4, "valid_targets_min": 3511 }, { "epoch": 3.686849574266793, "grad_norm": 0.4431506823294413, "learning_rate": 2.1657521370532897e-05, "loss": 0.1907, "loss_nan_ranks": 0, "loss_rank_avg": 0.08795459568500519, "step": 1950, "valid_targets_mean": 5397.9, "valid_targets_min": 3132 }, { "epoch": 3.6963103122043517, "grad_norm": 0.4633802916301476, "learning_rate": 2.1563542161273077e-05, "loss": 0.1873, "loss_nan_ranks": 0, "loss_rank_avg": 0.12115620076656342, "step": 1955, "valid_targets_mean": 6784.1, "valid_targets_min": 5711 }, { "epoch": 3.705771050141911, "grad_norm": 0.524813702266504, "learning_rate": 2.146952820331332e-05, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.0889645665884018, "step": 1960, "valid_targets_mean": 4261.2, "valid_targets_min": 1085 }, { "epoch": 3.7152317880794703, "grad_norm": 0.5179766333042282, "learning_rate": 2.1375481586052237e-05, "loss": 0.1968, "loss_nan_ranks": 0, "loss_rank_avg": 0.15775936841964722, "step": 1965, "valid_targets_mean": 5552.2, "valid_targets_min": 1842 }, { "epoch": 3.724692526017029, "grad_norm": 0.43519671742917404, "learning_rate": 2.128140439961426e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.07054340094327927, "step": 1970, "valid_targets_mean": 5188.1, "valid_targets_min": 2924 }, { "epoch": 3.7341532639545885, "grad_norm": 0.4910575570595109, "learning_rate": 2.1187298734803214e-05, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.08431971073150635, "step": 1975, "valid_targets_mean": 4949.9, "valid_targets_min": 797 }, { "epoch": 3.7436140018921478, "grad_norm": 0.4630093421088686, "learning_rate": 2.1093166683055832e-05, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.11314146220684052, "step": 1980, "valid_targets_mean": 7022.4, "valid_targets_min": 5342 }, { "epoch": 3.7530747398297066, "grad_norm": 0.535517789749373, "learning_rate": 2.0999010336395273e-05, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.09282414615154266, "step": 1985, "valid_targets_mean": 6285.4, "valid_targets_min": 2106 }, { "epoch": 3.762535477767266, "grad_norm": 0.5571000940662704, "learning_rate": 2.0904831787384645e-05, "loss": 0.1791, "loss_nan_ranks": 0, "loss_rank_avg": 0.07217632234096527, "step": 1990, "valid_targets_mean": 6126.5, "valid_targets_min": 3404 }, { "epoch": 3.7719962157048252, "grad_norm": 0.4268240494799538, "learning_rate": 2.081063312908049e-05, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.07058891654014587, "step": 1995, "valid_targets_mean": 5600.5, "valid_targets_min": 3873 }, { "epoch": 3.781456953642384, "grad_norm": 0.5099795351473646, "learning_rate": 2.0716416454986242e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.10760383307933807, "step": 2000, "valid_targets_mean": 5524.0, "valid_targets_min": 2901 }, { "epoch": 3.790917691579943, "grad_norm": 0.5097294694697546, "learning_rate": 2.0622183859005762e-05, "loss": 0.1955, "loss_nan_ranks": 0, "loss_rank_avg": 0.0837247222661972, "step": 2005, "valid_targets_mean": 5495.4, "valid_targets_min": 3572 }, { "epoch": 3.8003784295175023, "grad_norm": 0.4534635455267388, "learning_rate": 2.052793743539673e-05, "loss": 0.1847, "loss_nan_ranks": 0, "loss_rank_avg": 0.08845619112253189, "step": 2010, "valid_targets_mean": 4920.2, "valid_targets_min": 1973 }, { "epoch": 3.8098391674550616, "grad_norm": 0.4737421696248978, "learning_rate": 2.043367927872416e-05, "loss": 0.1766, "loss_nan_ranks": 0, "loss_rank_avg": 0.08393751084804535, "step": 2015, "valid_targets_mean": 4830.4, "valid_targets_min": 2229 }, { "epoch": 3.8192999053926204, "grad_norm": 0.5249850580959375, "learning_rate": 2.0339411483813812e-05, "loss": 0.1975, "loss_nan_ranks": 0, "loss_rank_avg": 0.09723856300115585, "step": 2020, "valid_targets_mean": 6302.8, "valid_targets_min": 4072 }, { "epoch": 3.8287606433301797, "grad_norm": 0.4980980063470468, "learning_rate": 2.0245136145705648e-05, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.09031252562999725, "step": 2025, "valid_targets_mean": 5300.4, "valid_targets_min": 874 }, { "epoch": 3.838221381267739, "grad_norm": 0.44214747777838764, "learning_rate": 2.0150855359607293e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.07880973070859909, "step": 2030, "valid_targets_mean": 5693.4, "valid_targets_min": 4152 }, { "epoch": 3.847682119205298, "grad_norm": 0.46991534430567616, "learning_rate": 2.0056571220847427e-05, "loss": 0.1896, "loss_nan_ranks": 0, "loss_rank_avg": 0.09112639725208282, "step": 2035, "valid_targets_mean": 5097.6, "valid_targets_min": 746 }, { "epoch": 3.857142857142857, "grad_norm": 0.4257490092767326, "learning_rate": 1.9962285824829245e-05, "loss": 0.1777, "loss_nan_ranks": 0, "loss_rank_avg": 0.08267439901828766, "step": 2040, "valid_targets_mean": 6324.6, "valid_targets_min": 3184 }, { "epoch": 3.8666035950804165, "grad_norm": 0.45072050304120914, "learning_rate": 1.986800126698389e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.09375502169132233, "step": 2045, "valid_targets_mean": 5897.2, "valid_targets_min": 4521 }, { "epoch": 3.8760643330179754, "grad_norm": 0.4256841534823553, "learning_rate": 1.9773719642723883e-05, "loss": 0.1882, "loss_nan_ranks": 0, "loss_rank_avg": 0.07670668512582779, "step": 2050, "valid_targets_mean": 6021.9, "valid_targets_min": 5247 }, { "epoch": 3.8855250709555347, "grad_norm": 0.46173000109780016, "learning_rate": 1.967944304739653e-05, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.10058119893074036, "step": 2055, "valid_targets_mean": 6129.8, "valid_targets_min": 1951 }, { "epoch": 3.8949858088930935, "grad_norm": 0.49198637917271304, "learning_rate": 1.958517357623738e-05, "loss": 0.2021, "loss_nan_ranks": 0, "loss_rank_avg": 0.0934433713555336, "step": 2060, "valid_targets_mean": 4680.2, "valid_targets_min": 1565 }, { "epoch": 3.904446546830653, "grad_norm": 0.41090104211443634, "learning_rate": 1.949091332432367e-05, "loss": 0.1692, "loss_nan_ranks": 0, "loss_rank_avg": 0.10091197490692139, "step": 2065, "valid_targets_mean": 7233.2, "valid_targets_min": 5038 }, { "epoch": 3.9139072847682117, "grad_norm": 0.4804194009201903, "learning_rate": 1.939666438652772e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.08922461420297623, "step": 2070, "valid_targets_mean": 5340.9, "valid_targets_min": 950 }, { "epoch": 3.923368022705771, "grad_norm": 0.4806891457866739, "learning_rate": 1.9302428857470406e-05, "loss": 0.1951, "loss_nan_ranks": 0, "loss_rank_avg": 0.11550113558769226, "step": 2075, "valid_targets_mean": 6336.2, "valid_targets_min": 3086 }, { "epoch": 3.9328287606433303, "grad_norm": 0.4278376583395593, "learning_rate": 1.9208208831474618e-05, "loss": 0.1894, "loss_nan_ranks": 0, "loss_rank_avg": 0.08728399872779846, "step": 2080, "valid_targets_mean": 5975.9, "valid_targets_min": 2398 }, { "epoch": 3.942289498580889, "grad_norm": 0.46404606456299635, "learning_rate": 1.9114006402518676e-05, "loss": 0.1791, "loss_nan_ranks": 0, "loss_rank_avg": 0.07773632556200027, "step": 2085, "valid_targets_mean": 5166.8, "valid_targets_min": 1719 }, { "epoch": 3.9517502365184485, "grad_norm": 0.45528452379559725, "learning_rate": 1.901982366418985e-05, "loss": 0.1744, "loss_nan_ranks": 0, "loss_rank_avg": 0.09388162940740585, "step": 2090, "valid_targets_mean": 6227.4, "valid_targets_min": 4431 }, { "epoch": 3.961210974456008, "grad_norm": 0.438918695698072, "learning_rate": 1.892566270963777e-05, "loss": 0.1802, "loss_nan_ranks": 0, "loss_rank_avg": 0.08582787215709686, "step": 2095, "valid_targets_mean": 5624.0, "valid_targets_min": 501 }, { "epoch": 3.9706717123935666, "grad_norm": 0.44371795309461276, "learning_rate": 1.883152563152795e-05, "loss": 0.1898, "loss_nan_ranks": 0, "loss_rank_avg": 0.09151076525449753, "step": 2100, "valid_targets_mean": 5600.0, "valid_targets_min": 3358 }, { "epoch": 3.980132450331126, "grad_norm": 0.4515824110525669, "learning_rate": 1.8737414521995268e-05, "loss": 0.1947, "loss_nan_ranks": 0, "loss_rank_avg": 0.09049001336097717, "step": 2105, "valid_targets_mean": 5852.4, "valid_targets_min": 3330 }, { "epoch": 3.989593188268685, "grad_norm": 0.49711976335752656, "learning_rate": 1.8643331472597445e-05, "loss": 0.1941, "loss_nan_ranks": 0, "loss_rank_avg": 0.08675132691860199, "step": 2110, "valid_targets_mean": 4558.4, "valid_targets_min": 1326 }, { "epoch": 3.999053926206244, "grad_norm": 0.45261577331220815, "learning_rate": 1.8549278574268618e-05, "loss": 0.1903, "loss_nan_ranks": 0, "loss_rank_avg": 0.08939523249864578, "step": 2115, "valid_targets_mean": 6261.1, "valid_targets_min": 2221 }, { "epoch": 4.007568590350047, "grad_norm": 0.47605379171873335, "learning_rate": 1.8455257917272814e-05, "loss": 0.181, "loss_nan_ranks": 0, "loss_rank_avg": 0.07639576494693756, "step": 2120, "valid_targets_mean": 6170.1, "valid_targets_min": 4187 }, { "epoch": 4.017029328287607, "grad_norm": 0.47606983027063804, "learning_rate": 1.836127159115752e-05, "loss": 0.1709, "loss_nan_ranks": 0, "loss_rank_avg": 0.07952439785003662, "step": 2125, "valid_targets_mean": 5953.5, "valid_targets_min": 2745 }, { "epoch": 4.026490066225166, "grad_norm": 0.47621520504940396, "learning_rate": 1.8267321684707246e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.07942505925893784, "step": 2130, "valid_targets_mean": 5075.5, "valid_targets_min": 2145 }, { "epoch": 4.035950804162725, "grad_norm": 0.44019831135362675, "learning_rate": 1.817341028589709e-05, "loss": 0.1771, "loss_nan_ranks": 0, "loss_rank_avg": 0.10214540362358093, "step": 2135, "valid_targets_mean": 7163.8, "valid_targets_min": 2462 }, { "epoch": 4.045411542100283, "grad_norm": 0.4937271391982351, "learning_rate": 1.8079539481846366e-05, "loss": 0.1617, "loss_nan_ranks": 0, "loss_rank_avg": 0.07459040731191635, "step": 2140, "valid_targets_mean": 6227.9, "valid_targets_min": 3553 }, { "epoch": 4.054872280037843, "grad_norm": 0.4565164265520384, "learning_rate": 1.7985711358772165e-05, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.07631679624319077, "step": 2145, "valid_targets_mean": 6136.8, "valid_targets_min": 4986 }, { "epoch": 4.064333017975402, "grad_norm": 0.4635680900045017, "learning_rate": 1.789192800194305e-05, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.06983435899019241, "step": 2150, "valid_targets_mean": 5001.0, "valid_targets_min": 3895 }, { "epoch": 4.073793755912961, "grad_norm": 0.4728478107816903, "learning_rate": 1.7798191495632656e-05, "loss": 0.1719, "loss_nan_ranks": 0, "loss_rank_avg": 0.07341806590557098, "step": 2155, "valid_targets_mean": 6114.5, "valid_targets_min": 3650 }, { "epoch": 4.083254493850521, "grad_norm": 0.43092833708069367, "learning_rate": 1.7704503923073414e-05, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.07183924317359924, "step": 2160, "valid_targets_mean": 5524.2, "valid_targets_min": 2899 }, { "epoch": 4.0927152317880795, "grad_norm": 0.44675377011480427, "learning_rate": 1.7610867366410228e-05, "loss": 0.1624, "loss_nan_ranks": 0, "loss_rank_avg": 0.08465928584337234, "step": 2165, "valid_targets_mean": 6738.9, "valid_targets_min": 4782 }, { "epoch": 4.102175969725638, "grad_norm": 0.5030878317134609, "learning_rate": 1.751728390665422e-05, "loss": 0.1816, "loss_nan_ranks": 0, "loss_rank_avg": 0.10309462249279022, "step": 2170, "valid_targets_mean": 6185.4, "valid_targets_min": 4371 }, { "epoch": 4.111636707663198, "grad_norm": 0.46070987441440847, "learning_rate": 1.742375562363645e-05, "loss": 0.1768, "loss_nan_ranks": 0, "loss_rank_avg": 0.0805835872888565, "step": 2175, "valid_targets_mean": 5687.2, "valid_targets_min": 1089 }, { "epoch": 4.121097445600757, "grad_norm": 0.4770082395886628, "learning_rate": 1.7330284595961714e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.07416245341300964, "step": 2180, "valid_targets_mean": 4618.5, "valid_targets_min": 1323 }, { "epoch": 4.130558183538316, "grad_norm": 0.5071152049171963, "learning_rate": 1.7236872900962364e-05, "loss": 0.176, "loss_nan_ranks": 0, "loss_rank_avg": 0.0895686000585556, "step": 2185, "valid_targets_mean": 5050.6, "valid_targets_min": 1848 }, { "epoch": 4.140018921475875, "grad_norm": 0.49903371784517364, "learning_rate": 1.7143522614652087e-05, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.079046830534935, "step": 2190, "valid_targets_mean": 6004.9, "valid_targets_min": 1044 }, { "epoch": 4.149479659413434, "grad_norm": 0.4735587488254344, "learning_rate": 1.7050235811679842e-05, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.07874190807342529, "step": 2195, "valid_targets_mean": 5291.8, "valid_targets_min": 3722 }, { "epoch": 4.158940397350993, "grad_norm": 0.4906110256360143, "learning_rate": 1.6957014565283686e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.08479055762290955, "step": 2200, "valid_targets_mean": 5371.8, "valid_targets_min": 3449 }, { "epoch": 4.168401135288552, "grad_norm": 0.45624047631312886, "learning_rate": 1.6863860947244734e-05, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.0816778838634491, "step": 2205, "valid_targets_mean": 6315.0, "valid_targets_min": 2799 }, { "epoch": 4.177861873226112, "grad_norm": 0.5699518768002438, "learning_rate": 1.67707770278411e-05, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.10105790197849274, "step": 2210, "valid_targets_mean": 5623.0, "valid_targets_min": 1596 }, { "epoch": 4.187322611163671, "grad_norm": 0.5215881624136443, "learning_rate": 1.6677764875801896e-05, "loss": 0.1738, "loss_nan_ranks": 0, "loss_rank_avg": 0.08306705951690674, "step": 2215, "valid_targets_mean": 4635.6, "valid_targets_min": 2345 }, { "epoch": 4.19678334910123, "grad_norm": 0.51490913642158, "learning_rate": 1.658482655826125e-05, "loss": 0.1673, "loss_nan_ranks": 0, "loss_rank_avg": 0.08734717965126038, "step": 2220, "valid_targets_mean": 5146.8, "valid_targets_min": 807 }, { "epoch": 4.206244087038789, "grad_norm": 0.5117573321781882, "learning_rate": 1.649196414071237e-05, "loss": 0.1758, "loss_nan_ranks": 0, "loss_rank_avg": 0.08336880803108215, "step": 2225, "valid_targets_mean": 5012.2, "valid_targets_min": 3057 }, { "epoch": 4.215704824976348, "grad_norm": 0.47924671481016884, "learning_rate": 1.6399179686961626e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.08556775748729706, "step": 2230, "valid_targets_mean": 6178.0, "valid_targets_min": 4463 }, { "epoch": 4.225165562913907, "grad_norm": 0.4866400336787381, "learning_rate": 1.630647525908271e-05, "loss": 0.1772, "loss_nan_ranks": 0, "loss_rank_avg": 0.08188188076019287, "step": 2235, "valid_targets_mean": 5382.4, "valid_targets_min": 3049 }, { "epoch": 4.234626300851467, "grad_norm": 0.4733351788699037, "learning_rate": 1.621385291737076e-05, "loss": 0.1769, "loss_nan_ranks": 0, "loss_rank_avg": 0.07345275580883026, "step": 2240, "valid_targets_mean": 4783.5, "valid_targets_min": 2041 }, { "epoch": 4.244087038789026, "grad_norm": 0.4767465652248829, "learning_rate": 1.6121314720296655e-05, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.08385774493217468, "step": 2245, "valid_targets_mean": 5386.6, "valid_targets_min": 3619 }, { "epoch": 4.253547776726585, "grad_norm": 0.4789402563300116, "learning_rate": 1.6028862724461162e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.09487953782081604, "step": 2250, "valid_targets_mean": 5879.5, "valid_targets_min": 4405 }, { "epoch": 4.263008514664143, "grad_norm": 0.443105700964735, "learning_rate": 1.593649898454932e-05, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.08754053711891174, "step": 2255, "valid_targets_mean": 5570.6, "valid_targets_min": 2637 }, { "epoch": 4.272469252601703, "grad_norm": 0.5369571580173819, "learning_rate": 1.5844225553284708e-05, "loss": 0.1694, "loss_nan_ranks": 0, "loss_rank_avg": 0.07940442860126495, "step": 2260, "valid_targets_mean": 3860.5, "valid_targets_min": 1223 }, { "epoch": 4.281929990539262, "grad_norm": 0.4378025466243674, "learning_rate": 1.5752044481383875e-05, "loss": 0.1744, "loss_nan_ranks": 0, "loss_rank_avg": 0.09036465734243393, "step": 2265, "valid_targets_mean": 6985.9, "valid_targets_min": 4865 }, { "epoch": 4.291390728476821, "grad_norm": 0.4820274642035886, "learning_rate": 1.565995781751073e-05, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.06915217638015747, "step": 2270, "valid_targets_mean": 4996.8, "valid_targets_min": 3137 }, { "epoch": 4.300851466414381, "grad_norm": 0.48393554696939894, "learning_rate": 1.556796760823105e-05, "loss": 0.1772, "loss_nan_ranks": 0, "loss_rank_avg": 0.08670508116483688, "step": 2275, "valid_targets_mean": 5565.1, "valid_targets_min": 2756 }, { "epoch": 4.3103122043519395, "grad_norm": 0.48251450451372285, "learning_rate": 1.5476075897966943e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.09289459884166718, "step": 2280, "valid_targets_mean": 7153.2, "valid_targets_min": 5303 }, { "epoch": 4.319772942289498, "grad_norm": 0.4834522235548724, "learning_rate": 1.538428472895145e-05, "loss": 0.1758, "loss_nan_ranks": 0, "loss_rank_avg": 0.09639063477516174, "step": 2285, "valid_targets_mean": 6249.6, "valid_targets_min": 3680 }, { "epoch": 4.329233680227058, "grad_norm": 0.48082534237663743, "learning_rate": 1.5292596141183156e-05, "loss": 0.1734, "loss_nan_ranks": 0, "loss_rank_avg": 0.08183325827121735, "step": 2290, "valid_targets_mean": 5584.1, "valid_targets_min": 926 }, { "epoch": 4.338694418164617, "grad_norm": 0.5160950372006214, "learning_rate": 1.5201012172380834e-05, "loss": 0.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.07628428936004639, "step": 2295, "valid_targets_mean": 4932.9, "valid_targets_min": 802 }, { "epoch": 4.348155156102176, "grad_norm": 0.47312968698632135, "learning_rate": 1.5109534857938181e-05, "loss": 0.1698, "loss_nan_ranks": 0, "loss_rank_avg": 0.08713920414447784, "step": 2300, "valid_targets_mean": 5098.2, "valid_targets_min": 2424 }, { "epoch": 4.357615894039735, "grad_norm": 0.5690038403341784, "learning_rate": 1.501816623087857e-05, "loss": 0.1734, "loss_nan_ranks": 0, "loss_rank_avg": 0.07945723831653595, "step": 2305, "valid_targets_mean": 4997.6, "valid_targets_min": 627 }, { "epoch": 4.3670766319772945, "grad_norm": 0.497199283715766, "learning_rate": 1.4926908321809856e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.09394356608390808, "step": 2310, "valid_targets_mean": 4530.1, "valid_targets_min": 1636 }, { "epoch": 4.376537369914853, "grad_norm": 0.5548377322347214, "learning_rate": 1.4835763158879264e-05, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.08540955185890198, "step": 2315, "valid_targets_mean": 6093.8, "valid_targets_min": 3232 }, { "epoch": 4.385998107852412, "grad_norm": 0.44852133106940606, "learning_rate": 1.474473276772831e-05, "loss": 0.1681, "loss_nan_ranks": 0, "loss_rank_avg": 0.06924474239349365, "step": 2320, "valid_targets_mean": 5439.8, "valid_targets_min": 1041 }, { "epoch": 4.395458845789972, "grad_norm": 0.46438627822043954, "learning_rate": 1.4653819171447802e-05, "loss": 0.1911, "loss_nan_ranks": 0, "loss_rank_avg": 0.06627480685710907, "step": 2325, "valid_targets_mean": 5166.6, "valid_targets_min": 2940 }, { "epoch": 4.404919583727531, "grad_norm": 0.47334974760463755, "learning_rate": 1.4563024390532828e-05, "loss": 0.1711, "loss_nan_ranks": 0, "loss_rank_avg": 0.07604990899562836, "step": 2330, "valid_targets_mean": 5193.4, "valid_targets_min": 3623 }, { "epoch": 4.41438032166509, "grad_norm": 0.5009910260511469, "learning_rate": 1.4472350442837892e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.09670796990394592, "step": 2335, "valid_targets_mean": 5357.4, "valid_targets_min": 2511 }, { "epoch": 4.423841059602649, "grad_norm": 0.46984143631798586, "learning_rate": 1.4381799343532073e-05, "loss": 0.1702, "loss_nan_ranks": 0, "loss_rank_avg": 0.0717625617980957, "step": 2340, "valid_targets_mean": 5341.1, "valid_targets_min": 2983 }, { "epoch": 4.433301797540208, "grad_norm": 0.513188568847778, "learning_rate": 1.4291373105054201e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.09518257528543472, "step": 2345, "valid_targets_mean": 5414.4, "valid_targets_min": 2589 }, { "epoch": 4.442762535477767, "grad_norm": 0.5036887196599628, "learning_rate": 1.4201073737068182e-05, "loss": 0.1697, "loss_nan_ranks": 0, "loss_rank_avg": 0.08094947040081024, "step": 2350, "valid_targets_mean": 4974.0, "valid_targets_min": 2419 }, { "epoch": 4.452223273415326, "grad_norm": 0.4912192592188947, "learning_rate": 1.411090324641829e-05, "loss": 0.1714, "loss_nan_ranks": 0, "loss_rank_avg": 0.07559478282928467, "step": 2355, "valid_targets_mean": 5369.4, "valid_targets_min": 1880 }, { "epoch": 4.461684011352886, "grad_norm": 0.44942292554051916, "learning_rate": 1.4020863637084597e-05, "loss": 0.1727, "loss_nan_ranks": 0, "loss_rank_avg": 0.08044009655714035, "step": 2360, "valid_targets_mean": 6921.1, "valid_targets_min": 3977 }, { "epoch": 4.471144749290445, "grad_norm": 0.5240965033441205, "learning_rate": 1.3930956910138407e-05, "loss": 0.1766, "loss_nan_ranks": 0, "loss_rank_avg": 0.09544815123081207, "step": 2365, "valid_targets_mean": 5657.5, "valid_targets_min": 1822 }, { "epoch": 4.4806054872280034, "grad_norm": 0.48796641053338774, "learning_rate": 1.3841185063697817e-05, "loss": 0.166, "loss_nan_ranks": 0, "loss_rank_avg": 0.09811213612556458, "step": 2370, "valid_targets_mean": 6156.5, "valid_targets_min": 1085 }, { "epoch": 4.490066225165563, "grad_norm": 0.5152407926424893, "learning_rate": 1.3751550092883275e-05, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.08462321758270264, "step": 2375, "valid_targets_mean": 4567.0, "valid_targets_min": 1628 }, { "epoch": 4.499526963103122, "grad_norm": 0.42297714903267936, "learning_rate": 1.366205398977329e-05, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.08978421986103058, "step": 2380, "valid_targets_mean": 6711.9, "valid_targets_min": 5091 }, { "epoch": 4.508987701040681, "grad_norm": 0.5111927828536853, "learning_rate": 1.3572698743360086e-05, "loss": 0.1706, "loss_nan_ranks": 0, "loss_rank_avg": 0.10813774168491364, "step": 2385, "valid_targets_mean": 6821.0, "valid_targets_min": 2143 }, { "epoch": 4.518448438978241, "grad_norm": 0.5302388829745546, "learning_rate": 1.3483486339505476e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.07856719195842743, "step": 2390, "valid_targets_mean": 5057.1, "valid_targets_min": 1893 }, { "epoch": 4.5279091769157995, "grad_norm": 0.5657954220828462, "learning_rate": 1.3394418760896665e-05, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.07074756920337677, "step": 2395, "valid_targets_mean": 5564.0, "valid_targets_min": 3312 }, { "epoch": 4.537369914853358, "grad_norm": 0.44816213903081314, "learning_rate": 1.3305497987002214e-05, "loss": 0.1766, "loss_nan_ranks": 0, "loss_rank_avg": 0.10855835676193237, "step": 2400, "valid_targets_mean": 7582.5, "valid_targets_min": 4586 }, { "epoch": 4.546830652790918, "grad_norm": 0.4969643603677432, "learning_rate": 1.3216725994028065e-05, "loss": 0.1645, "loss_nan_ranks": 0, "loss_rank_avg": 0.07549931108951569, "step": 2405, "valid_targets_mean": 4293.8, "valid_targets_min": 2050 }, { "epoch": 4.556291390728477, "grad_norm": 0.49714025262854705, "learning_rate": 1.3128104754873592e-05, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.09053511917591095, "step": 2410, "valid_targets_mean": 6208.1, "valid_targets_min": 4083 }, { "epoch": 4.565752128666036, "grad_norm": 0.4658167126447159, "learning_rate": 1.3039636239087751e-05, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.08036954700946808, "step": 2415, "valid_targets_mean": 6865.4, "valid_targets_min": 5076 }, { "epoch": 4.575212866603595, "grad_norm": 0.4915257649668184, "learning_rate": 1.2951322412825333e-05, "loss": 0.1644, "loss_nan_ranks": 0, "loss_rank_avg": 0.09244567155838013, "step": 2420, "valid_targets_mean": 5903.8, "valid_targets_min": 2127 }, { "epoch": 4.5846736045411545, "grad_norm": 0.4567472797832718, "learning_rate": 1.2863165238803252e-05, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.07485067844390869, "step": 2425, "valid_targets_mean": 4524.6, "valid_targets_min": 1753 }, { "epoch": 4.594134342478713, "grad_norm": 0.5247752395742293, "learning_rate": 1.2775166676256942e-05, "loss": 0.1723, "loss_nan_ranks": 0, "loss_rank_avg": 0.08491607010364532, "step": 2430, "valid_targets_mean": 5091.6, "valid_targets_min": 2419 }, { "epoch": 4.603595080416272, "grad_norm": 0.512670381259889, "learning_rate": 1.2687328680896784e-05, "loss": 0.1735, "loss_nan_ranks": 0, "loss_rank_avg": 0.09027966111898422, "step": 2435, "valid_targets_mean": 5586.4, "valid_targets_min": 1893 }, { "epoch": 4.613055818353832, "grad_norm": 0.5086538957041402, "learning_rate": 1.2599653204864656e-05, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.08313116431236267, "step": 2440, "valid_targets_mean": 4873.9, "valid_targets_min": 3246 }, { "epoch": 4.622516556291391, "grad_norm": 0.48363850099286876, "learning_rate": 1.2512142196690573e-05, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.0974661335349083, "step": 2445, "valid_targets_mean": 6357.2, "valid_targets_min": 807 }, { "epoch": 4.63197729422895, "grad_norm": 0.4322906872044424, "learning_rate": 1.2424797601249328e-05, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.06740396469831467, "step": 2450, "valid_targets_mean": 5795.9, "valid_targets_min": 3054 }, { "epoch": 4.6414380321665085, "grad_norm": 0.5417059342860636, "learning_rate": 1.2337621359717333e-05, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.08276567608118057, "step": 2455, "valid_targets_mean": 6291.6, "valid_targets_min": 3234 }, { "epoch": 4.650898770104068, "grad_norm": 0.4795632027077425, "learning_rate": 1.2250615409529427e-05, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.07418248802423477, "step": 2460, "valid_targets_mean": 5510.9, "valid_targets_min": 1409 }, { "epoch": 4.660359508041627, "grad_norm": 0.49378217745950864, "learning_rate": 1.2163781684335831e-05, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.09448840469121933, "step": 2465, "valid_targets_mean": 7180.1, "valid_targets_min": 4937 }, { "epoch": 4.669820245979186, "grad_norm": 0.5039190071239315, "learning_rate": 1.2077122113959186e-05, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.08793889731168747, "step": 2470, "valid_targets_mean": 5509.6, "valid_targets_min": 1816 }, { "epoch": 4.679280983916746, "grad_norm": 0.4931542543015456, "learning_rate": 1.1990638624351659e-05, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.08114581555128098, "step": 2475, "valid_targets_mean": 6421.4, "valid_targets_min": 3250 }, { "epoch": 4.688741721854305, "grad_norm": 0.5489707303546564, "learning_rate": 1.1904333137552124e-05, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.08878085017204285, "step": 2480, "valid_targets_mean": 5445.0, "valid_targets_min": 2077 }, { "epoch": 4.6982024597918635, "grad_norm": 0.4837787673198404, "learning_rate": 1.1818207571643484e-05, "loss": 0.1581, "loss_nan_ranks": 0, "loss_rank_avg": 0.07125557959079742, "step": 2485, "valid_targets_mean": 4444.9, "valid_targets_min": 2616 }, { "epoch": 4.707663197729423, "grad_norm": 0.5083177062405144, "learning_rate": 1.173226384070999e-05, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.07098717987537384, "step": 2490, "valid_targets_mean": 5205.4, "valid_targets_min": 1173 }, { "epoch": 4.717123935666982, "grad_norm": 0.5575925952865973, "learning_rate": 1.1646503854794746e-05, "loss": 0.1667, "loss_nan_ranks": 0, "loss_rank_avg": 0.11164502054452896, "step": 2495, "valid_targets_mean": 5729.4, "valid_targets_min": 1426 }, { "epoch": 4.726584673604541, "grad_norm": 0.5223389265424682, "learning_rate": 1.1560929519857246e-05, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.08164171129465103, "step": 2500, "valid_targets_mean": 4500.6, "valid_targets_min": 1089 }, { "epoch": 4.736045411542101, "grad_norm": 0.5383697567770299, "learning_rate": 1.1475542737730998e-05, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.08602418750524521, "step": 2505, "valid_targets_mean": 5347.1, "valid_targets_min": 2448 }, { "epoch": 4.7455061494796595, "grad_norm": 0.5239083651471129, "learning_rate": 1.1390345406081286e-05, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.08246322721242905, "step": 2510, "valid_targets_mean": 5422.6, "valid_targets_min": 2932 }, { "epoch": 4.754966887417218, "grad_norm": 0.48646478838090534, "learning_rate": 1.1305339418362978e-05, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.07415419816970825, "step": 2515, "valid_targets_mean": 5297.6, "valid_targets_min": 1772 }, { "epoch": 4.764427625354777, "grad_norm": 0.4743203401979834, "learning_rate": 1.1220526663778441e-05, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.09026531875133514, "step": 2520, "valid_targets_mean": 6998.8, "valid_targets_min": 4582 }, { "epoch": 4.773888363292337, "grad_norm": 0.49095486039648706, "learning_rate": 1.113590902723557e-05, "loss": 0.1629, "loss_nan_ranks": 0, "loss_rank_avg": 0.08181262016296387, "step": 2525, "valid_targets_mean": 5897.6, "valid_targets_min": 2450 }, { "epoch": 4.783349101229896, "grad_norm": 0.4902911174921005, "learning_rate": 1.1051488389305875e-05, "loss": 0.1593, "loss_nan_ranks": 0, "loss_rank_avg": 0.08572474122047424, "step": 2530, "valid_targets_mean": 5079.1, "valid_targets_min": 571 }, { "epoch": 4.792809839167455, "grad_norm": 0.4613815865050699, "learning_rate": 1.0967266626182726e-05, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.07123850286006927, "step": 2535, "valid_targets_mean": 6506.1, "valid_targets_min": 4824 }, { "epoch": 4.8022705771050145, "grad_norm": 0.4813549393736916, "learning_rate": 1.0883245609639622e-05, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.07271705567836761, "step": 2540, "valid_targets_mean": 5694.1, "valid_targets_min": 4281 }, { "epoch": 4.811731315042573, "grad_norm": 0.48283752024336907, "learning_rate": 1.0799427206988588e-05, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.08985312283039093, "step": 2545, "valid_targets_mean": 6184.9, "valid_targets_min": 2244 }, { "epoch": 4.821192052980132, "grad_norm": 0.5092895093118036, "learning_rate": 1.0715813281038697e-05, "loss": 0.1671, "loss_nan_ranks": 0, "loss_rank_avg": 0.07882203161716461, "step": 2550, "valid_targets_mean": 5018.8, "valid_targets_min": 2927 }, { "epoch": 4.830652790917692, "grad_norm": 0.47902608616249853, "learning_rate": 1.0632405690054652e-05, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.07882026582956314, "step": 2555, "valid_targets_mean": 5350.1, "valid_targets_min": 2041 }, { "epoch": 4.840113528855251, "grad_norm": 0.4781631389195755, "learning_rate": 1.0549206287715524e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.07253912091255188, "step": 2560, "valid_targets_mean": 5826.4, "valid_targets_min": 4815 }, { "epoch": 4.84957426679281, "grad_norm": 0.50927564435645, "learning_rate": 1.0466216923073497e-05, "loss": 0.1729, "loss_nan_ranks": 0, "loss_rank_avg": 0.07280386984348297, "step": 2565, "valid_targets_mean": 4362.0, "valid_targets_min": 1897 }, { "epoch": 4.859035004730369, "grad_norm": 0.4990588524253479, "learning_rate": 1.0383439440512814e-05, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.0832209438085556, "step": 2570, "valid_targets_mean": 5917.6, "valid_targets_min": 2058 }, { "epoch": 4.868495742667928, "grad_norm": 0.5104279600936655, "learning_rate": 1.030087567970879e-05, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.10466784238815308, "step": 2575, "valid_targets_mean": 6902.9, "valid_targets_min": 4028 }, { "epoch": 4.877956480605487, "grad_norm": 0.49021362537296576, "learning_rate": 1.0218527475586902e-05, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.08758172392845154, "step": 2580, "valid_targets_mean": 5222.5, "valid_targets_min": 3552 }, { "epoch": 4.887417218543046, "grad_norm": 0.5214528334399346, "learning_rate": 1.013639665828201e-05, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.0988951027393341, "step": 2585, "valid_targets_mean": 5775.8, "valid_targets_min": 3433 }, { "epoch": 4.896877956480606, "grad_norm": 0.4992920444778697, "learning_rate": 1.0054485053097731e-05, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.08480118215084076, "step": 2590, "valid_targets_mean": 5527.4, "valid_targets_min": 3358 }, { "epoch": 4.906338694418165, "grad_norm": 0.5073995907257243, "learning_rate": 9.972794480465798e-06, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.08439338207244873, "step": 2595, "valid_targets_mean": 5569.0, "valid_targets_min": 3082 }, { "epoch": 4.9157994323557235, "grad_norm": 0.46526402755578683, "learning_rate": 9.891326755905652e-06, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.07682204246520996, "step": 2600, "valid_targets_mean": 5154.4, "valid_targets_min": 2569 }, { "epoch": 4.925260170293283, "grad_norm": 0.5207018903668406, "learning_rate": 9.8100836899841e-06, "loss": 0.153, "loss_nan_ranks": 0, "loss_rank_avg": 0.08420620113611221, "step": 2605, "valid_targets_mean": 5129.8, "valid_targets_min": 1379 }, { "epoch": 4.934720908230842, "grad_norm": 0.4284701079205504, "learning_rate": 9.729067088275025e-06, "loss": 0.1706, "loss_nan_ranks": 0, "loss_rank_avg": 0.07169349491596222, "step": 2610, "valid_targets_mean": 6409.8, "valid_targets_min": 5031 }, { "epoch": 4.944181646168401, "grad_norm": 0.4820116779766079, "learning_rate": 9.648278751319329e-06, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.08313654363155365, "step": 2615, "valid_targets_mean": 7001.9, "valid_targets_min": 3211 }, { "epoch": 4.95364238410596, "grad_norm": 0.455960966421983, "learning_rate": 9.56772047458485e-06, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.08207933604717255, "step": 2620, "valid_targets_mean": 6887.5, "valid_targets_min": 4307 }, { "epoch": 4.9631031220435196, "grad_norm": 0.49589408534775636, "learning_rate": 9.487394048426497e-06, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.06637847423553467, "step": 2625, "valid_targets_mean": 5183.2, "valid_targets_min": 2566 }, { "epoch": 4.972563859981078, "grad_norm": 0.48599414771340765, "learning_rate": 9.407301258046454e-06, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.09902942180633545, "step": 2630, "valid_targets_mean": 6159.5, "valid_targets_min": 3864 }, { "epoch": 4.982024597918637, "grad_norm": 0.5152781317137514, "learning_rate": 9.327443883454499e-06, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.07795896381139755, "step": 2635, "valid_targets_mean": 4861.8, "valid_targets_min": 1064 }, { "epoch": 4.991485335856197, "grad_norm": 0.5038511985913933, "learning_rate": 9.247823699428452e-06, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.09703533351421356, "step": 2640, "valid_targets_mean": 5297.1, "valid_targets_min": 1495 }, { "epoch": 5.001892147587512, "grad_norm": 0.7919432421674072, "learning_rate": 9.168442475474737e-06, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.07412499934434891, "step": 2645, "valid_targets_mean": 5746.4, "valid_targets_min": 1906 }, { "epoch": 5.011352885525071, "grad_norm": 0.47230625720793334, "learning_rate": 9.089301975789029e-06, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.07187912613153458, "step": 2650, "valid_targets_mean": 5863.1, "valid_targets_min": 1526 }, { "epoch": 5.02081362346263, "grad_norm": 0.4893299689425291, "learning_rate": 9.010403959217078e-06, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.07913671433925629, "step": 2655, "valid_targets_mean": 5488.1, "valid_targets_min": 2092 }, { "epoch": 5.030274361400189, "grad_norm": 0.6130415734002539, "learning_rate": 8.931750179215586e-06, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.07517177611589432, "step": 2660, "valid_targets_mean": 6251.6, "valid_targets_min": 4729 }, { "epoch": 5.039735099337748, "grad_norm": 0.49993267762896326, "learning_rate": 8.853342383813289e-06, "loss": 0.1693, "loss_nan_ranks": 0, "loss_rank_avg": 0.08262951672077179, "step": 2665, "valid_targets_mean": 6646.4, "valid_targets_min": 3061 }, { "epoch": 5.049195837275308, "grad_norm": 0.5096897089548484, "learning_rate": 8.775182315572044e-06, "loss": 0.1624, "loss_nan_ranks": 0, "loss_rank_avg": 0.07983925938606262, "step": 2670, "valid_targets_mean": 4711.5, "valid_targets_min": 1457 }, { "epoch": 5.058656575212867, "grad_norm": 0.5485108474130074, "learning_rate": 8.697271711548163e-06, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.08494468778371811, "step": 2675, "valid_targets_mean": 5836.0, "valid_targets_min": 2637 }, { "epoch": 5.068117313150426, "grad_norm": 0.5863734037093357, "learning_rate": 8.619612303253759e-06, "loss": 0.1708, "loss_nan_ranks": 0, "loss_rank_avg": 0.07812988758087158, "step": 2680, "valid_targets_mean": 5071.0, "valid_targets_min": 3161 }, { "epoch": 5.077578051087984, "grad_norm": 0.5169864922201843, "learning_rate": 8.54220581661829e-06, "loss": 0.166, "loss_nan_ranks": 0, "loss_rank_avg": 0.09739792346954346, "step": 2685, "valid_targets_mean": 5116.9, "valid_targets_min": 2506 }, { "epoch": 5.087038789025544, "grad_norm": 0.4924483330266412, "learning_rate": 8.465053971950188e-06, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.089106485247612, "step": 2690, "valid_targets_mean": 5403.6, "valid_targets_min": 3050 }, { "epoch": 5.096499526963103, "grad_norm": 0.4762786682998264, "learning_rate": 8.388158483898661e-06, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.07820412516593933, "step": 2695, "valid_targets_mean": 6105.2, "valid_targets_min": 1913 }, { "epoch": 5.105960264900662, "grad_norm": 0.5062357344918998, "learning_rate": 8.31152106141553e-06, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.09622031450271606, "step": 2700, "valid_targets_mean": 5775.8, "valid_targets_min": 2980 }, { "epoch": 5.115421002838222, "grad_norm": 0.5002871838224989, "learning_rate": 8.235143407717282e-06, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.0585002526640892, "step": 2705, "valid_targets_mean": 3764.5, "valid_targets_min": 1599 }, { "epoch": 5.1248817407757805, "grad_norm": 0.5250930353279408, "learning_rate": 8.159027220247238e-06, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.08297573029994965, "step": 2710, "valid_targets_mean": 6368.1, "valid_targets_min": 2296 }, { "epoch": 5.134342478713339, "grad_norm": 0.5007368663874092, "learning_rate": 8.083174190637766e-06, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.0794142335653305, "step": 2715, "valid_targets_mean": 4909.6, "valid_targets_min": 3604 }, { "epoch": 5.143803216650899, "grad_norm": 0.5230754061779214, "learning_rate": 8.00758600467276e-06, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.08960853517055511, "step": 2720, "valid_targets_mean": 5194.1, "valid_targets_min": 2815 }, { "epoch": 5.153263954588458, "grad_norm": 0.5064462916090743, "learning_rate": 7.932264342250112e-06, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.09582977741956711, "step": 2725, "valid_targets_mean": 5520.9, "valid_targets_min": 4252 }, { "epoch": 5.162724692526017, "grad_norm": 0.49932423593853265, "learning_rate": 7.857210877344405e-06, "loss": 0.1527, "loss_nan_ranks": 0, "loss_rank_avg": 0.0778404176235199, "step": 2730, "valid_targets_mean": 5829.5, "valid_targets_min": 2468 }, { "epoch": 5.172185430463577, "grad_norm": 0.5323844417559039, "learning_rate": 7.782427277969715e-06, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.0745185911655426, "step": 2735, "valid_targets_mean": 5312.0, "valid_targets_min": 3180 }, { "epoch": 5.1816461684011355, "grad_norm": 0.5557657439250057, "learning_rate": 7.707915206142536e-06, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.05902181565761566, "step": 2740, "valid_targets_mean": 5351.9, "valid_targets_min": 746 }, { "epoch": 5.191106906338694, "grad_norm": 0.5332886262361239, "learning_rate": 7.63367631784484e-06, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.07059160619974136, "step": 2745, "valid_targets_mean": 5607.6, "valid_targets_min": 3521 }, { "epoch": 5.200567644276253, "grad_norm": 0.5179154050055391, "learning_rate": 7.559712262987269e-06, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.070362389087677, "step": 2750, "valid_targets_mean": 5177.0, "valid_targets_min": 1471 }, { "epoch": 5.210028382213813, "grad_norm": 0.5265176493412506, "learning_rate": 7.486024685372468e-06, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.07411413639783859, "step": 2755, "valid_targets_mean": 6020.9, "valid_targets_min": 627 }, { "epoch": 5.219489120151372, "grad_norm": 0.554707229367045, "learning_rate": 7.412615222658566e-06, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.09033337235450745, "step": 2760, "valid_targets_mean": 4811.0, "valid_targets_min": 2461 }, { "epoch": 5.228949858088931, "grad_norm": 0.5515956673496363, "learning_rate": 7.339485506322755e-06, "loss": 0.168, "loss_nan_ranks": 0, "loss_rank_avg": 0.0772365927696228, "step": 2765, "valid_targets_mean": 5292.4, "valid_targets_min": 648 }, { "epoch": 5.23841059602649, "grad_norm": 0.47803954262560044, "learning_rate": 7.266637161625074e-06, "loss": 0.169, "loss_nan_ranks": 0, "loss_rank_avg": 0.09605518728494644, "step": 2770, "valid_targets_mean": 6811.4, "valid_targets_min": 4733 }, { "epoch": 5.247871333964049, "grad_norm": 0.5398489333939209, "learning_rate": 7.194071807572234e-06, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.0798153206706047, "step": 2775, "valid_targets_mean": 4869.1, "valid_targets_min": 1916 }, { "epoch": 5.257332071901608, "grad_norm": 0.511779870847518, "learning_rate": 7.121791056881688e-06, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.08416005969047546, "step": 2780, "valid_targets_mean": 5786.0, "valid_targets_min": 3360 }, { "epoch": 5.266792809839168, "grad_norm": 0.46117106595655755, "learning_rate": 7.049796515945748e-06, "loss": 0.1706, "loss_nan_ranks": 0, "loss_rank_avg": 0.08570249378681183, "step": 2785, "valid_targets_mean": 6217.8, "valid_targets_min": 3805 }, { "epoch": 5.276253547776727, "grad_norm": 0.48698826185764776, "learning_rate": 6.9780897847959005e-06, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.08505302667617798, "step": 2790, "valid_targets_mean": 6306.8, "valid_targets_min": 4518 }, { "epoch": 5.285714285714286, "grad_norm": 0.47067540750278847, "learning_rate": 6.906672457067272e-06, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.06407542526721954, "step": 2795, "valid_targets_mean": 4664.0, "valid_targets_min": 777 }, { "epoch": 5.2951750236518444, "grad_norm": 0.4814404184659197, "learning_rate": 6.835546119963159e-06, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.07698783278465271, "step": 2800, "valid_targets_mean": 5979.5, "valid_targets_min": 874 }, { "epoch": 5.304635761589404, "grad_norm": 0.4138254655184686, "learning_rate": 6.764712354219798e-06, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.06797531247138977, "step": 2805, "valid_targets_mean": 7091.4, "valid_targets_min": 5493 }, { "epoch": 5.314096499526963, "grad_norm": 0.5158181059013228, "learning_rate": 6.694172734071209e-06, "loss": 0.1734, "loss_nan_ranks": 0, "loss_rank_avg": 0.12109321355819702, "step": 2810, "valid_targets_mean": 6526.1, "valid_targets_min": 4415 }, { "epoch": 5.323557237464522, "grad_norm": 0.5116457962386629, "learning_rate": 6.623928827214234e-06, "loss": 0.1686, "loss_nan_ranks": 0, "loss_rank_avg": 0.08392614126205444, "step": 2815, "valid_targets_mean": 4956.9, "valid_targets_min": 1126 }, { "epoch": 5.333017975402082, "grad_norm": 0.4637640125901983, "learning_rate": 6.553982194773663e-06, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.06488104909658432, "step": 2820, "valid_targets_mean": 5014.0, "valid_targets_min": 1970 }, { "epoch": 5.3424787133396405, "grad_norm": 0.5489483258773076, "learning_rate": 6.4843343912675775e-06, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.07855500280857086, "step": 2825, "valid_targets_mean": 5010.8, "valid_targets_min": 3460 }, { "epoch": 5.351939451277199, "grad_norm": 0.5566628520939422, "learning_rate": 6.4149869645727604e-06, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.09175878018140793, "step": 2830, "valid_targets_mean": 5209.1, "valid_targets_min": 1971 }, { "epoch": 5.361400189214759, "grad_norm": 0.5194511420264721, "learning_rate": 6.34594145589033e-06, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.09560522437095642, "step": 2835, "valid_targets_mean": 5432.2, "valid_targets_min": 4445 }, { "epoch": 5.370860927152318, "grad_norm": 0.5297795083082508, "learning_rate": 6.277199399711462e-06, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.09491391479969025, "step": 2840, "valid_targets_mean": 5806.8, "valid_targets_min": 4124 }, { "epoch": 5.380321665089877, "grad_norm": 0.5019727889753064, "learning_rate": 6.208762323783317e-06, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.07884600758552551, "step": 2845, "valid_targets_mean": 5524.0, "valid_targets_min": 1902 }, { "epoch": 5.389782403027436, "grad_norm": 0.50283030126958, "learning_rate": 6.140631749075063e-06, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.08332569897174835, "step": 2850, "valid_targets_mean": 5927.8, "valid_targets_min": 4868 }, { "epoch": 5.3992431409649955, "grad_norm": 0.4809018227791537, "learning_rate": 6.0728091897440734e-06, "loss": 0.1614, "loss_nan_ranks": 0, "loss_rank_avg": 0.07353633642196655, "step": 2855, "valid_targets_mean": 5367.0, "valid_targets_min": 3740 }, { "epoch": 5.408703878902554, "grad_norm": 0.4864649688470974, "learning_rate": 6.005296153102285e-06, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.0782986655831337, "step": 2860, "valid_targets_mean": 5988.9, "valid_targets_min": 1588 }, { "epoch": 5.418164616840113, "grad_norm": 0.48061818782181764, "learning_rate": 5.9380941395826926e-06, "loss": 0.1616, "loss_nan_ranks": 0, "loss_rank_avg": 0.0813487246632576, "step": 2865, "valid_targets_mean": 5932.9, "valid_targets_min": 1655 }, { "epoch": 5.427625354777673, "grad_norm": 0.4924319395860947, "learning_rate": 5.871204642706006e-06, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.07597285509109497, "step": 2870, "valid_targets_mean": 5485.5, "valid_targets_min": 3119 }, { "epoch": 5.437086092715232, "grad_norm": 0.4985432480570909, "learning_rate": 5.8046291490474695e-06, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.08164849877357483, "step": 2875, "valid_targets_mean": 5445.2, "valid_targets_min": 4168 }, { "epoch": 5.446546830652791, "grad_norm": 0.48269318781366277, "learning_rate": 5.73836913820379e-06, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.07020534574985504, "step": 2880, "valid_targets_mean": 6313.1, "valid_targets_min": 4442 }, { "epoch": 5.45600756859035, "grad_norm": 0.49113593900775243, "learning_rate": 5.672426082760305e-06, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.07037980854511261, "step": 2885, "valid_targets_mean": 5693.4, "valid_targets_min": 4083 }, { "epoch": 5.465468306527909, "grad_norm": 0.5515240633580824, "learning_rate": 5.606801448258199e-06, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.08901975303888321, "step": 2890, "valid_targets_mean": 4930.4, "valid_targets_min": 2773 }, { "epoch": 5.474929044465468, "grad_norm": 0.4994868431495095, "learning_rate": 5.541496693161963e-06, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.08624856919050217, "step": 2895, "valid_targets_mean": 6319.2, "valid_targets_min": 3351 }, { "epoch": 5.484389782403028, "grad_norm": 0.47317427516488886, "learning_rate": 5.4765132688269975e-06, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.07870611548423767, "step": 2900, "valid_targets_mean": 6180.1, "valid_targets_min": 3064 }, { "epoch": 5.493850520340587, "grad_norm": 0.5117713572156433, "learning_rate": 5.411852619467319e-06, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.0791124477982521, "step": 2905, "valid_targets_mean": 5138.5, "valid_targets_min": 1201 }, { "epoch": 5.503311258278146, "grad_norm": 0.44743979186538946, "learning_rate": 5.347516182123482e-06, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.08641517162322998, "step": 2910, "valid_targets_mean": 6519.6, "valid_targets_min": 2545 }, { "epoch": 5.5127719962157045, "grad_norm": 0.5598404931767829, "learning_rate": 5.283505386630656e-06, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.09298183023929596, "step": 2915, "valid_targets_mean": 5395.4, "valid_targets_min": 3680 }, { "epoch": 5.522232734153264, "grad_norm": 0.46606600596730763, "learning_rate": 5.219821655586821e-06, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.08851338177919388, "step": 2920, "valid_targets_mean": 6989.0, "valid_targets_min": 3815 }, { "epoch": 5.531693472090823, "grad_norm": 0.4685726242174628, "learning_rate": 5.156466404321159e-06, "loss": 0.1624, "loss_nan_ranks": 0, "loss_rank_avg": 0.09037988632917404, "step": 2925, "valid_targets_mean": 6915.8, "valid_targets_min": 1670 }, { "epoch": 5.541154210028382, "grad_norm": 0.5160408959477768, "learning_rate": 5.0934410408626235e-06, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.08055752515792847, "step": 2930, "valid_targets_mean": 5192.4, "valid_targets_min": 3354 }, { "epoch": 5.550614947965942, "grad_norm": 0.5746904433215911, "learning_rate": 5.030746965908613e-06, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.10669153928756714, "step": 2935, "valid_targets_mean": 5440.9, "valid_targets_min": 2202 }, { "epoch": 5.5600756859035005, "grad_norm": 0.45883493673475956, "learning_rate": 4.968385572793859e-06, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.05654348433017731, "step": 2940, "valid_targets_mean": 4961.6, "valid_targets_min": 2024 }, { "epoch": 5.569536423841059, "grad_norm": 0.4993450808594117, "learning_rate": 4.906358247459451e-06, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.068525031208992, "step": 2945, "valid_targets_mean": 4959.1, "valid_targets_min": 1511 }, { "epoch": 5.578997161778618, "grad_norm": 0.5382032760412773, "learning_rate": 4.844666368422055e-06, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.0909319519996643, "step": 2950, "valid_targets_mean": 5311.0, "valid_targets_min": 770 }, { "epoch": 5.588457899716178, "grad_norm": 0.5525554928211415, "learning_rate": 4.783311306743259e-06, "loss": 0.1687, "loss_nan_ranks": 0, "loss_rank_avg": 0.08873642981052399, "step": 2955, "valid_targets_mean": 5606.0, "valid_targets_min": 1685 }, { "epoch": 5.597918637653737, "grad_norm": 0.461910556182754, "learning_rate": 4.722294425999099e-06, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.09890357404947281, "step": 2960, "valid_targets_mean": 7342.2, "valid_targets_min": 3229 }, { "epoch": 5.607379375591296, "grad_norm": 0.4464092110112635, "learning_rate": 4.661617082249765e-06, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.07442782819271088, "step": 2965, "valid_targets_mean": 6529.2, "valid_targets_min": 3249 }, { "epoch": 5.6168401135288555, "grad_norm": 0.49577901930229196, "learning_rate": 4.601280624009459e-06, "loss": 0.1645, "loss_nan_ranks": 0, "loss_rank_avg": 0.08115290105342865, "step": 2970, "valid_targets_mean": 5643.5, "valid_targets_min": 4384 }, { "epoch": 5.626300851466414, "grad_norm": 0.46421865938624207, "learning_rate": 4.541286392216419e-06, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.06690236926078796, "step": 2975, "valid_targets_mean": 5475.8, "valid_targets_min": 3336 }, { "epoch": 5.635761589403973, "grad_norm": 0.47388885299577094, "learning_rate": 4.481635720203139e-06, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.08113521337509155, "step": 2980, "valid_targets_mean": 5951.1, "valid_targets_min": 4602 }, { "epoch": 5.645222327341533, "grad_norm": 0.48953790334528496, "learning_rate": 4.4223299336667226e-06, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.06641364097595215, "step": 2985, "valid_targets_mean": 5389.5, "valid_targets_min": 2234 }, { "epoch": 5.654683065279092, "grad_norm": 0.7042938717688352, "learning_rate": 4.363370350639405e-06, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.08492471277713776, "step": 2990, "valid_targets_mean": 5449.6, "valid_targets_min": 3031 }, { "epoch": 5.664143803216651, "grad_norm": 0.9121963480606142, "learning_rate": 4.304758281459283e-06, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.07324929535388947, "step": 2995, "valid_targets_mean": 4495.8, "valid_targets_min": 1353 }, { "epoch": 5.67360454115421, "grad_norm": 0.4938793058364134, "learning_rate": 4.24649502874118e-06, "loss": 0.1715, "loss_nan_ranks": 0, "loss_rank_avg": 0.08978196978569031, "step": 3000, "valid_targets_mean": 5755.1, "valid_targets_min": 3092 }, { "epoch": 5.683065279091769, "grad_norm": 0.4581010846815238, "learning_rate": 4.1885818873477156e-06, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.07784257084131241, "step": 3005, "valid_targets_mean": 5838.5, "valid_targets_min": 4027 }, { "epoch": 5.692526017029328, "grad_norm": 0.5339513481968639, "learning_rate": 4.131020144360505e-06, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.0724765881896019, "step": 3010, "valid_targets_mean": 4792.6, "valid_targets_min": 835 }, { "epoch": 5.701986754966887, "grad_norm": 0.4657301423666137, "learning_rate": 4.073811079051557e-06, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.06874331831932068, "step": 3015, "valid_targets_mean": 5342.6, "valid_targets_min": 2502 }, { "epoch": 5.711447492904447, "grad_norm": 0.5175010346747354, "learning_rate": 4.016955962854874e-06, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.07748369872570038, "step": 3020, "valid_targets_mean": 5557.0, "valid_targets_min": 2561 }, { "epoch": 5.720908230842006, "grad_norm": 0.46047001239287016, "learning_rate": 3.9604560593381444e-06, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.07033313065767288, "step": 3025, "valid_targets_mean": 6183.8, "valid_targets_min": 3650 }, { "epoch": 5.7303689687795645, "grad_norm": 0.5039104334017726, "learning_rate": 3.9043126241747e-06, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.08076108247041702, "step": 3030, "valid_targets_mean": 5565.2, "valid_targets_min": 1265 }, { "epoch": 5.739829706717124, "grad_norm": 0.4333442468065866, "learning_rate": 3.8485269051156015e-06, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.06987737119197845, "step": 3035, "valid_targets_mean": 6822.2, "valid_targets_min": 1650 }, { "epoch": 5.749290444654683, "grad_norm": 0.4382347126402435, "learning_rate": 3.7931001419618963e-06, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.07224809378385544, "step": 3040, "valid_targets_mean": 6522.6, "valid_targets_min": 3391 }, { "epoch": 5.758751182592242, "grad_norm": 0.5135189211645638, "learning_rate": 3.7380335665370693e-06, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.0703924223780632, "step": 3045, "valid_targets_mean": 4980.6, "valid_targets_min": 1296 }, { "epoch": 5.768211920529802, "grad_norm": 0.4884310150604858, "learning_rate": 3.6833284026596827e-06, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.07352404296398163, "step": 3050, "valid_targets_mean": 5628.5, "valid_targets_min": 1475 }, { "epoch": 5.7776726584673606, "grad_norm": 0.46184445778343136, "learning_rate": 3.6289858661161435e-06, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.07652977108955383, "step": 3055, "valid_targets_mean": 5814.8, "valid_targets_min": 3954 }, { "epoch": 5.787133396404919, "grad_norm": 0.4579796667457961, "learning_rate": 3.5750071646337283e-06, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.07104137539863586, "step": 3060, "valid_targets_mean": 6471.2, "valid_targets_min": 3462 }, { "epoch": 5.796594134342479, "grad_norm": 0.4537041582090879, "learning_rate": 3.5213934978537002e-06, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.08454744517803192, "step": 3065, "valid_targets_mean": 5621.0, "valid_targets_min": 4099 }, { "epoch": 5.806054872280038, "grad_norm": 0.5257566347643703, "learning_rate": 3.4681460573046667e-06, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.08486692607402802, "step": 3070, "valid_targets_mean": 4147.2, "valid_targets_min": 1579 }, { "epoch": 5.815515610217597, "grad_norm": 0.4551568372177165, "learning_rate": 3.415266026376105e-06, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.06996514648199081, "step": 3075, "valid_targets_mean": 6100.4, "valid_targets_min": 3362 }, { "epoch": 5.824976348155156, "grad_norm": 0.5279020357535302, "learning_rate": 3.3627545802920402e-06, "loss": 0.1682, "loss_nan_ranks": 0, "loss_rank_avg": 0.06808288395404816, "step": 3080, "valid_targets_mean": 6382.6, "valid_targets_min": 1899 }, { "epoch": 5.8344370860927155, "grad_norm": 0.509574069681122, "learning_rate": 3.310612886084961e-06, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.07354620844125748, "step": 3085, "valid_targets_mean": 4710.0, "valid_targets_min": 1412 }, { "epoch": 5.843897824030274, "grad_norm": 0.5099345034078288, "learning_rate": 3.2588421025698525e-06, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.07914125919342041, "step": 3090, "valid_targets_mean": 5402.9, "valid_targets_min": 771 }, { "epoch": 5.853358561967833, "grad_norm": 0.4921920783781287, "learning_rate": 3.207443380318449e-06, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.0780281201004982, "step": 3095, "valid_targets_mean": 5046.9, "valid_targets_min": 2910 }, { "epoch": 5.862819299905393, "grad_norm": 0.5076451745790288, "learning_rate": 3.1564178616336737e-06, "loss": 0.1682, "loss_nan_ranks": 0, "loss_rank_avg": 0.08828535676002502, "step": 3100, "valid_targets_mean": 6130.9, "valid_targets_min": 4471 }, { "epoch": 5.872280037842952, "grad_norm": 0.4724679364763835, "learning_rate": 3.1057666805242336e-06, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.08091306686401367, "step": 3105, "valid_targets_mean": 6078.6, "valid_targets_min": 1741 }, { "epoch": 5.881740775780511, "grad_norm": 0.4996674681366472, "learning_rate": 3.055490962679448e-06, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.07268786430358887, "step": 3110, "valid_targets_mean": 5243.2, "valid_targets_min": 817 }, { "epoch": 5.8912015137180695, "grad_norm": 0.5291137259397091, "learning_rate": 3.005591825444194e-06, "loss": 0.1725, "loss_nan_ranks": 0, "loss_rank_avg": 0.08995255827903748, "step": 3115, "valid_targets_mean": 5615.5, "valid_targets_min": 2952 }, { "epoch": 5.900662251655629, "grad_norm": 0.535236288933447, "learning_rate": 2.956070377794096e-06, "loss": 0.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.08721289783716202, "step": 3120, "valid_targets_mean": 5925.4, "valid_targets_min": 3090 }, { "epoch": 5.910122989593188, "grad_norm": 0.5685850842714396, "learning_rate": 2.906927720310884e-06, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.09268994629383087, "step": 3125, "valid_targets_mean": 5151.6, "valid_targets_min": 2762 }, { "epoch": 5.919583727530747, "grad_norm": 0.5012001406123452, "learning_rate": 2.8581649451579083e-06, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.07973651587963104, "step": 3130, "valid_targets_mean": 5932.1, "valid_targets_min": 3486 }, { "epoch": 5.929044465468307, "grad_norm": 0.5152900354765085, "learning_rate": 2.809783136055895e-06, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.0881601944565773, "step": 3135, "valid_targets_mean": 5902.5, "valid_targets_min": 2004 }, { "epoch": 5.938505203405866, "grad_norm": 0.6871324672441096, "learning_rate": 2.761783368258852e-06, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.08433617651462555, "step": 3140, "valid_targets_mean": 6727.5, "valid_targets_min": 4594 }, { "epoch": 5.9479659413434245, "grad_norm": 0.522395677503641, "learning_rate": 2.7141667085301593e-06, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.06753349304199219, "step": 3145, "valid_targets_mean": 4657.8, "valid_targets_min": 1787 }, { "epoch": 5.957426679280984, "grad_norm": 0.49161260461585427, "learning_rate": 2.6669342151188704e-06, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.08413293957710266, "step": 3150, "valid_targets_mean": 6002.9, "valid_targets_min": 3061 }, { "epoch": 5.966887417218543, "grad_norm": 0.5461851756628411, "learning_rate": 2.62008693773621e-06, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.08240652084350586, "step": 3155, "valid_targets_mean": 5138.6, "valid_targets_min": 2077 }, { "epoch": 5.976348155156102, "grad_norm": 0.5821132136646191, "learning_rate": 2.573625917532212e-06, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.07987844944000244, "step": 3160, "valid_targets_mean": 5757.9, "valid_targets_min": 3017 }, { "epoch": 5.985808893093662, "grad_norm": 0.47968943718028695, "learning_rate": 2.5275521870726107e-06, "loss": 0.1642, "loss_nan_ranks": 0, "loss_rank_avg": 0.08667580038309097, "step": 3165, "valid_targets_mean": 5866.8, "valid_targets_min": 4790 }, { "epoch": 5.995269631031221, "grad_norm": 0.4965790737728136, "learning_rate": 2.481866770315866e-06, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.08443500101566315, "step": 3170, "valid_targets_mean": 5814.4, "valid_targets_min": 4152 }, { "epoch": 6.0037842951750235, "grad_norm": 0.584119229089462, "learning_rate": 2.4365706825904335e-06, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.0846308022737503, "step": 3175, "valid_targets_mean": 5266.2, "valid_targets_min": 4242 }, { "epoch": 6.013245033112582, "grad_norm": 0.5318032612027898, "learning_rate": 2.391664930572175e-06, "loss": 0.1588, "loss_nan_ranks": 0, "loss_rank_avg": 0.07814428210258484, "step": 3180, "valid_targets_mean": 5013.9, "valid_targets_min": 850 }, { "epoch": 6.022705771050142, "grad_norm": 0.5144448514440982, "learning_rate": 2.347150512262002e-06, "loss": 0.158, "loss_nan_ranks": 0, "loss_rank_avg": 0.07846082746982574, "step": 3185, "valid_targets_mean": 5425.6, "valid_targets_min": 2247 }, { "epoch": 6.032166508987701, "grad_norm": 0.4646205864187392, "learning_rate": 2.303028416963693e-06, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.07777369767427444, "step": 3190, "valid_targets_mean": 5879.8, "valid_targets_min": 1877 }, { "epoch": 6.04162724692526, "grad_norm": 0.47396458926137663, "learning_rate": 2.259299625261906e-06, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.0792025625705719, "step": 3195, "valid_targets_mean": 6722.5, "valid_targets_min": 1546 }, { "epoch": 6.05108798486282, "grad_norm": 0.45843753096435663, "learning_rate": 2.2159651090003774e-06, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.06743055582046509, "step": 3200, "valid_targets_mean": 5288.9, "valid_targets_min": 1868 }, { "epoch": 6.0605487228003785, "grad_norm": 0.4553963970008123, "learning_rate": 2.173025831260336e-06, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.0739666223526001, "step": 3205, "valid_targets_mean": 6655.4, "valid_targets_min": 5252 }, { "epoch": 6.070009460737937, "grad_norm": 0.49731449399968497, "learning_rate": 2.1304827463390843e-06, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.07816332578659058, "step": 3210, "valid_targets_mean": 6025.1, "valid_targets_min": 3547 }, { "epoch": 6.079470198675497, "grad_norm": 0.4889765047812308, "learning_rate": 2.088336799728814e-06, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.0794171690940857, "step": 3215, "valid_targets_mean": 6134.9, "valid_targets_min": 4135 }, { "epoch": 6.088930936613056, "grad_norm": 0.47878941127207625, "learning_rate": 2.046588928095563e-06, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.07988835871219635, "step": 3220, "valid_targets_mean": 5659.5, "valid_targets_min": 4115 }, { "epoch": 6.098391674550615, "grad_norm": 0.4997195025958504, "learning_rate": 2.005240059258431e-06, "loss": 0.1472, "loss_nan_ranks": 0, "loss_rank_avg": 0.0862731784582138, "step": 3225, "valid_targets_mean": 5721.6, "valid_targets_min": 2052 }, { "epoch": 6.107852412488174, "grad_norm": 0.5692060263245817, "learning_rate": 1.9642911121689233e-06, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.07118255645036697, "step": 3230, "valid_targets_mean": 3830.5, "valid_targets_min": 699 }, { "epoch": 6.117313150425733, "grad_norm": 0.5686969457407623, "learning_rate": 1.9237429968905586e-06, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.06574267148971558, "step": 3235, "valid_targets_mean": 3772.6, "valid_targets_min": 2061 }, { "epoch": 6.126773888363292, "grad_norm": 0.49763597561095985, "learning_rate": 1.8835966145786222e-06, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.08373168855905533, "step": 3240, "valid_targets_mean": 6183.5, "valid_targets_min": 2730 }, { "epoch": 6.136234626300851, "grad_norm": 0.4887902369131846, "learning_rate": 1.84385285746016e-06, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.08439414203166962, "step": 3245, "valid_targets_mean": 5588.5, "valid_targets_min": 3357 }, { "epoch": 6.145695364238411, "grad_norm": 0.4985086513937735, "learning_rate": 1.8045126088141262e-06, "loss": 0.1454, "loss_nan_ranks": 0, "loss_rank_avg": 0.07852502912282944, "step": 3250, "valid_targets_mean": 5644.4, "valid_targets_min": 3873 }, { "epoch": 6.15515610217597, "grad_norm": 0.533162317600248, "learning_rate": 1.7655767429517645e-06, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.08291523158550262, "step": 3255, "valid_targets_mean": 5257.0, "valid_targets_min": 1362 }, { "epoch": 6.164616840113529, "grad_norm": 0.8163603542581688, "learning_rate": 1.727046125197185e-06, "loss": 0.1725, "loss_nan_ranks": 0, "loss_rank_avg": 0.11358313262462616, "step": 3260, "valid_targets_mean": 5585.5, "valid_targets_min": 3323 }, { "epoch": 6.174077578051088, "grad_norm": 0.5275817332491582, "learning_rate": 1.6889216118681107e-06, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.07413968443870544, "step": 3265, "valid_targets_mean": 5179.8, "valid_targets_min": 1578 }, { "epoch": 6.183538315988647, "grad_norm": 0.47663914651303735, "learning_rate": 1.6512040502568761e-06, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.0781627744436264, "step": 3270, "valid_targets_mean": 6326.0, "valid_targets_min": 2718 }, { "epoch": 6.192999053926206, "grad_norm": 0.5198414647863658, "learning_rate": 1.6138942786115653e-06, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.08433681726455688, "step": 3275, "valid_targets_mean": 5501.0, "valid_targets_min": 1788 }, { "epoch": 6.202459791863765, "grad_norm": 0.6408667201086448, "learning_rate": 1.5769931261174055e-06, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.08084458112716675, "step": 3280, "valid_targets_mean": 6616.8, "valid_targets_min": 1689 }, { "epoch": 6.211920529801325, "grad_norm": 0.4944308322849977, "learning_rate": 1.5405014128783236e-06, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.08102227747440338, "step": 3285, "valid_targets_mean": 5647.5, "valid_targets_min": 2694 }, { "epoch": 6.221381267738884, "grad_norm": 0.48233444172077344, "learning_rate": 1.5044199498987456e-06, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.0742645263671875, "step": 3290, "valid_targets_mean": 5459.2, "valid_targets_min": 2468 }, { "epoch": 6.230842005676442, "grad_norm": 0.5321614423819155, "learning_rate": 1.4687495390655282e-06, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.07728166878223419, "step": 3295, "valid_targets_mean": 4666.1, "valid_targets_min": 2232 }, { "epoch": 6.240302743614002, "grad_norm": 0.45554443433516056, "learning_rate": 1.4334909731301893e-06, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.07903093844652176, "step": 3300, "valid_targets_mean": 6301.2, "valid_targets_min": 2023 }, { "epoch": 6.249763481551561, "grad_norm": 0.4369901640686527, "learning_rate": 1.398645035691244e-06, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.07268842309713364, "step": 3305, "valid_targets_mean": 6521.2, "valid_targets_min": 4385 }, { "epoch": 6.25922421948912, "grad_norm": 0.5144149069493703, "learning_rate": 1.3642125011768204e-06, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.0853855162858963, "step": 3310, "valid_targets_mean": 4916.5, "valid_targets_min": 1306 }, { "epoch": 6.26868495742668, "grad_norm": 0.4662790470481307, "learning_rate": 1.3301941348274316e-06, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.06581012159585953, "step": 3315, "valid_targets_mean": 5482.5, "valid_targets_min": 3959 }, { "epoch": 6.2781456953642385, "grad_norm": 0.543005624322293, "learning_rate": 1.2965906926789807e-06, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.08316712081432343, "step": 3320, "valid_targets_mean": 5355.4, "valid_targets_min": 3827 }, { "epoch": 6.287606433301797, "grad_norm": 0.4642963328041462, "learning_rate": 1.2634029215459442e-06, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.07344529032707214, "step": 3325, "valid_targets_mean": 6743.8, "valid_targets_min": 3629 }, { "epoch": 6.297067171239357, "grad_norm": 0.4729718094257136, "learning_rate": 1.2306315590047912e-06, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.08172772079706192, "step": 3330, "valid_targets_mean": 6132.5, "valid_targets_min": 3527 }, { "epoch": 6.306527909176916, "grad_norm": 0.47615121755084255, "learning_rate": 1.1982773333775822e-06, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.06997595727443695, "step": 3335, "valid_targets_mean": 6265.9, "valid_targets_min": 3729 }, { "epoch": 6.315988647114475, "grad_norm": 0.49720672723911824, "learning_rate": 1.1663409637157685e-06, "loss": 0.1719, "loss_nan_ranks": 0, "loss_rank_avg": 0.08522418141365051, "step": 3340, "valid_targets_mean": 6098.0, "valid_targets_min": 1787 }, { "epoch": 6.325449385052034, "grad_norm": 0.5893163672320445, "learning_rate": 1.1348231597842508e-06, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.07012220472097397, "step": 3345, "valid_targets_mean": 5598.1, "valid_targets_min": 3357 }, { "epoch": 6.334910122989593, "grad_norm": 0.5056344429691663, "learning_rate": 1.1037246220455611e-06, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.07550933957099915, "step": 3350, "valid_targets_mean": 5193.8, "valid_targets_min": 3603 }, { "epoch": 6.344370860927152, "grad_norm": 0.49788948816850587, "learning_rate": 1.0730460416443233e-06, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.07792874425649643, "step": 3355, "valid_targets_mean": 5297.8, "valid_targets_min": 1526 }, { "epoch": 6.353831598864711, "grad_norm": 0.47295359132021303, "learning_rate": 1.0427881003918783e-06, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.06006645783782005, "step": 3360, "valid_targets_mean": 5776.5, "valid_targets_min": 1930 }, { "epoch": 6.363292336802271, "grad_norm": 0.5180446573609132, "learning_rate": 1.012951470751149e-06, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.06573215126991272, "step": 3365, "valid_targets_mean": 4157.4, "valid_targets_min": 1603 }, { "epoch": 6.37275307473983, "grad_norm": 0.5142987786973194, "learning_rate": 9.835368158216707e-07, "loss": 0.1567, "loss_nan_ranks": 0, "loss_rank_avg": 0.0875168964266777, "step": 3370, "valid_targets_mean": 5995.5, "valid_targets_min": 3569 }, { "epoch": 6.382213812677389, "grad_norm": 0.549315279583512, "learning_rate": 9.545447893248827e-07, "loss": 0.1581, "loss_nan_ranks": 0, "loss_rank_avg": 0.08440011739730835, "step": 3375, "valid_targets_mean": 5372.4, "valid_targets_min": 1524 }, { "epoch": 6.391674550614948, "grad_norm": 0.4975303100993707, "learning_rate": 9.259760355895664e-07, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.08323267102241516, "step": 3380, "valid_targets_mean": 5243.5, "valid_targets_min": 3619 }, { "epoch": 6.401135288552507, "grad_norm": 0.44933429326711627, "learning_rate": 8.978311895375569e-07, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.06366902589797974, "step": 3385, "valid_targets_mean": 5606.0, "valid_targets_min": 771 }, { "epoch": 6.410596026490066, "grad_norm": 0.5244538230451249, "learning_rate": 8.701108766696098e-07, "loss": 0.1617, "loss_nan_ranks": 0, "loss_rank_avg": 0.08314728736877441, "step": 3390, "valid_targets_mean": 5397.2, "valid_targets_min": 976 }, { "epoch": 6.420056764427625, "grad_norm": 0.5321046922657727, "learning_rate": 8.428157130515169e-07, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.07390115410089493, "step": 3395, "valid_targets_mean": 4900.6, "valid_targets_min": 2668 }, { "epoch": 6.429517502365185, "grad_norm": 0.4997987625144715, "learning_rate": 8.159463053004058e-07, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.07713502645492554, "step": 3400, "valid_targets_mean": 5670.5, "valid_targets_min": 3714 }, { "epoch": 6.438978240302744, "grad_norm": 0.4783857613174314, "learning_rate": 7.89503250571253e-07, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.07338370382785797, "step": 3405, "valid_targets_mean": 6021.6, "valid_targets_min": 4140 }, { "epoch": 6.448438978240302, "grad_norm": 0.5084014116990427, "learning_rate": 7.634871365436192e-07, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.08246712386608124, "step": 3410, "valid_targets_mean": 6041.9, "valid_targets_min": 4465 }, { "epoch": 6.457899716177862, "grad_norm": 0.5069553293411639, "learning_rate": 7.378985414085949e-07, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.07229432463645935, "step": 3415, "valid_targets_mean": 5251.4, "valid_targets_min": 4371 }, { "epoch": 6.467360454115421, "grad_norm": 0.5195346482191306, "learning_rate": 7.127380338559331e-07, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.08095690608024597, "step": 3420, "valid_targets_mean": 5833.1, "valid_targets_min": 2788 }, { "epoch": 6.47682119205298, "grad_norm": 0.44961617162875356, "learning_rate": 6.880061730614307e-07, "loss": 0.1556, "loss_nan_ranks": 0, "loss_rank_avg": 0.06503139436244965, "step": 3425, "valid_targets_mean": 5194.5, "valid_targets_min": 2034 }, { "epoch": 6.48628192999054, "grad_norm": 0.512212152514479, "learning_rate": 6.637035086744825e-07, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.08502800762653351, "step": 3430, "valid_targets_mean": 6129.9, "valid_targets_min": 3237 }, { "epoch": 6.4957426679280985, "grad_norm": 0.533866271670798, "learning_rate": 6.398305808058869e-07, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.080892413854599, "step": 3435, "valid_targets_mean": 5465.8, "valid_targets_min": 802 }, { "epoch": 6.505203405865657, "grad_norm": 0.4821294366129078, "learning_rate": 6.163879200158151e-07, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.0807921439409256, "step": 3440, "valid_targets_mean": 6166.4, "valid_targets_min": 1645 }, { "epoch": 6.514664143803216, "grad_norm": 0.47581791967584, "learning_rate": 5.933760473020411e-07, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.08440031111240387, "step": 3445, "valid_targets_mean": 7176.6, "valid_targets_min": 2313 }, { "epoch": 6.524124881740776, "grad_norm": 0.49665456440010425, "learning_rate": 5.707954740883592e-07, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.07877863943576813, "step": 3450, "valid_targets_mean": 6034.4, "valid_targets_min": 4409 }, { "epoch": 6.533585619678335, "grad_norm": 0.46914359671651773, "learning_rate": 5.486467022132114e-07, "loss": 0.1462, "loss_nan_ranks": 0, "loss_rank_avg": 0.07220163941383362, "step": 3455, "valid_targets_mean": 5201.1, "valid_targets_min": 3269 }, { "epoch": 6.543046357615894, "grad_norm": 0.4999247739317717, "learning_rate": 5.269302239185359e-07, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.06515920162200928, "step": 3460, "valid_targets_mean": 4510.6, "valid_targets_min": 2249 }, { "epoch": 6.5525070955534535, "grad_norm": 0.49427440693924146, "learning_rate": 5.056465218388363e-07, "loss": 0.153, "loss_nan_ranks": 0, "loss_rank_avg": 0.07092322409152985, "step": 3465, "valid_targets_mean": 5033.9, "valid_targets_min": 1748 }, { "epoch": 6.561967833491012, "grad_norm": 0.693524396791674, "learning_rate": 4.847960689904385e-07, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.06443572044372559, "step": 3470, "valid_targets_mean": 5021.1, "valid_targets_min": 2541 }, { "epoch": 6.571428571428571, "grad_norm": 0.4652753136072147, "learning_rate": 4.6437932876099767e-07, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.07002725452184677, "step": 3475, "valid_targets_mean": 5402.4, "valid_targets_min": 1915 }, { "epoch": 6.580889309366131, "grad_norm": 0.46451032890247035, "learning_rate": 4.443967548991857e-07, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.07609806954860687, "step": 3480, "valid_targets_mean": 6261.8, "valid_targets_min": 1548 }, { "epoch": 6.59035004730369, "grad_norm": 0.4742091398940524, "learning_rate": 4.2484879150461067e-07, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.07329309731721878, "step": 3485, "valid_targets_mean": 5271.6, "valid_targets_min": 4216 }, { "epoch": 6.599810785241249, "grad_norm": 0.4912655014563391, "learning_rate": 4.0573587301794947e-07, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.08175991475582123, "step": 3490, "valid_targets_mean": 5803.6, "valid_targets_min": 3450 }, { "epoch": 6.609271523178808, "grad_norm": 0.47411330765123344, "learning_rate": 3.870584242112885e-07, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.08022162318229675, "step": 3495, "valid_targets_mean": 6148.5, "valid_targets_min": 1108 }, { "epoch": 6.618732261116367, "grad_norm": 0.5467862296497042, "learning_rate": 3.688168601786912e-07, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.08909142762422562, "step": 3500, "valid_targets_mean": 5511.9, "valid_targets_min": 2056 }, { "epoch": 6.628192999053926, "grad_norm": 0.4811284532821337, "learning_rate": 3.5101158632696584e-07, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.0686873197555542, "step": 3505, "valid_targets_mean": 5850.6, "valid_targets_min": 3425 }, { "epoch": 6.637653736991485, "grad_norm": 0.4764682488197729, "learning_rate": 3.336429983666545e-07, "loss": 0.159, "loss_nan_ranks": 0, "loss_rank_avg": 0.08067235350608826, "step": 3510, "valid_targets_mean": 6091.9, "valid_targets_min": 3877 }, { "epoch": 6.647114474929045, "grad_norm": 0.4894456490714887, "learning_rate": 3.1671148230324246e-07, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.07609429210424423, "step": 3515, "valid_targets_mean": 6449.8, "valid_targets_min": 3351 }, { "epoch": 6.656575212866604, "grad_norm": 0.5064247856959551, "learning_rate": 3.0021741442857634e-07, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.07491397857666016, "step": 3520, "valid_targets_mean": 5559.9, "valid_targets_min": 3138 }, { "epoch": 6.6660359508041624, "grad_norm": 0.5105415474802601, "learning_rate": 2.8416116131250836e-07, "loss": 0.1643, "loss_nan_ranks": 0, "loss_rank_avg": 0.06692364066839218, "step": 3525, "valid_targets_mean": 5484.8, "valid_targets_min": 2488 }, { "epoch": 6.675496688741722, "grad_norm": 0.5083849374762096, "learning_rate": 2.6854307979474306e-07, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.08597913384437561, "step": 3530, "valid_targets_mean": 6459.1, "valid_targets_min": 767 }, { "epoch": 6.684957426679281, "grad_norm": 0.4342549973357616, "learning_rate": 2.5336351697690553e-07, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.0754256471991539, "step": 3535, "valid_targets_mean": 5868.1, "valid_targets_min": 3233 }, { "epoch": 6.69441816461684, "grad_norm": 0.5062031786978933, "learning_rate": 2.386228102148347e-07, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.07034958899021149, "step": 3540, "valid_targets_mean": 5718.9, "valid_targets_min": 2398 }, { "epoch": 6.703878902554399, "grad_norm": 0.500948493630646, "learning_rate": 2.2432128711107558e-07, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.07873102277517319, "step": 3545, "valid_targets_mean": 6648.0, "valid_targets_min": 4973 }, { "epoch": 6.7133396404919585, "grad_norm": 0.45111358239646104, "learning_rate": 2.1045926550760988e-07, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.07121957838535309, "step": 3550, "valid_targets_mean": 5770.5, "valid_targets_min": 3291 }, { "epoch": 6.722800378429517, "grad_norm": 0.46097603655795455, "learning_rate": 1.9703705347878355e-07, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.06768956780433655, "step": 3555, "valid_targets_mean": 5942.2, "valid_targets_min": 3064 }, { "epoch": 6.732261116367076, "grad_norm": 0.4964329737190062, "learning_rate": 1.8405494932446366e-07, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.06672897189855576, "step": 3560, "valid_targets_mean": 5239.6, "valid_targets_min": 1596 }, { "epoch": 6.741721854304636, "grad_norm": 0.5504838449968519, "learning_rate": 1.7151324156340355e-07, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.07267464697360992, "step": 3565, "valid_targets_mean": 4650.8, "valid_targets_min": 2054 }, { "epoch": 6.751182592242195, "grad_norm": 0.5237161400407134, "learning_rate": 1.5941220892684572e-07, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.08781194686889648, "step": 3570, "valid_targets_mean": 6332.1, "valid_targets_min": 4998 }, { "epoch": 6.760643330179754, "grad_norm": 0.5490099004104453, "learning_rate": 1.4775212035230691e-07, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.08914782106876373, "step": 3575, "valid_targets_mean": 4676.5, "valid_targets_min": 746 }, { "epoch": 6.7701040681173135, "grad_norm": 0.4995209315574402, "learning_rate": 1.3653323497761607e-07, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.06628039479255676, "step": 3580, "valid_targets_mean": 5913.0, "valid_targets_min": 3502 }, { "epoch": 6.779564806054872, "grad_norm": 0.513748933958977, "learning_rate": 1.2575580213514792e-07, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.08485302329063416, "step": 3585, "valid_targets_mean": 6715.2, "valid_targets_min": 2699 }, { "epoch": 6.789025543992431, "grad_norm": 0.5698785487991007, "learning_rate": 1.1542006134628747e-07, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.09485235810279846, "step": 3590, "valid_targets_mean": 5735.1, "valid_targets_min": 1654 }, { "epoch": 6.798486281929991, "grad_norm": 0.502423517172928, "learning_rate": 1.0552624231609632e-07, "loss": 0.1528, "loss_nan_ranks": 0, "loss_rank_avg": 0.09140385687351227, "step": 3595, "valid_targets_mean": 6541.4, "valid_targets_min": 3404 }, { "epoch": 6.80794701986755, "grad_norm": 0.5486811174751066, "learning_rate": 9.607456492822132e-08, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.06690894812345505, "step": 3600, "valid_targets_mean": 4560.6, "valid_targets_min": 1293 }, { "epoch": 6.815515610217597, "grad_norm": 0.41971865894051924, "learning_rate": 8.706523924000066e-08, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.06027888506650925, "step": 3605, "valid_targets_mean": 6555.0, "valid_targets_min": 2788 }, { "epoch": 6.824976348155156, "grad_norm": 0.4407706789613994, "learning_rate": 7.849846547778983e-08, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.06519781798124313, "step": 3610, "valid_targets_mean": 6884.4, "valid_targets_min": 1265 }, { "epoch": 6.8344370860927155, "grad_norm": 0.4978073691618193, "learning_rate": 7.03744340325252e-08, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.07424402236938477, "step": 3615, "valid_targets_mean": 6403.1, "valid_targets_min": 4674 }, { "epoch": 6.843897824030274, "grad_norm": 0.5085529248955364, "learning_rate": 6.269332545548068e-08, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.08670083433389664, "step": 3620, "valid_targets_mean": 4922.5, "valid_targets_min": 1785 }, { "epoch": 6.853358561967833, "grad_norm": 0.4344651976137186, "learning_rate": 5.5455310454259894e-08, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.07209931313991547, "step": 3625, "valid_targets_mean": 7308.1, "valid_targets_min": 4659 }, { "epoch": 6.862819299905393, "grad_norm": 0.4413038947876362, "learning_rate": 4.866054988900581e-08, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.06930118799209595, "step": 3630, "valid_targets_mean": 6234.8, "valid_targets_min": 976 }, { "epoch": 6.872280037842952, "grad_norm": 0.48107253716280135, "learning_rate": 4.230919476881479e-08, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.06881730258464813, "step": 3635, "valid_targets_mean": 5447.9, "valid_targets_min": 2560 }, { "epoch": 6.881740775780511, "grad_norm": 0.5104224535773499, "learning_rate": 3.640138624839695e-08, "loss": 0.1429, "loss_nan_ranks": 0, "loss_rank_avg": 0.06860077381134033, "step": 3640, "valid_targets_mean": 6469.2, "valid_targets_min": 3160 }, { "epoch": 6.8912015137180695, "grad_norm": 0.4870345502815453, "learning_rate": 3.093725562492544e-08, "loss": 0.1445, "loss_nan_ranks": 0, "loss_rank_avg": 0.07753711938858032, "step": 3645, "valid_targets_mean": 6092.4, "valid_targets_min": 2908 }, { "epoch": 6.900662251655629, "grad_norm": 0.4461190608500686, "learning_rate": 2.591692433511872e-08, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.060674458742141724, "step": 3650, "valid_targets_mean": 4704.4, "valid_targets_min": 1739 }, { "epoch": 6.910122989593188, "grad_norm": 0.46744896878817527, "learning_rate": 2.1340503952551606e-08, "loss": 0.1454, "loss_nan_ranks": 0, "loss_rank_avg": 0.07023951411247253, "step": 3655, "valid_targets_mean": 6859.5, "valid_targets_min": 4199 }, { "epoch": 6.919583727530747, "grad_norm": 0.4423365813985784, "learning_rate": 1.720809618516839e-08, "loss": 0.1392, "loss_nan_ranks": 0, "loss_rank_avg": 0.05241403728723526, "step": 3660, "valid_targets_mean": 5074.6, "valid_targets_min": 1461 }, { "epoch": 6.929044465468307, "grad_norm": 0.4940830080464678, "learning_rate": 1.351979287302463e-08, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.06597153842449188, "step": 3665, "valid_targets_mean": 5494.9, "valid_targets_min": 1333 }, { "epoch": 6.938505203405866, "grad_norm": 0.5141965819400358, "learning_rate": 1.0275675986242128e-08, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.06885077059268951, "step": 3670, "valid_targets_mean": 5493.0, "valid_targets_min": 1550 }, { "epoch": 6.9479659413434245, "grad_norm": 0.49214237360203794, "learning_rate": 7.475817623194826e-09, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.06208660453557968, "step": 3675, "valid_targets_mean": 4805.9, "valid_targets_min": 699 }, { "epoch": 6.957426679280984, "grad_norm": 0.5374621708278976, "learning_rate": 5.120280008901191e-09, "loss": 0.1467, "loss_nan_ranks": 0, "loss_rank_avg": 0.080912746489048, "step": 3680, "valid_targets_mean": 5787.4, "valid_targets_min": 4241 }, { "epoch": 6.966887417218543, "grad_norm": 0.5296512592742303, "learning_rate": 3.2091154936386705e-09, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.06907324492931366, "step": 3685, "valid_targets_mean": 5773.0, "valid_targets_min": 3043 }, { "epoch": 6.976348155156102, "grad_norm": 0.4419333491426742, "learning_rate": 1.7423665517868338e-09, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.05245755612850189, "step": 3690, "valid_targets_mean": 5486.1, "valid_targets_min": 1693 }, { "epoch": 6.985808893093662, "grad_norm": 0.508769965540501, "learning_rate": 7.200657808792422e-10, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.08677756786346436, "step": 3695, "valid_targets_mean": 6286.6, "valid_targets_min": 2001 }, { "epoch": 6.995269631031221, "grad_norm": 0.47535964660935565, "learning_rate": 1.4223590088180416e-10, "loss": 0.1429, "loss_nan_ranks": 0, "loss_rank_avg": 0.07410024106502533, "step": 3700, "valid_targets_mean": 5791.9, "valid_targets_min": 2377 }, { "epoch": 6.999053926206244, "loss_nan_ranks": 0, "loss_rank_avg": 0.14962854981422424, "step": 3702, "total_flos": 2.2812121694270915e+18, "train_loss": 0.004161321395542221, "train_runtime": 3645.582, "train_samples_per_second": 16.237, "train_steps_per_second": 1.016, "valid_targets_mean": 6778.8, "valid_targets_min": 4131 } ], "logging_steps": 5, "max_steps": 3703, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 200, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 2.2812121694270915e+18, "train_batch_size": 1, "trial_name": null, "trial_params": null }