{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 3913, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.008944543828264758, "grad_norm": 21.606822638718377, "learning_rate": 4.0816326530612243e-07, "loss": 0.9157, "loss_nan_ranks": 0, "loss_rank_avg": 0.9071354866027832, "step": 5, "valid_targets_mean": 4165.1, "valid_targets_min": 1481 }, { "epoch": 0.017889087656529516, "grad_norm": 19.04995792657104, "learning_rate": 9.183673469387756e-07, "loss": 0.9249, "loss_nan_ranks": 0, "loss_rank_avg": 0.8876984119415283, "step": 10, "valid_targets_mean": 3925.7, "valid_targets_min": 1499 }, { "epoch": 0.026833631484794274, "grad_norm": 19.84564044371412, "learning_rate": 1.4285714285714286e-06, "loss": 0.8728, "loss_nan_ranks": 0, "loss_rank_avg": 0.8913623690605164, "step": 15, "valid_targets_mean": 4151.1, "valid_targets_min": 2060 }, { "epoch": 0.03577817531305903, "grad_norm": 12.750163023484031, "learning_rate": 1.938775510204082e-06, "loss": 0.8513, "loss_nan_ranks": 0, "loss_rank_avg": 0.8227970600128174, "step": 20, "valid_targets_mean": 3907.8, "valid_targets_min": 1805 }, { "epoch": 0.044722719141323794, "grad_norm": 7.2429705482367055, "learning_rate": 2.4489795918367347e-06, "loss": 0.7962, "loss_nan_ranks": 0, "loss_rank_avg": 0.7579451203346252, "step": 25, "valid_targets_mean": 4374.8, "valid_targets_min": 538 }, { "epoch": 0.05366726296958855, "grad_norm": 4.437835296542112, "learning_rate": 2.959183673469388e-06, "loss": 0.7424, "loss_nan_ranks": 0, "loss_rank_avg": 0.7099573612213135, "step": 30, "valid_targets_mean": 3956.7, "valid_targets_min": 954 }, { "epoch": 0.0626118067978533, "grad_norm": 2.7488646562577306, "learning_rate": 3.469387755102041e-06, "loss": 0.6793, "loss_nan_ranks": 0, "loss_rank_avg": 0.6850540041923523, "step": 35, "valid_targets_mean": 4000.8, "valid_targets_min": 579 }, { "epoch": 0.07155635062611806, "grad_norm": 2.1085770347953767, "learning_rate": 3.979591836734694e-06, "loss": 0.6197, "loss_nan_ranks": 0, "loss_rank_avg": 0.6641137003898621, "step": 40, "valid_targets_mean": 3597.0, "valid_targets_min": 1574 }, { "epoch": 0.08050089445438283, "grad_norm": 1.6255237321311984, "learning_rate": 4.489795918367348e-06, "loss": 0.6116, "loss_nan_ranks": 0, "loss_rank_avg": 0.6154483556747437, "step": 45, "valid_targets_mean": 3623.8, "valid_targets_min": 850 }, { "epoch": 0.08944543828264759, "grad_norm": 1.2082356599373048, "learning_rate": 5e-06, "loss": 0.6101, "loss_nan_ranks": 0, "loss_rank_avg": 0.5458171367645264, "step": 50, "valid_targets_mean": 3971.1, "valid_targets_min": 627 }, { "epoch": 0.09838998211091235, "grad_norm": 1.0504686350094798, "learning_rate": 5.510204081632653e-06, "loss": 0.5949, "loss_nan_ranks": 0, "loss_rank_avg": 0.573982834815979, "step": 55, "valid_targets_mean": 4307.6, "valid_targets_min": 1734 }, { "epoch": 0.1073345259391771, "grad_norm": 0.9226116061847508, "learning_rate": 6.020408163265307e-06, "loss": 0.5738, "loss_nan_ranks": 0, "loss_rank_avg": 0.559834361076355, "step": 60, "valid_targets_mean": 4199.9, "valid_targets_min": 1122 }, { "epoch": 0.11627906976744186, "grad_norm": 0.8020567416774592, "learning_rate": 6.530612244897959e-06, "loss": 0.5668, "loss_nan_ranks": 0, "loss_rank_avg": 0.5514993071556091, "step": 65, "valid_targets_mean": 4092.1, "valid_targets_min": 1833 }, { "epoch": 0.1252236135957066, "grad_norm": 0.7566279895205129, "learning_rate": 7.0408163265306125e-06, "loss": 0.5578, "loss_nan_ranks": 0, "loss_rank_avg": 0.5654456615447998, "step": 70, "valid_targets_mean": 4476.8, "valid_targets_min": 1837 }, { "epoch": 0.13416815742397137, "grad_norm": 0.8277372126838092, "learning_rate": 7.551020408163265e-06, "loss": 0.5356, "loss_nan_ranks": 0, "loss_rank_avg": 0.4986897110939026, "step": 75, "valid_targets_mean": 3277.0, "valid_targets_min": 1319 }, { "epoch": 0.14311270125223613, "grad_norm": 0.7706280252042736, "learning_rate": 8.06122448979592e-06, "loss": 0.5068, "loss_nan_ranks": 0, "loss_rank_avg": 0.5114747285842896, "step": 80, "valid_targets_mean": 3939.2, "valid_targets_min": 1961 }, { "epoch": 0.1520572450805009, "grad_norm": 0.7370945804564825, "learning_rate": 8.571428571428571e-06, "loss": 0.5039, "loss_nan_ranks": 0, "loss_rank_avg": 0.521478533744812, "step": 85, "valid_targets_mean": 3797.7, "valid_targets_min": 864 }, { "epoch": 0.16100178890876565, "grad_norm": 0.6156667263403908, "learning_rate": 9.081632653061225e-06, "loss": 0.4835, "loss_nan_ranks": 0, "loss_rank_avg": 0.4676780104637146, "step": 90, "valid_targets_mean": 4991.2, "valid_targets_min": 1062 }, { "epoch": 0.16994633273703041, "grad_norm": 0.6654121843319102, "learning_rate": 9.591836734693878e-06, "loss": 0.4785, "loss_nan_ranks": 0, "loss_rank_avg": 0.48915815353393555, "step": 95, "valid_targets_mean": 3783.8, "valid_targets_min": 705 }, { "epoch": 0.17889087656529518, "grad_norm": 0.5656478848830337, "learning_rate": 1.0102040816326531e-05, "loss": 0.4789, "loss_nan_ranks": 0, "loss_rank_avg": 0.4592038094997406, "step": 100, "valid_targets_mean": 4946.6, "valid_targets_min": 743 }, { "epoch": 0.18783542039355994, "grad_norm": 0.5753964943707206, "learning_rate": 1.0612244897959186e-05, "loss": 0.4481, "loss_nan_ranks": 0, "loss_rank_avg": 0.4560643434524536, "step": 105, "valid_targets_mean": 4798.2, "valid_targets_min": 1049 }, { "epoch": 0.1967799642218247, "grad_norm": 0.6637720894363032, "learning_rate": 1.1122448979591838e-05, "loss": 0.4584, "loss_nan_ranks": 0, "loss_rank_avg": 0.47521623969078064, "step": 110, "valid_targets_mean": 3852.6, "valid_targets_min": 1835 }, { "epoch": 0.20572450805008943, "grad_norm": 0.6937897615661168, "learning_rate": 1.1632653061224491e-05, "loss": 0.4686, "loss_nan_ranks": 0, "loss_rank_avg": 0.45546483993530273, "step": 115, "valid_targets_mean": 4407.1, "valid_targets_min": 2317 }, { "epoch": 0.2146690518783542, "grad_norm": 0.6387384496375781, "learning_rate": 1.2142857142857142e-05, "loss": 0.4378, "loss_nan_ranks": 0, "loss_rank_avg": 0.438065767288208, "step": 120, "valid_targets_mean": 4181.9, "valid_targets_min": 1324 }, { "epoch": 0.22361359570661896, "grad_norm": 0.6327727639217386, "learning_rate": 1.2653061224489798e-05, "loss": 0.4679, "loss_nan_ranks": 0, "loss_rank_avg": 0.47834330797195435, "step": 125, "valid_targets_mean": 4268.0, "valid_targets_min": 1629 }, { "epoch": 0.23255813953488372, "grad_norm": 0.6622093710086933, "learning_rate": 1.316326530612245e-05, "loss": 0.427, "loss_nan_ranks": 0, "loss_rank_avg": 0.4127560257911682, "step": 130, "valid_targets_mean": 3824.6, "valid_targets_min": 1371 }, { "epoch": 0.24150268336314848, "grad_norm": 0.6285981733100382, "learning_rate": 1.3673469387755102e-05, "loss": 0.4394, "loss_nan_ranks": 0, "loss_rank_avg": 0.4288730323314667, "step": 135, "valid_targets_mean": 3877.5, "valid_targets_min": 1614 }, { "epoch": 0.2504472271914132, "grad_norm": 0.7388339921347419, "learning_rate": 1.4183673469387755e-05, "loss": 0.4429, "loss_nan_ranks": 0, "loss_rank_avg": 0.420998752117157, "step": 140, "valid_targets_mean": 3424.4, "valid_targets_min": 780 }, { "epoch": 0.259391771019678, "grad_norm": 0.7101396979725441, "learning_rate": 1.469387755102041e-05, "loss": 0.4389, "loss_nan_ranks": 0, "loss_rank_avg": 0.4431981146335602, "step": 145, "valid_targets_mean": 3347.7, "valid_targets_min": 1109 }, { "epoch": 0.26833631484794274, "grad_norm": 0.6957496254556903, "learning_rate": 1.5204081632653063e-05, "loss": 0.4362, "loss_nan_ranks": 0, "loss_rank_avg": 0.4714646339416504, "step": 150, "valid_targets_mean": 4095.1, "valid_targets_min": 787 }, { "epoch": 0.2772808586762075, "grad_norm": 0.6624013827511412, "learning_rate": 1.5714285714285715e-05, "loss": 0.4158, "loss_nan_ranks": 0, "loss_rank_avg": 0.4100586771965027, "step": 155, "valid_targets_mean": 3521.4, "valid_targets_min": 1542 }, { "epoch": 0.28622540250447226, "grad_norm": 1.0921780130652612, "learning_rate": 1.6224489795918368e-05, "loss": 0.4217, "loss_nan_ranks": 0, "loss_rank_avg": 0.44413700699806213, "step": 160, "valid_targets_mean": 3212.3, "valid_targets_min": 945 }, { "epoch": 0.295169946332737, "grad_norm": 0.6555406982106572, "learning_rate": 1.673469387755102e-05, "loss": 0.411, "loss_nan_ranks": 0, "loss_rank_avg": 0.43597084283828735, "step": 165, "valid_targets_mean": 4127.6, "valid_targets_min": 732 }, { "epoch": 0.3041144901610018, "grad_norm": 0.7156947764144866, "learning_rate": 1.7244897959183674e-05, "loss": 0.4142, "loss_nan_ranks": 0, "loss_rank_avg": 0.45090579986572266, "step": 170, "valid_targets_mean": 4241.0, "valid_targets_min": 945 }, { "epoch": 0.31305903398926654, "grad_norm": 0.7843406742359783, "learning_rate": 1.7755102040816327e-05, "loss": 0.4088, "loss_nan_ranks": 0, "loss_rank_avg": 0.409368097782135, "step": 175, "valid_targets_mean": 3534.1, "valid_targets_min": 607 }, { "epoch": 0.3220035778175313, "grad_norm": 0.6832085964985579, "learning_rate": 1.826530612244898e-05, "loss": 0.4323, "loss_nan_ranks": 0, "loss_rank_avg": 0.4517691731452942, "step": 180, "valid_targets_mean": 4510.8, "valid_targets_min": 1674 }, { "epoch": 0.33094812164579607, "grad_norm": 0.6430408307738346, "learning_rate": 1.8775510204081636e-05, "loss": 0.406, "loss_nan_ranks": 0, "loss_rank_avg": 0.4193289875984192, "step": 185, "valid_targets_mean": 4455.5, "valid_targets_min": 1476 }, { "epoch": 0.33989266547406083, "grad_norm": 0.6803856005045361, "learning_rate": 1.928571428571429e-05, "loss": 0.3807, "loss_nan_ranks": 0, "loss_rank_avg": 0.376784086227417, "step": 190, "valid_targets_mean": 3769.6, "valid_targets_min": 715 }, { "epoch": 0.3488372093023256, "grad_norm": 0.7962416214555187, "learning_rate": 1.979591836734694e-05, "loss": 0.4095, "loss_nan_ranks": 0, "loss_rank_avg": 0.40137556195259094, "step": 195, "valid_targets_mean": 3348.6, "valid_targets_min": 831 }, { "epoch": 0.35778175313059035, "grad_norm": 0.6163018468674557, "learning_rate": 2.0306122448979594e-05, "loss": 0.4097, "loss_nan_ranks": 0, "loss_rank_avg": 0.4052973985671997, "step": 200, "valid_targets_mean": 4064.9, "valid_targets_min": 928 }, { "epoch": 0.3667262969588551, "grad_norm": 0.5825225301762951, "learning_rate": 2.0816326530612247e-05, "loss": 0.3895, "loss_nan_ranks": 0, "loss_rank_avg": 0.379678338766098, "step": 205, "valid_targets_mean": 4561.4, "valid_targets_min": 1682 }, { "epoch": 0.3756708407871199, "grad_norm": 0.7186506278507635, "learning_rate": 2.13265306122449e-05, "loss": 0.3987, "loss_nan_ranks": 0, "loss_rank_avg": 0.3955579996109009, "step": 210, "valid_targets_mean": 3334.4, "valid_targets_min": 877 }, { "epoch": 0.38461538461538464, "grad_norm": 0.7102346399517735, "learning_rate": 2.1836734693877552e-05, "loss": 0.3996, "loss_nan_ranks": 0, "loss_rank_avg": 0.3910446763038635, "step": 215, "valid_targets_mean": 3237.5, "valid_targets_min": 1604 }, { "epoch": 0.3935599284436494, "grad_norm": 0.6261071087270799, "learning_rate": 2.2346938775510205e-05, "loss": 0.3979, "loss_nan_ranks": 0, "loss_rank_avg": 0.371921181678772, "step": 220, "valid_targets_mean": 4290.6, "valid_targets_min": 1637 }, { "epoch": 0.40250447227191416, "grad_norm": 0.6481717381436756, "learning_rate": 2.2857142857142858e-05, "loss": 0.3915, "loss_nan_ranks": 0, "loss_rank_avg": 0.3760562539100647, "step": 225, "valid_targets_mean": 3945.3, "valid_targets_min": 1767 }, { "epoch": 0.41144901610017887, "grad_norm": 0.6201712385655748, "learning_rate": 2.336734693877551e-05, "loss": 0.3929, "loss_nan_ranks": 0, "loss_rank_avg": 0.4008695185184479, "step": 230, "valid_targets_mean": 4555.8, "valid_targets_min": 1312 }, { "epoch": 0.4203935599284436, "grad_norm": 0.6203763910651068, "learning_rate": 2.3877551020408167e-05, "loss": 0.3889, "loss_nan_ranks": 0, "loss_rank_avg": 0.41413581371307373, "step": 235, "valid_targets_mean": 4777.6, "valid_targets_min": 2200 }, { "epoch": 0.4293381037567084, "grad_norm": 0.65351087223048, "learning_rate": 2.438775510204082e-05, "loss": 0.3809, "loss_nan_ranks": 0, "loss_rank_avg": 0.3872208297252655, "step": 240, "valid_targets_mean": 3722.7, "valid_targets_min": 1608 }, { "epoch": 0.43828264758497315, "grad_norm": 0.6802074572655615, "learning_rate": 2.4897959183673473e-05, "loss": 0.3602, "loss_nan_ranks": 0, "loss_rank_avg": 0.36208364367485046, "step": 245, "valid_targets_mean": 4687.7, "valid_targets_min": 1944 }, { "epoch": 0.4472271914132379, "grad_norm": 0.8869715993980485, "learning_rate": 2.5408163265306125e-05, "loss": 0.3921, "loss_nan_ranks": 0, "loss_rank_avg": 0.4071674942970276, "step": 250, "valid_targets_mean": 4066.7, "valid_targets_min": 1633 }, { "epoch": 0.4561717352415027, "grad_norm": 0.7031570375051375, "learning_rate": 2.5918367346938778e-05, "loss": 0.3945, "loss_nan_ranks": 0, "loss_rank_avg": 0.38449206948280334, "step": 255, "valid_targets_mean": 3275.8, "valid_targets_min": 807 }, { "epoch": 0.46511627906976744, "grad_norm": 0.6401965700906631, "learning_rate": 2.642857142857143e-05, "loss": 0.3799, "loss_nan_ranks": 0, "loss_rank_avg": 0.4059576094150543, "step": 260, "valid_targets_mean": 4899.2, "valid_targets_min": 1869 }, { "epoch": 0.4740608228980322, "grad_norm": 0.68848774995671, "learning_rate": 2.6938775510204084e-05, "loss": 0.3899, "loss_nan_ranks": 0, "loss_rank_avg": 0.42488914728164673, "step": 265, "valid_targets_mean": 4040.0, "valid_targets_min": 1784 }, { "epoch": 0.48300536672629696, "grad_norm": 0.6555186879962056, "learning_rate": 2.7448979591836737e-05, "loss": 0.3747, "loss_nan_ranks": 0, "loss_rank_avg": 0.37860578298568726, "step": 270, "valid_targets_mean": 3953.7, "valid_targets_min": 1120 }, { "epoch": 0.4919499105545617, "grad_norm": 0.6958637124427978, "learning_rate": 2.7959183673469393e-05, "loss": 0.3657, "loss_nan_ranks": 0, "loss_rank_avg": 0.353659987449646, "step": 275, "valid_targets_mean": 4198.6, "valid_targets_min": 867 }, { "epoch": 0.5008944543828264, "grad_norm": 0.7270956530331304, "learning_rate": 2.8469387755102046e-05, "loss": 0.3695, "loss_nan_ranks": 0, "loss_rank_avg": 0.3616817593574524, "step": 280, "valid_targets_mean": 3319.2, "valid_targets_min": 1008 }, { "epoch": 0.5098389982110912, "grad_norm": 0.6584523988533558, "learning_rate": 2.89795918367347e-05, "loss": 0.3639, "loss_nan_ranks": 0, "loss_rank_avg": 0.3544594645500183, "step": 285, "valid_targets_mean": 3901.2, "valid_targets_min": 1630 }, { "epoch": 0.518783542039356, "grad_norm": 0.6603276785502654, "learning_rate": 2.948979591836735e-05, "loss": 0.3765, "loss_nan_ranks": 0, "loss_rank_avg": 0.3783223032951355, "step": 290, "valid_targets_mean": 4002.2, "valid_targets_min": 1031 }, { "epoch": 0.5277280858676208, "grad_norm": 0.6256302987866349, "learning_rate": 3.0000000000000004e-05, "loss": 0.3801, "loss_nan_ranks": 0, "loss_rank_avg": 0.3801421523094177, "step": 295, "valid_targets_mean": 4247.8, "valid_targets_min": 825 }, { "epoch": 0.5366726296958855, "grad_norm": 0.641725168293166, "learning_rate": 3.0510204081632654e-05, "loss": 0.3661, "loss_nan_ranks": 0, "loss_rank_avg": 0.3630704879760742, "step": 300, "valid_targets_mean": 3875.1, "valid_targets_min": 1685 }, { "epoch": 0.5456171735241503, "grad_norm": 0.811210240684181, "learning_rate": 3.102040816326531e-05, "loss": 0.3741, "loss_nan_ranks": 0, "loss_rank_avg": 0.36272579431533813, "step": 305, "valid_targets_mean": 3257.9, "valid_targets_min": 1264 }, { "epoch": 0.554561717352415, "grad_norm": 0.667191922839525, "learning_rate": 3.153061224489796e-05, "loss": 0.3667, "loss_nan_ranks": 0, "loss_rank_avg": 0.3673118054866791, "step": 310, "valid_targets_mean": 4112.9, "valid_targets_min": 923 }, { "epoch": 0.5635062611806798, "grad_norm": 0.6483488033218554, "learning_rate": 3.2040816326530615e-05, "loss": 0.3695, "loss_nan_ranks": 0, "loss_rank_avg": 0.3770442008972168, "step": 315, "valid_targets_mean": 4392.9, "valid_targets_min": 2212 }, { "epoch": 0.5724508050089445, "grad_norm": 0.6594195347781112, "learning_rate": 3.255102040816327e-05, "loss": 0.3851, "loss_nan_ranks": 0, "loss_rank_avg": 0.3894268274307251, "step": 320, "valid_targets_mean": 4147.8, "valid_targets_min": 1795 }, { "epoch": 0.5813953488372093, "grad_norm": 0.5800198159071142, "learning_rate": 3.306122448979592e-05, "loss": 0.3612, "loss_nan_ranks": 0, "loss_rank_avg": 0.3446458876132965, "step": 325, "valid_targets_mean": 4526.3, "valid_targets_min": 1608 }, { "epoch": 0.590339892665474, "grad_norm": 0.6476011130202899, "learning_rate": 3.357142857142858e-05, "loss": 0.3631, "loss_nan_ranks": 0, "loss_rank_avg": 0.36270543932914734, "step": 330, "valid_targets_mean": 4024.4, "valid_targets_min": 1450 }, { "epoch": 0.5992844364937389, "grad_norm": 0.6522027257372564, "learning_rate": 3.408163265306123e-05, "loss": 0.3654, "loss_nan_ranks": 0, "loss_rank_avg": 0.3855012357234955, "step": 335, "valid_targets_mean": 4163.4, "valid_targets_min": 1675 }, { "epoch": 0.6082289803220036, "grad_norm": 0.6243810739429985, "learning_rate": 3.459183673469388e-05, "loss": 0.3671, "loss_nan_ranks": 0, "loss_rank_avg": 0.3456933796405792, "step": 340, "valid_targets_mean": 3930.6, "valid_targets_min": 1588 }, { "epoch": 0.6171735241502684, "grad_norm": 0.6158815913365016, "learning_rate": 3.510204081632653e-05, "loss": 0.3655, "loss_nan_ranks": 0, "loss_rank_avg": 0.35427260398864746, "step": 345, "valid_targets_mean": 4795.0, "valid_targets_min": 1934 }, { "epoch": 0.6261180679785331, "grad_norm": 0.7068523423045154, "learning_rate": 3.561224489795918e-05, "loss": 0.3687, "loss_nan_ranks": 0, "loss_rank_avg": 0.4106198847293854, "step": 350, "valid_targets_mean": 4016.4, "valid_targets_min": 648 }, { "epoch": 0.6350626118067979, "grad_norm": 0.7843744948487554, "learning_rate": 3.612244897959184e-05, "loss": 0.3634, "loss_nan_ranks": 0, "loss_rank_avg": 0.36276382207870483, "step": 355, "valid_targets_mean": 3936.0, "valid_targets_min": 1615 }, { "epoch": 0.6440071556350626, "grad_norm": 0.6872061405347063, "learning_rate": 3.6632653061224494e-05, "loss": 0.3486, "loss_nan_ranks": 0, "loss_rank_avg": 0.33801645040512085, "step": 360, "valid_targets_mean": 3690.8, "valid_targets_min": 1805 }, { "epoch": 0.6529516994633273, "grad_norm": 0.626374760633224, "learning_rate": 3.714285714285715e-05, "loss": 0.3685, "loss_nan_ranks": 0, "loss_rank_avg": 0.3595544695854187, "step": 365, "valid_targets_mean": 4637.8, "valid_targets_min": 621 }, { "epoch": 0.6618962432915921, "grad_norm": 0.6319521644936286, "learning_rate": 3.76530612244898e-05, "loss": 0.3652, "loss_nan_ranks": 0, "loss_rank_avg": 0.37265145778656006, "step": 370, "valid_targets_mean": 4238.1, "valid_targets_min": 1087 }, { "epoch": 0.6708407871198568, "grad_norm": 0.6238512565906754, "learning_rate": 3.816326530612245e-05, "loss": 0.3527, "loss_nan_ranks": 0, "loss_rank_avg": 0.36174702644348145, "step": 375, "valid_targets_mean": 4511.5, "valid_targets_min": 1518 }, { "epoch": 0.6797853309481217, "grad_norm": 0.569965173329661, "learning_rate": 3.8673469387755105e-05, "loss": 0.3637, "loss_nan_ranks": 0, "loss_rank_avg": 0.34279459714889526, "step": 380, "valid_targets_mean": 4155.4, "valid_targets_min": 1851 }, { "epoch": 0.6887298747763864, "grad_norm": 0.6707477926009685, "learning_rate": 3.9183673469387755e-05, "loss": 0.3725, "loss_nan_ranks": 0, "loss_rank_avg": 0.3640945553779602, "step": 385, "valid_targets_mean": 4214.8, "valid_targets_min": 767 }, { "epoch": 0.6976744186046512, "grad_norm": 0.5367271020119635, "learning_rate": 3.969387755102041e-05, "loss": 0.3422, "loss_nan_ranks": 0, "loss_rank_avg": 0.3215610384941101, "step": 390, "valid_targets_mean": 4804.4, "valid_targets_min": 1580 }, { "epoch": 0.7066189624329159, "grad_norm": 0.6919691468354696, "learning_rate": 3.9999968156003224e-05, "loss": 0.3659, "loss_nan_ranks": 0, "loss_rank_avg": 0.3643749952316284, "step": 395, "valid_targets_mean": 3619.4, "valid_targets_min": 993 }, { "epoch": 0.7155635062611807, "grad_norm": 0.6288859512995435, "learning_rate": 3.999960991220401e-05, "loss": 0.3524, "loss_nan_ranks": 0, "loss_rank_avg": 0.3619106709957123, "step": 400, "valid_targets_mean": 4227.4, "valid_targets_min": 2088 }, { "epoch": 0.7245080500894454, "grad_norm": 0.6317063641588481, "learning_rate": 3.9998853626763316e-05, "loss": 0.3548, "loss_nan_ranks": 0, "loss_rank_avg": 0.3588660657405853, "step": 405, "valid_targets_mean": 4536.9, "valid_targets_min": 1735 }, { "epoch": 0.7334525939177102, "grad_norm": 0.6057461041737375, "learning_rate": 3.999769931473309e-05, "loss": 0.3654, "loss_nan_ranks": 0, "loss_rank_avg": 0.3536277711391449, "step": 410, "valid_targets_mean": 3928.1, "valid_targets_min": 1408 }, { "epoch": 0.7423971377459749, "grad_norm": 0.5865439635131978, "learning_rate": 3.999614699908698e-05, "loss": 0.3447, "loss_nan_ranks": 0, "loss_rank_avg": 0.3287227153778076, "step": 415, "valid_targets_mean": 4680.5, "valid_targets_min": 1738 }, { "epoch": 0.7513416815742398, "grad_norm": 0.6236369468759124, "learning_rate": 3.999419671071993e-05, "loss": 0.36, "loss_nan_ranks": 0, "loss_rank_avg": 0.3473414182662964, "step": 420, "valid_targets_mean": 4636.2, "valid_targets_min": 1483 }, { "epoch": 0.7602862254025045, "grad_norm": 0.6239705685634717, "learning_rate": 3.999184848844746e-05, "loss": 0.3558, "loss_nan_ranks": 0, "loss_rank_avg": 0.31550854444503784, "step": 425, "valid_targets_mean": 3627.9, "valid_targets_min": 1473 }, { "epoch": 0.7692307692307693, "grad_norm": 0.7215363445685998, "learning_rate": 3.9989102379005026e-05, "loss": 0.3531, "loss_nan_ranks": 0, "loss_rank_avg": 0.3723289370536804, "step": 430, "valid_targets_mean": 3313.8, "valid_targets_min": 777 }, { "epoch": 0.778175313059034, "grad_norm": 0.6314029660945639, "learning_rate": 3.9985958437046976e-05, "loss": 0.346, "loss_nan_ranks": 0, "loss_rank_avg": 0.3319028913974762, "step": 435, "valid_targets_mean": 4074.1, "valid_targets_min": 1150 }, { "epoch": 0.7871198568872988, "grad_norm": 0.671810871870371, "learning_rate": 3.998241672514551e-05, "loss": 0.3593, "loss_nan_ranks": 0, "loss_rank_avg": 0.3606319725513458, "step": 440, "valid_targets_mean": 3716.7, "valid_targets_min": 1462 }, { "epoch": 0.7960644007155635, "grad_norm": 0.6534639604048026, "learning_rate": 3.997847731378946e-05, "loss": 0.3545, "loss_nan_ranks": 0, "loss_rank_avg": 0.3522427976131439, "step": 445, "valid_targets_mean": 3853.1, "valid_targets_min": 1761 }, { "epoch": 0.8050089445438283, "grad_norm": 0.6256271897448633, "learning_rate": 3.9974140281382844e-05, "loss": 0.3523, "loss_nan_ranks": 0, "loss_rank_avg": 0.3305948078632355, "step": 450, "valid_targets_mean": 4348.7, "valid_targets_min": 2006 }, { "epoch": 0.813953488372093, "grad_norm": 0.665427663210199, "learning_rate": 3.996940571424331e-05, "loss": 0.3417, "loss_nan_ranks": 0, "loss_rank_avg": 0.3263488709926605, "step": 455, "valid_targets_mean": 3719.2, "valid_targets_min": 2056 }, { "epoch": 0.8228980322003577, "grad_norm": 0.6525668365849738, "learning_rate": 3.996427370660045e-05, "loss": 0.3491, "loss_nan_ranks": 0, "loss_rank_avg": 0.357142835855484, "step": 460, "valid_targets_mean": 4044.6, "valid_targets_min": 681 }, { "epoch": 0.8318425760286225, "grad_norm": 0.5874893016038123, "learning_rate": 3.995874436059389e-05, "loss": 0.3463, "loss_nan_ranks": 0, "loss_rank_avg": 0.34184402227401733, "step": 465, "valid_targets_mean": 4344.1, "valid_targets_min": 1744 }, { "epoch": 0.8407871198568873, "grad_norm": 0.6543028013713276, "learning_rate": 3.9952817786271264e-05, "loss": 0.3456, "loss_nan_ranks": 0, "loss_rank_avg": 0.3407524824142456, "step": 470, "valid_targets_mean": 4510.4, "valid_targets_min": 2428 }, { "epoch": 0.8497316636851521, "grad_norm": 0.6482522573193757, "learning_rate": 3.994649410158605e-05, "loss": 0.3445, "loss_nan_ranks": 0, "loss_rank_avg": 0.336134672164917, "step": 475, "valid_targets_mean": 3787.4, "valid_targets_min": 545 }, { "epoch": 0.8586762075134168, "grad_norm": 0.6618318888035204, "learning_rate": 3.99397734323952e-05, "loss": 0.3559, "loss_nan_ranks": 0, "loss_rank_avg": 0.39081141352653503, "step": 480, "valid_targets_mean": 4617.5, "valid_targets_min": 778 }, { "epoch": 0.8676207513416816, "grad_norm": 0.6461883560383084, "learning_rate": 3.993265591245662e-05, "loss": 0.3481, "loss_nan_ranks": 0, "loss_rank_avg": 0.3543085753917694, "step": 485, "valid_targets_mean": 4650.8, "valid_targets_min": 1304 }, { "epoch": 0.8765652951699463, "grad_norm": 0.7166558381651617, "learning_rate": 3.992514168342655e-05, "loss": 0.355, "loss_nan_ranks": 0, "loss_rank_avg": 0.3686150312423706, "step": 490, "valid_targets_mean": 3723.8, "valid_targets_min": 927 }, { "epoch": 0.8855098389982111, "grad_norm": 0.6815294274219248, "learning_rate": 3.9917230894856705e-05, "loss": 0.3437, "loss_nan_ranks": 0, "loss_rank_avg": 0.3497094511985779, "step": 495, "valid_targets_mean": 3219.9, "valid_targets_min": 669 }, { "epoch": 0.8944543828264758, "grad_norm": 0.78386232455594, "learning_rate": 3.990892370419132e-05, "loss": 0.3493, "loss_nan_ranks": 0, "loss_rank_avg": 0.35013243556022644, "step": 500, "valid_targets_mean": 3843.9, "valid_targets_min": 1370 }, { "epoch": 0.9033989266547406, "grad_norm": 0.6199422182618969, "learning_rate": 3.9900220276764013e-05, "loss": 0.3418, "loss_nan_ranks": 0, "loss_rank_avg": 0.35459715127944946, "step": 505, "valid_targets_mean": 4905.9, "valid_targets_min": 2222 }, { "epoch": 0.9123434704830053, "grad_norm": 0.6761601566190695, "learning_rate": 3.989112078579449e-05, "loss": 0.3363, "loss_nan_ranks": 0, "loss_rank_avg": 0.34386712312698364, "step": 510, "valid_targets_mean": 3200.0, "valid_targets_min": 1484 }, { "epoch": 0.9212880143112702, "grad_norm": 0.5809388892974982, "learning_rate": 3.988162541238509e-05, "loss": 0.3556, "loss_nan_ranks": 0, "loss_rank_avg": 0.3644087314605713, "step": 515, "valid_targets_mean": 4901.0, "valid_targets_min": 720 }, { "epoch": 0.9302325581395349, "grad_norm": 0.6670957667841473, "learning_rate": 3.98717343455172e-05, "loss": 0.3468, "loss_nan_ranks": 0, "loss_rank_avg": 0.3259006440639496, "step": 520, "valid_targets_mean": 3929.0, "valid_targets_min": 819 }, { "epoch": 0.9391771019677997, "grad_norm": 0.6133306725020052, "learning_rate": 3.9861447782047495e-05, "loss": 0.3521, "loss_nan_ranks": 0, "loss_rank_avg": 0.3232124149799347, "step": 525, "valid_targets_mean": 4338.9, "valid_targets_min": 1621 }, { "epoch": 0.9481216457960644, "grad_norm": 0.5945215828915712, "learning_rate": 3.9850765926704e-05, "loss": 0.3457, "loss_nan_ranks": 0, "loss_rank_avg": 0.3464571535587311, "step": 530, "valid_targets_mean": 4751.4, "valid_targets_min": 1880 }, { "epoch": 0.9570661896243292, "grad_norm": 0.616855899500005, "learning_rate": 3.9839688992082004e-05, "loss": 0.3406, "loss_nan_ranks": 0, "loss_rank_avg": 0.33732545375823975, "step": 535, "valid_targets_mean": 3987.8, "valid_targets_min": 1435 }, { "epoch": 0.9660107334525939, "grad_norm": 0.5714623187800117, "learning_rate": 3.9828217198639884e-05, "loss": 0.345, "loss_nan_ranks": 0, "loss_rank_avg": 0.3435646891593933, "step": 540, "valid_targets_mean": 4915.8, "valid_targets_min": 1400 }, { "epoch": 0.9749552772808586, "grad_norm": 0.6324746280014568, "learning_rate": 3.981635077469468e-05, "loss": 0.3394, "loss_nan_ranks": 0, "loss_rank_avg": 0.3339131474494934, "step": 545, "valid_targets_mean": 3912.2, "valid_targets_min": 1666 }, { "epoch": 0.9838998211091234, "grad_norm": 0.626118262073981, "learning_rate": 3.980408995641751e-05, "loss": 0.3219, "loss_nan_ranks": 0, "loss_rank_avg": 0.33410966396331787, "step": 550, "valid_targets_mean": 4326.9, "valid_targets_min": 1565 }, { "epoch": 0.9928443649373881, "grad_norm": 0.5559330654712583, "learning_rate": 3.979143498782898e-05, "loss": 0.3523, "loss_nan_ranks": 0, "loss_rank_avg": 0.3249479830265045, "step": 555, "valid_targets_mean": 4442.0, "valid_targets_min": 1579 }, { "epoch": 1.0017889087656529, "grad_norm": 0.5744899255811827, "learning_rate": 3.977838612079419e-05, "loss": 0.3482, "loss_nan_ranks": 0, "loss_rank_avg": 0.34298670291900635, "step": 560, "valid_targets_mean": 4366.9, "valid_targets_min": 1630 }, { "epoch": 1.0107334525939178, "grad_norm": 0.540064997986571, "learning_rate": 3.976494361501786e-05, "loss": 0.3255, "loss_nan_ranks": 0, "loss_rank_avg": 0.29019173979759216, "step": 565, "valid_targets_mean": 4183.6, "valid_targets_min": 1293 }, { "epoch": 1.0196779964221825, "grad_norm": 0.6708126937194594, "learning_rate": 3.975110773803904e-05, "loss": 0.3291, "loss_nan_ranks": 0, "loss_rank_avg": 0.3077584505081177, "step": 570, "valid_targets_mean": 3365.9, "valid_targets_min": 1599 }, { "epoch": 1.0286225402504472, "grad_norm": 0.5975546705521818, "learning_rate": 3.973687876522587e-05, "loss": 0.3099, "loss_nan_ranks": 0, "loss_rank_avg": 0.3131313920021057, "step": 575, "valid_targets_mean": 3975.9, "valid_targets_min": 1659 }, { "epoch": 1.037567084078712, "grad_norm": 0.5802313523133982, "learning_rate": 3.9722256979770054e-05, "loss": 0.3228, "loss_nan_ranks": 0, "loss_rank_avg": 0.3223347067832947, "step": 580, "valid_targets_mean": 3876.8, "valid_targets_min": 1256 }, { "epoch": 1.0465116279069768, "grad_norm": 0.5940502139996998, "learning_rate": 3.970724267268125e-05, "loss": 0.3316, "loss_nan_ranks": 0, "loss_rank_avg": 0.3173867166042328, "step": 585, "valid_targets_mean": 3916.0, "valid_targets_min": 1519 }, { "epoch": 1.0554561717352415, "grad_norm": 0.5526882078589692, "learning_rate": 3.969183614278125e-05, "loss": 0.3205, "loss_nan_ranks": 0, "loss_rank_avg": 0.3090658187866211, "step": 590, "valid_targets_mean": 3783.8, "valid_targets_min": 1558 }, { "epoch": 1.0644007155635062, "grad_norm": 0.5756072638500698, "learning_rate": 3.9676037696698056e-05, "loss": 0.3451, "loss_nan_ranks": 0, "loss_rank_avg": 0.33000075817108154, "step": 595, "valid_targets_mean": 4377.0, "valid_targets_min": 1580 }, { "epoch": 1.073345259391771, "grad_norm": 0.6209850679632152, "learning_rate": 3.9659847648859775e-05, "loss": 0.3358, "loss_nan_ranks": 0, "loss_rank_avg": 0.3666132092475891, "step": 600, "valid_targets_mean": 3891.3, "valid_targets_min": 766 }, { "epoch": 1.0822898032200359, "grad_norm": 0.574730620347152, "learning_rate": 3.9643266321488354e-05, "loss": 0.3297, "loss_nan_ranks": 0, "loss_rank_avg": 0.31989532709121704, "step": 605, "valid_targets_mean": 4488.6, "valid_targets_min": 1565 }, { "epoch": 1.0912343470483006, "grad_norm": 0.7137118300894771, "learning_rate": 3.962629404459317e-05, "loss": 0.3272, "loss_nan_ranks": 0, "loss_rank_avg": 0.3319159746170044, "step": 610, "valid_targets_mean": 2972.9, "valid_targets_min": 625 }, { "epoch": 1.1001788908765653, "grad_norm": 0.5664071308134078, "learning_rate": 3.960893115596445e-05, "loss": 0.3098, "loss_nan_ranks": 0, "loss_rank_avg": 0.2983168065547943, "step": 615, "valid_targets_mean": 4385.4, "valid_targets_min": 1484 }, { "epoch": 1.10912343470483, "grad_norm": 0.617788180227712, "learning_rate": 3.959117800116658e-05, "loss": 0.3321, "loss_nan_ranks": 0, "loss_rank_avg": 0.3224518299102783, "step": 620, "valid_targets_mean": 3728.5, "valid_targets_min": 988 }, { "epoch": 1.118067978533095, "grad_norm": 0.6068172667148498, "learning_rate": 3.9573034933531195e-05, "loss": 0.3308, "loss_nan_ranks": 0, "loss_rank_avg": 0.3229108154773712, "step": 625, "valid_targets_mean": 4483.8, "valid_targets_min": 1824 }, { "epoch": 1.1270125223613596, "grad_norm": 0.6113158435705944, "learning_rate": 3.955450231415014e-05, "loss": 0.3405, "loss_nan_ranks": 0, "loss_rank_avg": 0.3196060061454773, "step": 630, "valid_targets_mean": 4137.5, "valid_targets_min": 1364 }, { "epoch": 1.1359570661896243, "grad_norm": 0.6173710617052496, "learning_rate": 3.953558051186834e-05, "loss": 0.3333, "loss_nan_ranks": 0, "loss_rank_avg": 0.34940510988235474, "step": 635, "valid_targets_mean": 4084.4, "valid_targets_min": 1886 }, { "epoch": 1.144901610017889, "grad_norm": 0.6846373488774041, "learning_rate": 3.95162699032764e-05, "loss": 0.3244, "loss_nan_ranks": 0, "loss_rank_avg": 0.3563871383666992, "step": 640, "valid_targets_mean": 4735.4, "valid_targets_min": 1188 }, { "epoch": 1.1538461538461537, "grad_norm": 0.6569856707625712, "learning_rate": 3.949657087270313e-05, "loss": 0.3199, "loss_nan_ranks": 0, "loss_rank_avg": 0.32631808519363403, "step": 645, "valid_targets_mean": 4182.3, "valid_targets_min": 850 }, { "epoch": 1.1627906976744187, "grad_norm": 0.5672879733062905, "learning_rate": 3.947648381220789e-05, "loss": 0.3152, "loss_nan_ranks": 0, "loss_rank_avg": 0.31764596700668335, "step": 650, "valid_targets_mean": 3908.7, "valid_targets_min": 646 }, { "epoch": 1.1717352415026834, "grad_norm": 0.6801671519180097, "learning_rate": 3.9456009121572824e-05, "loss": 0.3233, "loss_nan_ranks": 0, "loss_rank_avg": 0.31651636958122253, "step": 655, "valid_targets_mean": 3767.4, "valid_targets_min": 1485 }, { "epoch": 1.180679785330948, "grad_norm": 0.5776768005096825, "learning_rate": 3.943514720829485e-05, "loss": 0.3302, "loss_nan_ranks": 0, "loss_rank_avg": 0.3585665225982666, "step": 660, "valid_targets_mean": 4321.3, "valid_targets_min": 1595 }, { "epoch": 1.1896243291592128, "grad_norm": 0.6632996529951345, "learning_rate": 3.941389848757756e-05, "loss": 0.3293, "loss_nan_ranks": 0, "loss_rank_avg": 0.34740591049194336, "step": 665, "valid_targets_mean": 3854.9, "valid_targets_min": 1643 }, { "epoch": 1.1985688729874777, "grad_norm": 0.6568776669609784, "learning_rate": 3.9392263382323e-05, "loss": 0.3271, "loss_nan_ranks": 0, "loss_rank_avg": 0.3057899475097656, "step": 670, "valid_targets_mean": 3277.4, "valid_targets_min": 1615 }, { "epoch": 1.2075134168157424, "grad_norm": 0.6270834310864767, "learning_rate": 3.93702423231232e-05, "loss": 0.3227, "loss_nan_ranks": 0, "loss_rank_avg": 0.32783782482147217, "step": 675, "valid_targets_mean": 3216.5, "valid_targets_min": 1055 }, { "epoch": 1.2164579606440071, "grad_norm": 0.6305095200057445, "learning_rate": 3.9347835748251645e-05, "loss": 0.332, "loss_nan_ranks": 0, "loss_rank_avg": 0.3536560535430908, "step": 680, "valid_targets_mean": 3572.4, "valid_targets_min": 552 }, { "epoch": 1.2254025044722718, "grad_norm": 0.5736045805917658, "learning_rate": 3.9325044103654526e-05, "loss": 0.3348, "loss_nan_ranks": 0, "loss_rank_avg": 0.3276847004890442, "step": 685, "valid_targets_mean": 3811.6, "valid_targets_min": 1374 }, { "epoch": 1.2343470483005368, "grad_norm": 0.5244473851418727, "learning_rate": 3.9301867842941867e-05, "loss": 0.3302, "loss_nan_ranks": 0, "loss_rank_avg": 0.3139815926551819, "step": 690, "valid_targets_mean": 4468.8, "valid_targets_min": 1504 }, { "epoch": 1.2432915921288015, "grad_norm": 0.5751467981153631, "learning_rate": 3.9278307427378495e-05, "loss": 0.335, "loss_nan_ranks": 0, "loss_rank_avg": 0.320250928401947, "step": 695, "valid_targets_mean": 4114.9, "valid_targets_min": 2051 }, { "epoch": 1.2522361359570662, "grad_norm": 0.57724364766724, "learning_rate": 3.92543633258749e-05, "loss": 0.3328, "loss_nan_ranks": 0, "loss_rank_avg": 0.3237752914428711, "step": 700, "valid_targets_mean": 4272.7, "valid_targets_min": 1724 }, { "epoch": 1.2611806797853309, "grad_norm": 0.6222962371838422, "learning_rate": 3.923003601497785e-05, "loss": 0.3096, "loss_nan_ranks": 0, "loss_rank_avg": 0.2992010712623596, "step": 705, "valid_targets_mean": 3838.6, "valid_targets_min": 1073 }, { "epoch": 1.2701252236135958, "grad_norm": 0.5745002540877785, "learning_rate": 3.920532597886091e-05, "loss": 0.3273, "loss_nan_ranks": 0, "loss_rank_avg": 0.33431553840637207, "step": 710, "valid_targets_mean": 4709.8, "valid_targets_min": 1660 }, { "epoch": 1.2790697674418605, "grad_norm": 0.8250895929655195, "learning_rate": 3.918023370931485e-05, "loss": 0.3325, "loss_nan_ranks": 0, "loss_rank_avg": 0.34380948543548584, "step": 715, "valid_targets_mean": 3260.9, "valid_targets_min": 1452 }, { "epoch": 1.2880143112701252, "grad_norm": 0.5891395257155815, "learning_rate": 3.915475970573782e-05, "loss": 0.3116, "loss_nan_ranks": 0, "loss_rank_avg": 0.31047481298446655, "step": 720, "valid_targets_mean": 3394.5, "valid_targets_min": 728 }, { "epoch": 1.29695885509839, "grad_norm": 0.5492069212467995, "learning_rate": 3.9128904475125414e-05, "loss": 0.3236, "loss_nan_ranks": 0, "loss_rank_avg": 0.3350293040275574, "step": 725, "valid_targets_mean": 4490.6, "valid_targets_min": 1470 }, { "epoch": 1.3059033989266546, "grad_norm": 0.606471839392876, "learning_rate": 3.910266853206058e-05, "loss": 0.3227, "loss_nan_ranks": 0, "loss_rank_avg": 0.3107641935348511, "step": 730, "valid_targets_mean": 3896.6, "valid_targets_min": 545 }, { "epoch": 1.3148479427549196, "grad_norm": 0.6158261916551597, "learning_rate": 3.907605239870342e-05, "loss": 0.3187, "loss_nan_ranks": 0, "loss_rank_avg": 0.31847408413887024, "step": 735, "valid_targets_mean": 3804.2, "valid_targets_min": 741 }, { "epoch": 1.3237924865831843, "grad_norm": 0.6321605305603367, "learning_rate": 3.904905660478072e-05, "loss": 0.3249, "loss_nan_ranks": 0, "loss_rank_avg": 0.3120426833629608, "step": 740, "valid_targets_mean": 3962.6, "valid_targets_min": 1180 }, { "epoch": 1.332737030411449, "grad_norm": 0.5592948617131595, "learning_rate": 3.9021681687575465e-05, "loss": 0.3179, "loss_nan_ranks": 0, "loss_rank_avg": 0.323030024766922, "step": 745, "valid_targets_mean": 4431.0, "valid_targets_min": 1535 }, { "epoch": 1.341681574239714, "grad_norm": 0.5325276240664678, "learning_rate": 3.8993928191916134e-05, "loss": 0.3142, "loss_nan_ranks": 0, "loss_rank_avg": 0.30110353231430054, "step": 750, "valid_targets_mean": 4319.6, "valid_targets_min": 1804 }, { "epoch": 1.3506261180679786, "grad_norm": 0.5538507843730288, "learning_rate": 3.8965796670165856e-05, "loss": 0.3166, "loss_nan_ranks": 0, "loss_rank_avg": 0.31126099824905396, "step": 755, "valid_targets_mean": 4311.1, "valid_targets_min": 1641 }, { "epoch": 1.3595706618962433, "grad_norm": 0.5678960091362133, "learning_rate": 3.893728768221139e-05, "loss": 0.3244, "loss_nan_ranks": 0, "loss_rank_avg": 0.305950790643692, "step": 760, "valid_targets_mean": 3987.8, "valid_targets_min": 2194 }, { "epoch": 1.368515205724508, "grad_norm": 0.5888212617780767, "learning_rate": 3.8908401795452033e-05, "loss": 0.3307, "loss_nan_ranks": 0, "loss_rank_avg": 0.3165014684200287, "step": 765, "valid_targets_mean": 4065.1, "valid_targets_min": 1441 }, { "epoch": 1.3774597495527727, "grad_norm": 0.6376960259257772, "learning_rate": 3.8879139584788286e-05, "loss": 0.3235, "loss_nan_ranks": 0, "loss_rank_avg": 0.3417049050331116, "step": 770, "valid_targets_mean": 3551.9, "valid_targets_min": 1828 }, { "epoch": 1.3864042933810374, "grad_norm": 0.5627522323734243, "learning_rate": 3.884950163261042e-05, "loss": 0.3218, "loss_nan_ranks": 0, "loss_rank_avg": 0.32489728927612305, "step": 775, "valid_targets_mean": 3681.4, "valid_targets_min": 1565 }, { "epoch": 1.3953488372093024, "grad_norm": 0.643663426567113, "learning_rate": 3.8819488528786904e-05, "loss": 0.3162, "loss_nan_ranks": 0, "loss_rank_avg": 0.29307177662849426, "step": 780, "valid_targets_mean": 3725.8, "valid_targets_min": 778 }, { "epoch": 1.404293381037567, "grad_norm": 0.5860397601189946, "learning_rate": 3.878910087065264e-05, "loss": 0.3255, "loss_nan_ranks": 0, "loss_rank_avg": 0.31179744005203247, "step": 785, "valid_targets_mean": 3490.3, "valid_targets_min": 997 }, { "epoch": 1.4132379248658318, "grad_norm": 0.6006178361895881, "learning_rate": 3.8758339262997094e-05, "loss": 0.3207, "loss_nan_ranks": 0, "loss_rank_avg": 0.3223787546157837, "step": 790, "valid_targets_mean": 3681.4, "valid_targets_min": 1614 }, { "epoch": 1.4221824686940967, "grad_norm": 0.5703573435024017, "learning_rate": 3.872720431805224e-05, "loss": 0.3108, "loss_nan_ranks": 0, "loss_rank_avg": 0.31823939085006714, "step": 795, "valid_targets_mean": 3783.3, "valid_targets_min": 474 }, { "epoch": 1.4311270125223614, "grad_norm": 0.5583054675958945, "learning_rate": 3.86956966554804e-05, "loss": 0.3226, "loss_nan_ranks": 0, "loss_rank_avg": 0.3209839463233948, "step": 800, "valid_targets_mean": 4748.8, "valid_targets_min": 1829 }, { "epoch": 1.4400715563506261, "grad_norm": 0.5734451464718057, "learning_rate": 3.8663816902361896e-05, "loss": 0.3223, "loss_nan_ranks": 0, "loss_rank_avg": 0.3395638167858124, "step": 805, "valid_targets_mean": 4469.4, "valid_targets_min": 954 }, { "epoch": 1.4490161001788908, "grad_norm": 0.6240967521849574, "learning_rate": 3.863156569318256e-05, "loss": 0.3185, "loss_nan_ranks": 0, "loss_rank_avg": 0.342720627784729, "step": 810, "valid_targets_mean": 3274.9, "valid_targets_min": 873 }, { "epoch": 1.4579606440071555, "grad_norm": 0.5839916094456372, "learning_rate": 3.8598943669821124e-05, "loss": 0.3352, "loss_nan_ranks": 0, "loss_rank_avg": 0.34921061992645264, "step": 815, "valid_targets_mean": 4149.1, "valid_targets_min": 1776 }, { "epoch": 1.4669051878354205, "grad_norm": 0.5327258875676051, "learning_rate": 3.856595148153643e-05, "loss": 0.332, "loss_nan_ranks": 0, "loss_rank_avg": 0.29739612340927124, "step": 820, "valid_targets_mean": 4420.4, "valid_targets_min": 1722 }, { "epoch": 1.4758497316636852, "grad_norm": 0.5726474256279158, "learning_rate": 3.853258978495454e-05, "loss": 0.3283, "loss_nan_ranks": 0, "loss_rank_avg": 0.3427349925041199, "step": 825, "valid_targets_mean": 4086.2, "valid_targets_min": 754 }, { "epoch": 1.4847942754919499, "grad_norm": 0.5586681064868766, "learning_rate": 3.8498859244055616e-05, "loss": 0.3201, "loss_nan_ranks": 0, "loss_rank_avg": 0.30017322301864624, "step": 830, "valid_targets_mean": 4213.1, "valid_targets_min": 1521 }, { "epoch": 1.4937388193202148, "grad_norm": 0.5545114860278723, "learning_rate": 3.8464760530160756e-05, "loss": 0.3041, "loss_nan_ranks": 0, "loss_rank_avg": 0.3249306082725525, "step": 835, "valid_targets_mean": 4479.8, "valid_targets_min": 1882 }, { "epoch": 1.5026833631484795, "grad_norm": 0.5851321941617261, "learning_rate": 3.843029432191858e-05, "loss": 0.32, "loss_nan_ranks": 0, "loss_rank_avg": 0.3026468753814697, "step": 840, "valid_targets_mean": 3582.4, "valid_targets_min": 1779 }, { "epoch": 1.5116279069767442, "grad_norm": 0.6559733463498192, "learning_rate": 3.839546130529179e-05, "loss": 0.3174, "loss_nan_ranks": 0, "loss_rank_avg": 0.33914104104042053, "step": 845, "valid_targets_mean": 4173.3, "valid_targets_min": 1823 }, { "epoch": 1.520572450805009, "grad_norm": 0.6371050604836407, "learning_rate": 3.8360262173543467e-05, "loss": 0.3255, "loss_nan_ranks": 0, "loss_rank_avg": 0.32565081119537354, "step": 850, "valid_targets_mean": 3549.8, "valid_targets_min": 822 }, { "epoch": 1.5295169946332736, "grad_norm": 0.5768187274321938, "learning_rate": 3.8324697627223263e-05, "loss": 0.317, "loss_nan_ranks": 0, "loss_rank_avg": 0.3176955282688141, "step": 855, "valid_targets_mean": 3880.8, "valid_targets_min": 671 }, { "epoch": 1.5384615384615383, "grad_norm": 0.5482702475809518, "learning_rate": 3.828876837415352e-05, "loss": 0.3107, "loss_nan_ranks": 0, "loss_rank_avg": 0.2995319962501526, "step": 860, "valid_targets_mean": 4659.9, "valid_targets_min": 1931 }, { "epoch": 1.5474060822898033, "grad_norm": 0.6038821934595454, "learning_rate": 3.8252475129415127e-05, "loss": 0.3161, "loss_nan_ranks": 0, "loss_rank_avg": 0.32784345746040344, "step": 865, "valid_targets_mean": 3603.8, "valid_targets_min": 747 }, { "epoch": 1.556350626118068, "grad_norm": 0.5283881224885371, "learning_rate": 3.82158186153333e-05, "loss": 0.3159, "loss_nan_ranks": 0, "loss_rank_avg": 0.30888307094573975, "step": 870, "valid_targets_mean": 4141.3, "valid_targets_min": 1381 }, { "epoch": 1.5652951699463329, "grad_norm": 0.5983795772826802, "learning_rate": 3.817879956146323e-05, "loss": 0.3294, "loss_nan_ranks": 0, "loss_rank_avg": 0.34233012795448303, "step": 875, "valid_targets_mean": 4115.4, "valid_targets_min": 1008 }, { "epoch": 1.5742397137745976, "grad_norm": 0.6611039790326494, "learning_rate": 3.814141870457553e-05, "loss": 0.3115, "loss_nan_ranks": 0, "loss_rank_avg": 0.3333245813846588, "step": 880, "valid_targets_mean": 3703.6, "valid_targets_min": 848 }, { "epoch": 1.5831842576028623, "grad_norm": 0.5991870251745893, "learning_rate": 3.810367678864159e-05, "loss": 0.3237, "loss_nan_ranks": 0, "loss_rank_avg": 0.30103540420532227, "step": 885, "valid_targets_mean": 3587.0, "valid_targets_min": 1491 }, { "epoch": 1.592128801431127, "grad_norm": 0.5618095876534, "learning_rate": 3.806557456481878e-05, "loss": 0.3343, "loss_nan_ranks": 0, "loss_rank_avg": 0.31948399543762207, "step": 890, "valid_targets_mean": 3862.9, "valid_targets_min": 715 }, { "epoch": 1.6010733452593917, "grad_norm": 0.6334383283680136, "learning_rate": 3.8027112791435466e-05, "loss": 0.3288, "loss_nan_ranks": 0, "loss_rank_avg": 0.31764253973960876, "step": 895, "valid_targets_mean": 3225.9, "valid_targets_min": 607 }, { "epoch": 1.6100178890876564, "grad_norm": 0.582112973475375, "learning_rate": 3.7988292233975947e-05, "loss": 0.3329, "loss_nan_ranks": 0, "loss_rank_avg": 0.33960235118865967, "step": 900, "valid_targets_mean": 4268.9, "valid_targets_min": 1483 }, { "epoch": 1.6189624329159211, "grad_norm": 0.5815635189350303, "learning_rate": 3.7949113665065226e-05, "loss": 0.3234, "loss_nan_ranks": 0, "loss_rank_avg": 0.3374456763267517, "step": 905, "valid_targets_mean": 4174.2, "valid_targets_min": 687 }, { "epoch": 1.627906976744186, "grad_norm": 1.0497579746341565, "learning_rate": 3.7909577864453593e-05, "loss": 0.325, "loss_nan_ranks": 0, "loss_rank_avg": 0.3294409513473511, "step": 910, "valid_targets_mean": 4344.9, "valid_targets_min": 827 }, { "epoch": 1.6368515205724508, "grad_norm": 0.567491242330487, "learning_rate": 3.786968561900116e-05, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.2935563325881958, "step": 915, "valid_targets_mean": 3874.4, "valid_targets_min": 1672 }, { "epoch": 1.6457960644007157, "grad_norm": 0.6318743528248707, "learning_rate": 3.782943772266213e-05, "loss": 0.3191, "loss_nan_ranks": 0, "loss_rank_avg": 0.3036611080169678, "step": 920, "valid_targets_mean": 3250.3, "valid_targets_min": 911 }, { "epoch": 1.6547406082289804, "grad_norm": 0.6392903008216162, "learning_rate": 3.7788834976469095e-05, "loss": 0.3083, "loss_nan_ranks": 0, "loss_rank_avg": 0.3205622434616089, "step": 925, "valid_targets_mean": 3400.8, "valid_targets_min": 978 }, { "epoch": 1.663685152057245, "grad_norm": 0.5491612081779448, "learning_rate": 3.7747878188516965e-05, "loss": 0.3137, "loss_nan_ranks": 0, "loss_rank_avg": 0.3106827437877655, "step": 930, "valid_targets_mean": 4198.3, "valid_targets_min": 1757 }, { "epoch": 1.6726296958855098, "grad_norm": 0.5396436465197288, "learning_rate": 3.770656817394703e-05, "loss": 0.3168, "loss_nan_ranks": 0, "loss_rank_avg": 0.30610522627830505, "step": 935, "valid_targets_mean": 4018.6, "valid_targets_min": 1540 }, { "epoch": 1.6815742397137745, "grad_norm": 0.4890047892792955, "learning_rate": 3.7664905754930616e-05, "loss": 0.3155, "loss_nan_ranks": 0, "loss_rank_avg": 0.31638064980506897, "step": 940, "valid_targets_mean": 4828.7, "valid_targets_min": 1454 }, { "epoch": 1.6905187835420392, "grad_norm": 0.5488512250424282, "learning_rate": 3.762289176065276e-05, "loss": 0.3167, "loss_nan_ranks": 0, "loss_rank_avg": 0.3114585280418396, "step": 945, "valid_targets_mean": 4037.7, "valid_targets_min": 600 }, { "epoch": 1.6994633273703041, "grad_norm": 0.643517620390725, "learning_rate": 3.758052702729576e-05, "loss": 0.3127, "loss_nan_ranks": 0, "loss_rank_avg": 0.305495023727417, "step": 950, "valid_targets_mean": 4262.5, "valid_targets_min": 1184 }, { "epoch": 1.7084078711985689, "grad_norm": 0.5457086631910586, "learning_rate": 3.753781239802245e-05, "loss": 0.3132, "loss_nan_ranks": 0, "loss_rank_avg": 0.2907237410545349, "step": 955, "valid_targets_mean": 3675.6, "valid_targets_min": 1495 }, { "epoch": 1.7173524150268338, "grad_norm": 0.5241171467893824, "learning_rate": 3.749474872295946e-05, "loss": 0.3125, "loss_nan_ranks": 0, "loss_rank_avg": 0.2793015241622925, "step": 960, "valid_targets_mean": 3477.6, "valid_targets_min": 1785 }, { "epoch": 1.7262969588550985, "grad_norm": 0.5513650345883626, "learning_rate": 3.745133685918032e-05, "loss": 0.321, "loss_nan_ranks": 0, "loss_rank_avg": 0.3557593822479248, "step": 965, "valid_targets_mean": 4640.1, "valid_targets_min": 2109 }, { "epoch": 1.7352415026833632, "grad_norm": 0.526841550249395, "learning_rate": 3.740757767068834e-05, "loss": 0.3022, "loss_nan_ranks": 0, "loss_rank_avg": 0.2938116788864136, "step": 970, "valid_targets_mean": 4656.8, "valid_targets_min": 1424 }, { "epoch": 1.744186046511628, "grad_norm": 0.6055246993537275, "learning_rate": 3.7363472028399476e-05, "loss": 0.3248, "loss_nan_ranks": 0, "loss_rank_avg": 0.3154802918434143, "step": 975, "valid_targets_mean": 3483.9, "valid_targets_min": 1692 }, { "epoch": 1.7531305903398926, "grad_norm": 0.603322342815491, "learning_rate": 3.7319020810124965e-05, "loss": 0.3021, "loss_nan_ranks": 0, "loss_rank_avg": 0.3003346920013428, "step": 980, "valid_targets_mean": 3828.6, "valid_targets_min": 621 }, { "epoch": 1.7620751341681573, "grad_norm": 0.5626166447337553, "learning_rate": 3.727422490055386e-05, "loss": 0.3148, "loss_nan_ranks": 0, "loss_rank_avg": 0.3034425973892212, "step": 985, "valid_targets_mean": 4099.6, "valid_targets_min": 836 }, { "epoch": 1.7710196779964222, "grad_norm": 0.4590848854306322, "learning_rate": 3.72290851912354e-05, "loss": 0.314, "loss_nan_ranks": 0, "loss_rank_avg": 0.3024485111236572, "step": 990, "valid_targets_mean": 5403.2, "valid_targets_min": 2338 }, { "epoch": 1.779964221824687, "grad_norm": 0.5634666645265822, "learning_rate": 3.718360258056133e-05, "loss": 0.3173, "loss_nan_ranks": 0, "loss_rank_avg": 0.30547595024108887, "step": 995, "valid_targets_mean": 3841.9, "valid_targets_min": 1685 }, { "epoch": 1.7889087656529516, "grad_norm": 0.5618746894535553, "learning_rate": 3.713777797374794e-05, "loss": 0.322, "loss_nan_ranks": 0, "loss_rank_avg": 0.33232662081718445, "step": 1000, "valid_targets_mean": 3674.4, "valid_targets_min": 663 }, { "epoch": 1.7978533094812166, "grad_norm": 0.6550093924031264, "learning_rate": 3.709161228281811e-05, "loss": 0.3142, "loss_nan_ranks": 0, "loss_rank_avg": 0.30034154653549194, "step": 1005, "valid_targets_mean": 3396.8, "valid_targets_min": 1109 }, { "epoch": 1.8067978533094813, "grad_norm": 0.6073692572388313, "learning_rate": 3.704510642658314e-05, "loss": 0.3203, "loss_nan_ranks": 0, "loss_rank_avg": 0.3542916178703308, "step": 1010, "valid_targets_mean": 3448.8, "valid_targets_min": 795 }, { "epoch": 1.815742397137746, "grad_norm": 0.6171396796866804, "learning_rate": 3.699826133062443e-05, "loss": 0.3118, "loss_nan_ranks": 0, "loss_rank_avg": 0.3225131630897522, "step": 1015, "valid_targets_mean": 3759.8, "valid_targets_min": 1114 }, { "epoch": 1.8246869409660107, "grad_norm": 0.6099863228762299, "learning_rate": 3.6951077927275126e-05, "loss": 0.332, "loss_nan_ranks": 0, "loss_rank_avg": 0.3298446834087372, "step": 1020, "valid_targets_mean": 3864.5, "valid_targets_min": 1052 }, { "epoch": 1.8336314847942754, "grad_norm": 0.5524141402638945, "learning_rate": 3.6903557155601503e-05, "loss": 0.3117, "loss_nan_ranks": 0, "loss_rank_avg": 0.291124165058136, "step": 1025, "valid_targets_mean": 3606.2, "valid_targets_min": 1973 }, { "epoch": 1.84257602862254, "grad_norm": 0.5169690200399784, "learning_rate": 3.685569996138431e-05, "loss": 0.3065, "loss_nan_ranks": 0, "loss_rank_avg": 0.3137836456298828, "step": 1030, "valid_targets_mean": 4619.6, "valid_targets_min": 1219 }, { "epoch": 1.851520572450805, "grad_norm": 0.5316610746415315, "learning_rate": 3.680750729709993e-05, "loss": 0.3173, "loss_nan_ranks": 0, "loss_rank_avg": 0.33356547355651855, "step": 1035, "valid_targets_mean": 4652.9, "valid_targets_min": 981 }, { "epoch": 1.8604651162790697, "grad_norm": 0.5559235856424838, "learning_rate": 3.675898012190143e-05, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.31008175015449524, "step": 1040, "valid_targets_mean": 3755.5, "valid_targets_min": 1368 }, { "epoch": 1.8694096601073347, "grad_norm": 0.6298206469639374, "learning_rate": 3.6710119401599474e-05, "loss": 0.3252, "loss_nan_ranks": 0, "loss_rank_avg": 0.33441591262817383, "step": 1045, "valid_targets_mean": 3854.9, "valid_targets_min": 1316 }, { "epoch": 1.8783542039355994, "grad_norm": 0.5389022768825737, "learning_rate": 3.6660926108643086e-05, "loss": 0.3179, "loss_nan_ranks": 0, "loss_rank_avg": 0.3052956461906433, "step": 1050, "valid_targets_mean": 3938.4, "valid_targets_min": 680 }, { "epoch": 1.887298747763864, "grad_norm": 0.5801147385776886, "learning_rate": 3.661140122210032e-05, "loss": 0.309, "loss_nan_ranks": 0, "loss_rank_avg": 0.32204878330230713, "step": 1055, "valid_targets_mean": 3663.2, "valid_targets_min": 839 }, { "epoch": 1.8962432915921288, "grad_norm": 0.5606779533763502, "learning_rate": 3.656154572763877e-05, "loss": 0.3211, "loss_nan_ranks": 0, "loss_rank_avg": 0.3348532021045685, "step": 1060, "valid_targets_mean": 3548.2, "valid_targets_min": 622 }, { "epoch": 1.9051878354203935, "grad_norm": 0.5573332010454619, "learning_rate": 3.651136061750592e-05, "loss": 0.3252, "loss_nan_ranks": 0, "loss_rank_avg": 0.3448393940925598, "step": 1065, "valid_targets_mean": 3946.6, "valid_targets_min": 748 }, { "epoch": 1.9141323792486582, "grad_norm": 0.5490778045530725, "learning_rate": 3.646084689050942e-05, "loss": 0.3189, "loss_nan_ranks": 0, "loss_rank_avg": 0.3161720633506775, "step": 1070, "valid_targets_mean": 3859.4, "valid_targets_min": 751 }, { "epoch": 1.9230769230769231, "grad_norm": 0.5894163589977383, "learning_rate": 3.641000555199725e-05, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.3114989697933197, "step": 1075, "valid_targets_mean": 3375.2, "valid_targets_min": 710 }, { "epoch": 1.9320214669051878, "grad_norm": 0.5349889235476035, "learning_rate": 3.6358837613837604e-05, "loss": 0.315, "loss_nan_ranks": 0, "loss_rank_avg": 0.30235400795936584, "step": 1080, "valid_targets_mean": 3989.0, "valid_targets_min": 1691 }, { "epoch": 1.9409660107334525, "grad_norm": 0.6736523490222415, "learning_rate": 3.630734409439887e-05, "loss": 0.3227, "loss_nan_ranks": 0, "loss_rank_avg": 0.3229427635669708, "step": 1085, "valid_targets_mean": 3905.6, "valid_targets_min": 950 }, { "epoch": 1.9499105545617175, "grad_norm": 0.5727534078817972, "learning_rate": 3.625552601852928e-05, "loss": 0.3119, "loss_nan_ranks": 0, "loss_rank_avg": 0.31192246079444885, "step": 1090, "valid_targets_mean": 3771.9, "valid_targets_min": 658 }, { "epoch": 1.9588550983899822, "grad_norm": 0.6120985202643506, "learning_rate": 3.6203384417536566e-05, "loss": 0.31, "loss_nan_ranks": 0, "loss_rank_avg": 0.3371928036212921, "step": 1095, "valid_targets_mean": 3940.8, "valid_targets_min": 1372 }, { "epoch": 1.9677996422182469, "grad_norm": 0.5549601857245118, "learning_rate": 3.615092032916736e-05, "loss": 0.3106, "loss_nan_ranks": 0, "loss_rank_avg": 0.3066266179084778, "step": 1100, "valid_targets_mean": 3876.9, "valid_targets_min": 1122 }, { "epoch": 1.9767441860465116, "grad_norm": 0.5131380359563835, "learning_rate": 3.6098134797586646e-05, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.2861686646938324, "step": 1105, "valid_targets_mean": 4285.8, "valid_targets_min": 1706 }, { "epoch": 1.9856887298747763, "grad_norm": 0.527229318850269, "learning_rate": 3.604502887335688e-05, "loss": 0.3178, "loss_nan_ranks": 0, "loss_rank_avg": 0.317037433385849, "step": 1110, "valid_targets_mean": 4532.9, "valid_targets_min": 1358 }, { "epoch": 1.994633273703041, "grad_norm": 0.6132587433714716, "learning_rate": 3.599160361341715e-05, "loss": 0.3246, "loss_nan_ranks": 0, "loss_rank_avg": 0.35272109508514404, "step": 1115, "valid_targets_mean": 4244.4, "valid_targets_min": 1862 }, { "epoch": 2.0035778175313057, "grad_norm": 0.5593406465085026, "learning_rate": 3.59378600810621e-05, "loss": 0.3091, "loss_nan_ranks": 0, "loss_rank_avg": 0.30550044775009155, "step": 1120, "valid_targets_mean": 3629.8, "valid_targets_min": 1287 }, { "epoch": 2.012522361359571, "grad_norm": 0.5559035299742234, "learning_rate": 3.588379934592078e-05, "loss": 0.3007, "loss_nan_ranks": 0, "loss_rank_avg": 0.2961064577102661, "step": 1125, "valid_targets_mean": 4219.7, "valid_targets_min": 2082 }, { "epoch": 2.0214669051878356, "grad_norm": 0.5222588666049305, "learning_rate": 3.5829422483935374e-05, "loss": 0.2991, "loss_nan_ranks": 0, "loss_rank_avg": 0.2910686135292053, "step": 1130, "valid_targets_mean": 4635.5, "valid_targets_min": 720 }, { "epoch": 2.0304114490161003, "grad_norm": 0.5492856936529431, "learning_rate": 3.577473057733975e-05, "loss": 0.2912, "loss_nan_ranks": 0, "loss_rank_avg": 0.2696704864501953, "step": 1135, "valid_targets_mean": 3424.2, "valid_targets_min": 1441 }, { "epoch": 2.039355992844365, "grad_norm": 0.5805919255184491, "learning_rate": 3.571972471463795e-05, "loss": 0.2914, "loss_nan_ranks": 0, "loss_rank_avg": 0.2642717957496643, "step": 1140, "valid_targets_mean": 3726.3, "valid_targets_min": 1936 }, { "epoch": 2.0483005366726297, "grad_norm": 0.5654677847464393, "learning_rate": 3.566440599058253e-05, "loss": 0.2984, "loss_nan_ranks": 0, "loss_rank_avg": 0.31323423981666565, "step": 1145, "valid_targets_mean": 4155.1, "valid_targets_min": 1574 }, { "epoch": 2.0572450805008944, "grad_norm": 0.6258943561807471, "learning_rate": 3.560877550615275e-05, "loss": 0.2852, "loss_nan_ranks": 0, "loss_rank_avg": 0.2951895594596863, "step": 1150, "valid_targets_mean": 3085.2, "valid_targets_min": 732 }, { "epoch": 2.066189624329159, "grad_norm": 0.48185508119836556, "learning_rate": 3.555283436853267e-05, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.277047336101532, "step": 1155, "valid_targets_mean": 4333.4, "valid_targets_min": 1674 }, { "epoch": 2.075134168157424, "grad_norm": 0.5337477447807386, "learning_rate": 3.549658369108911e-05, "loss": 0.2844, "loss_nan_ranks": 0, "loss_rank_avg": 0.290058970451355, "step": 1160, "valid_targets_mean": 4003.7, "valid_targets_min": 667 }, { "epoch": 2.084078711985689, "grad_norm": 0.573076273715761, "learning_rate": 3.544002459334952e-05, "loss": 0.2941, "loss_nan_ranks": 0, "loss_rank_avg": 0.2986866235733032, "step": 1165, "valid_targets_mean": 3509.6, "valid_targets_min": 827 }, { "epoch": 2.0930232558139537, "grad_norm": 0.6434121744773865, "learning_rate": 3.5383158200979636e-05, "loss": 0.3013, "loss_nan_ranks": 0, "loss_rank_avg": 0.29687678813934326, "step": 1170, "valid_targets_mean": 2894.1, "valid_targets_min": 1532 }, { "epoch": 2.1019677996422184, "grad_norm": 1.0345078244238066, "learning_rate": 3.532598564576117e-05, "loss": 0.2923, "loss_nan_ranks": 0, "loss_rank_avg": 0.27670419216156006, "step": 1175, "valid_targets_mean": 3932.2, "valid_targets_min": 798 }, { "epoch": 2.110912343470483, "grad_norm": 0.5405380881490202, "learning_rate": 3.526850806556919e-05, "loss": 0.302, "loss_nan_ranks": 0, "loss_rank_avg": 0.2855556011199951, "step": 1180, "valid_targets_mean": 3778.3, "valid_targets_min": 696 }, { "epoch": 2.1198568872987478, "grad_norm": 0.5976648828621719, "learning_rate": 3.521072660434952e-05, "loss": 0.2899, "loss_nan_ranks": 0, "loss_rank_avg": 0.28265494108200073, "step": 1185, "valid_targets_mean": 3455.8, "valid_targets_min": 866 }, { "epoch": 2.1288014311270125, "grad_norm": 0.518386120621355, "learning_rate": 3.5152642412095984e-05, "loss": 0.2869, "loss_nan_ranks": 0, "loss_rank_avg": 0.2857966721057892, "step": 1190, "valid_targets_mean": 4677.8, "valid_targets_min": 2305 }, { "epoch": 2.137745974955277, "grad_norm": 0.5447094720161839, "learning_rate": 3.5094256644827474e-05, "loss": 0.3016, "loss_nan_ranks": 0, "loss_rank_avg": 0.3032097816467285, "step": 1195, "valid_targets_mean": 4234.6, "valid_targets_min": 1055 }, { "epoch": 2.146690518783542, "grad_norm": 0.5406564490251188, "learning_rate": 3.503557046456501e-05, "loss": 0.2806, "loss_nan_ranks": 0, "loss_rank_avg": 0.2764890193939209, "step": 1200, "valid_targets_mean": 4025.9, "valid_targets_min": 1610 }, { "epoch": 2.1556350626118066, "grad_norm": 0.5167292603339387, "learning_rate": 3.4976585039308535e-05, "loss": 0.3053, "loss_nan_ranks": 0, "loss_rank_avg": 0.2947821617126465, "step": 1205, "valid_targets_mean": 4129.1, "valid_targets_min": 1605 }, { "epoch": 2.1645796064400717, "grad_norm": 0.7469544699185315, "learning_rate": 3.491730154301372e-05, "loss": 0.3068, "loss_nan_ranks": 0, "loss_rank_avg": 0.3116210401058197, "step": 1210, "valid_targets_mean": 3251.5, "valid_targets_min": 1606 }, { "epoch": 2.1735241502683365, "grad_norm": 0.5769662832718492, "learning_rate": 3.485772115556859e-05, "loss": 0.2967, "loss_nan_ranks": 0, "loss_rank_avg": 0.2989100217819214, "step": 1215, "valid_targets_mean": 3717.8, "valid_targets_min": 1327 }, { "epoch": 2.182468694096601, "grad_norm": 0.5888498917346773, "learning_rate": 3.4797845062770045e-05, "loss": 0.2985, "loss_nan_ranks": 0, "loss_rank_avg": 0.2971697747707367, "step": 1220, "valid_targets_mean": 3346.9, "valid_targets_min": 1827 }, { "epoch": 2.191413237924866, "grad_norm": 0.5385601523875473, "learning_rate": 3.473767445630022e-05, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.2714182436466217, "step": 1225, "valid_targets_mean": 3834.8, "valid_targets_min": 1393 }, { "epoch": 2.2003577817531306, "grad_norm": 0.5095146941186255, "learning_rate": 3.467721053370284e-05, "loss": 0.2914, "loss_nan_ranks": 0, "loss_rank_avg": 0.3141205608844757, "step": 1230, "valid_targets_mean": 4676.5, "valid_targets_min": 1372 }, { "epoch": 2.2093023255813953, "grad_norm": 0.6020826429693371, "learning_rate": 3.4616454498359306e-05, "loss": 0.3047, "loss_nan_ranks": 0, "loss_rank_avg": 0.29343247413635254, "step": 1235, "valid_targets_mean": 3196.5, "valid_targets_min": 1524 }, { "epoch": 2.21824686940966, "grad_norm": 0.5403496852716332, "learning_rate": 3.4555407559464825e-05, "loss": 0.3081, "loss_nan_ranks": 0, "loss_rank_avg": 0.3097769618034363, "step": 1240, "valid_targets_mean": 4774.0, "valid_targets_min": 1541 }, { "epoch": 2.2271914132379247, "grad_norm": 0.5120840671547888, "learning_rate": 3.4494070932004274e-05, "loss": 0.3015, "loss_nan_ranks": 0, "loss_rank_avg": 0.284509539604187, "step": 1245, "valid_targets_mean": 4208.5, "valid_targets_min": 1295 }, { "epoch": 2.23613595706619, "grad_norm": 0.5914343254506964, "learning_rate": 3.4432445836728055e-05, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.2789539694786072, "step": 1250, "valid_targets_mean": 4127.3, "valid_targets_min": 872 }, { "epoch": 2.2450805008944545, "grad_norm": 0.5645415624490583, "learning_rate": 3.4370533500127794e-05, "loss": 0.3038, "loss_nan_ranks": 0, "loss_rank_avg": 0.30053240060806274, "step": 1255, "valid_targets_mean": 3852.9, "valid_targets_min": 1580 }, { "epoch": 2.2540250447227193, "grad_norm": 0.5806828746585898, "learning_rate": 3.430833515441193e-05, "loss": 0.3006, "loss_nan_ranks": 0, "loss_rank_avg": 0.31069332361221313, "step": 1260, "valid_targets_mean": 3907.2, "valid_targets_min": 1436 }, { "epoch": 2.262969588550984, "grad_norm": 0.5626831319283796, "learning_rate": 3.424585203748119e-05, "loss": 0.3021, "loss_nan_ranks": 0, "loss_rank_avg": 0.3043138086795807, "step": 1265, "valid_targets_mean": 4106.3, "valid_targets_min": 1718 }, { "epoch": 2.2719141323792487, "grad_norm": 0.5419828214534085, "learning_rate": 3.4183085392903965e-05, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.28403908014297485, "step": 1270, "valid_targets_mean": 3841.6, "valid_targets_min": 1794 }, { "epoch": 2.2808586762075134, "grad_norm": 0.5881372643406569, "learning_rate": 3.41200364698915e-05, "loss": 0.2899, "loss_nan_ranks": 0, "loss_rank_avg": 0.30241650342941284, "step": 1275, "valid_targets_mean": 3480.4, "valid_targets_min": 1784 }, { "epoch": 2.289803220035778, "grad_norm": 0.5027336153791081, "learning_rate": 3.405670652327313e-05, "loss": 0.3028, "loss_nan_ranks": 0, "loss_rank_avg": 0.28809165954589844, "step": 1280, "valid_targets_mean": 4556.8, "valid_targets_min": 2196 }, { "epoch": 2.298747763864043, "grad_norm": 0.5959906299682153, "learning_rate": 3.399309681347123e-05, "loss": 0.2956, "loss_nan_ranks": 0, "loss_rank_avg": 0.305059552192688, "step": 1285, "valid_targets_mean": 4217.6, "valid_targets_min": 1517 }, { "epoch": 2.3076923076923075, "grad_norm": 0.47359707150452485, "learning_rate": 3.392920860647617e-05, "loss": 0.2975, "loss_nan_ranks": 0, "loss_rank_avg": 0.3012004792690277, "step": 1290, "valid_targets_mean": 4578.0, "valid_targets_min": 1297 }, { "epoch": 2.3166368515205726, "grad_norm": 0.5369785466687547, "learning_rate": 3.3865043173821074e-05, "loss": 0.2854, "loss_nan_ranks": 0, "loss_rank_avg": 0.2727619409561157, "step": 1295, "valid_targets_mean": 3760.1, "valid_targets_min": 1539 }, { "epoch": 2.3255813953488373, "grad_norm": 0.57676869627547, "learning_rate": 3.380060179255656e-05, "loss": 0.3036, "loss_nan_ranks": 0, "loss_rank_avg": 0.31669068336486816, "step": 1300, "valid_targets_mean": 3117.1, "valid_targets_min": 1662 }, { "epoch": 2.334525939177102, "grad_norm": 0.5283474540373422, "learning_rate": 3.37358857452253e-05, "loss": 0.3005, "loss_nan_ranks": 0, "loss_rank_avg": 0.303724467754364, "step": 1305, "valid_targets_mean": 4069.7, "valid_targets_min": 1847 }, { "epoch": 2.3434704830053668, "grad_norm": 0.48205035846371097, "learning_rate": 3.367089631983651e-05, "loss": 0.3018, "loss_nan_ranks": 0, "loss_rank_avg": 0.27161988615989685, "step": 1310, "valid_targets_mean": 4610.1, "valid_targets_min": 625 }, { "epoch": 2.3524150268336315, "grad_norm": 0.5018852845147292, "learning_rate": 3.360563480984029e-05, "loss": 0.2908, "loss_nan_ranks": 0, "loss_rank_avg": 0.2748308479785919, "step": 1315, "valid_targets_mean": 4035.2, "valid_targets_min": 1483 }, { "epoch": 2.361359570661896, "grad_norm": 0.6082741514089518, "learning_rate": 3.3540102514101904e-05, "loss": 0.3009, "loss_nan_ranks": 0, "loss_rank_avg": 0.2947337031364441, "step": 1320, "valid_targets_mean": 3258.3, "valid_targets_min": 863 }, { "epoch": 2.370304114490161, "grad_norm": 0.5119247145544926, "learning_rate": 3.347430073687592e-05, "loss": 0.3057, "loss_nan_ranks": 0, "loss_rank_avg": 0.3057720363140106, "step": 1325, "valid_targets_mean": 5325.2, "valid_targets_min": 2447 }, { "epoch": 2.3792486583184256, "grad_norm": 0.5545132272446245, "learning_rate": 3.340823078778024e-05, "loss": 0.2904, "loss_nan_ranks": 0, "loss_rank_avg": 0.329643577337265, "step": 1330, "valid_targets_mean": 4703.9, "valid_targets_min": 822 }, { "epoch": 2.3881932021466907, "grad_norm": 0.5611524701506613, "learning_rate": 3.3341893981770086e-05, "loss": 0.2999, "loss_nan_ranks": 0, "loss_rank_avg": 0.28520113229751587, "step": 1335, "valid_targets_mean": 3347.0, "valid_targets_min": 1432 }, { "epoch": 2.3971377459749554, "grad_norm": 0.5360100187741607, "learning_rate": 3.327529163911174e-05, "loss": 0.29, "loss_nan_ranks": 0, "loss_rank_avg": 0.27396950125694275, "step": 1340, "valid_targets_mean": 4146.1, "valid_targets_min": 1777 }, { "epoch": 2.40608228980322, "grad_norm": 0.5232182650009217, "learning_rate": 3.320842508535636e-05, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.294733464717865, "step": 1345, "valid_targets_mean": 3978.9, "valid_targets_min": 1969 }, { "epoch": 2.415026833631485, "grad_norm": 0.6341635562060696, "learning_rate": 3.314129565131355e-05, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.2832929491996765, "step": 1350, "valid_targets_mean": 3560.1, "valid_targets_min": 1561 }, { "epoch": 2.4239713774597496, "grad_norm": 0.5512350224651154, "learning_rate": 3.3073904673024854e-05, "loss": 0.3018, "loss_nan_ranks": 0, "loss_rank_avg": 0.2930479943752289, "step": 1355, "valid_targets_mean": 4085.1, "valid_targets_min": 1762 }, { "epoch": 2.4329159212880143, "grad_norm": 0.5089586101245678, "learning_rate": 3.300625349173723e-05, "loss": 0.2983, "loss_nan_ranks": 0, "loss_rank_avg": 0.304643452167511, "step": 1360, "valid_targets_mean": 4801.9, "valid_targets_min": 1725 }, { "epoch": 2.441860465116279, "grad_norm": 0.5712139371917907, "learning_rate": 3.29383434538763e-05, "loss": 0.2893, "loss_nan_ranks": 0, "loss_rank_avg": 0.290343314409256, "step": 1365, "valid_targets_mean": 4540.5, "valid_targets_min": 1504 }, { "epoch": 2.4508050089445437, "grad_norm": 0.6223435319453212, "learning_rate": 3.287017591101957e-05, "loss": 0.3061, "loss_nan_ranks": 0, "loss_rank_avg": 0.3304898738861084, "step": 1370, "valid_targets_mean": 3340.2, "valid_targets_min": 1231 }, { "epoch": 2.4597495527728084, "grad_norm": 0.548835445285655, "learning_rate": 3.2801752219869536e-05, "loss": 0.2962, "loss_nan_ranks": 0, "loss_rank_avg": 0.29954493045806885, "step": 1375, "valid_targets_mean": 3768.6, "valid_targets_min": 1507 }, { "epoch": 2.4686940966010735, "grad_norm": 0.5273857106581554, "learning_rate": 3.273307374222667e-05, "loss": 0.2956, "loss_nan_ranks": 0, "loss_rank_avg": 0.29336017370224, "step": 1380, "valid_targets_mean": 3922.8, "valid_targets_min": 527 }, { "epoch": 2.4776386404293382, "grad_norm": 0.461716385493086, "learning_rate": 3.266414184496233e-05, "loss": 0.2867, "loss_nan_ranks": 0, "loss_rank_avg": 0.29551392793655396, "step": 1385, "valid_targets_mean": 4960.4, "valid_targets_min": 1853 }, { "epoch": 2.486583184257603, "grad_norm": 0.5233231328137401, "learning_rate": 3.2594957899991566e-05, "loss": 0.3022, "loss_nan_ranks": 0, "loss_rank_avg": 0.30951058864593506, "step": 1390, "valid_targets_mean": 4894.6, "valid_targets_min": 1705 }, { "epoch": 2.4955277280858676, "grad_norm": 0.5483474982667876, "learning_rate": 3.2525523284245766e-05, "loss": 0.2837, "loss_nan_ranks": 0, "loss_rank_avg": 0.2956357002258301, "step": 1395, "valid_targets_mean": 4093.8, "valid_targets_min": 1158 }, { "epoch": 2.5044722719141324, "grad_norm": 0.5470117760522922, "learning_rate": 3.245583937964532e-05, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.29229462146759033, "step": 1400, "valid_targets_mean": 4277.4, "valid_targets_min": 1526 }, { "epoch": 2.513416815742397, "grad_norm": 0.5692210997559785, "learning_rate": 3.238590757307206e-05, "loss": 0.2907, "loss_nan_ranks": 0, "loss_rank_avg": 0.28669655323028564, "step": 1405, "valid_targets_mean": 4107.9, "valid_targets_min": 2476 }, { "epoch": 2.5223613595706618, "grad_norm": 0.5999394928447368, "learning_rate": 3.2315729256341686e-05, "loss": 0.3037, "loss_nan_ranks": 0, "loss_rank_avg": 0.3192169666290283, "step": 1410, "valid_targets_mean": 3115.0, "valid_targets_min": 482 }, { "epoch": 2.531305903398927, "grad_norm": 0.5067438226356301, "learning_rate": 3.2245305826176063e-05, "loss": 0.2978, "loss_nan_ranks": 0, "loss_rank_avg": 0.30782514810562134, "step": 1415, "valid_targets_mean": 4176.4, "valid_targets_min": 1489 }, { "epoch": 2.5402504472271916, "grad_norm": 0.5670153939929208, "learning_rate": 3.217463868417541e-05, "loss": 0.2904, "loss_nan_ranks": 0, "loss_rank_avg": 0.2898740768432617, "step": 1420, "valid_targets_mean": 4424.1, "valid_targets_min": 877 }, { "epoch": 2.5491949910554563, "grad_norm": 0.5320142185017729, "learning_rate": 3.2103729236790434e-05, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.3135606646537781, "step": 1425, "valid_targets_mean": 4807.0, "valid_targets_min": 1759 }, { "epoch": 2.558139534883721, "grad_norm": 0.5377685633015429, "learning_rate": 3.203257889529428e-05, "loss": 0.3005, "loss_nan_ranks": 0, "loss_rank_avg": 0.3080807626247406, "step": 1430, "valid_targets_mean": 4145.8, "valid_targets_min": 1470 }, { "epoch": 2.5670840787119857, "grad_norm": 0.9791809632288329, "learning_rate": 3.196118907575452e-05, "loss": 0.3046, "loss_nan_ranks": 0, "loss_rank_avg": 0.32376378774642944, "step": 1435, "valid_targets_mean": 2997.5, "valid_targets_min": 1849 }, { "epoch": 2.5760286225402504, "grad_norm": 0.5199580890989173, "learning_rate": 3.188956119900491e-05, "loss": 0.2942, "loss_nan_ranks": 0, "loss_rank_avg": 0.27378737926483154, "step": 1440, "valid_targets_mean": 3816.5, "valid_targets_min": 835 }, { "epoch": 2.584973166368515, "grad_norm": 0.5360826743649624, "learning_rate": 3.181769669061713e-05, "loss": 0.2917, "loss_nan_ranks": 0, "loss_rank_avg": 0.3072686791419983, "step": 1445, "valid_targets_mean": 3774.3, "valid_targets_min": 529 }, { "epoch": 2.59391771019678, "grad_norm": 0.5009124650640604, "learning_rate": 3.174559698087244e-05, "loss": 0.3046, "loss_nan_ranks": 0, "loss_rank_avg": 0.2810012698173523, "step": 1450, "valid_targets_mean": 3802.2, "valid_targets_min": 1494 }, { "epoch": 2.6028622540250446, "grad_norm": 0.5463511449260107, "learning_rate": 3.1673263504733136e-05, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.28489333391189575, "step": 1455, "valid_targets_mean": 3726.8, "valid_targets_min": 737 }, { "epoch": 2.6118067978533093, "grad_norm": 0.6037481930684999, "learning_rate": 3.160069770181411e-05, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.3057287335395813, "step": 1460, "valid_targets_mean": 3358.2, "valid_targets_min": 1491 }, { "epoch": 2.620751341681574, "grad_norm": 0.504749731879137, "learning_rate": 3.152790101635408e-05, "loss": 0.2903, "loss_nan_ranks": 0, "loss_rank_avg": 0.2742614150047302, "step": 1465, "valid_targets_mean": 4562.9, "valid_targets_min": 710 }, { "epoch": 2.629695885509839, "grad_norm": 0.5501576116598611, "learning_rate": 3.145487489718692e-05, "loss": 0.3005, "loss_nan_ranks": 0, "loss_rank_avg": 0.29383790493011475, "step": 1470, "valid_targets_mean": 4014.8, "valid_targets_min": 1590 }, { "epoch": 2.638640429338104, "grad_norm": 0.6055643551418105, "learning_rate": 3.138162079771278e-05, "loss": 0.2971, "loss_nan_ranks": 0, "loss_rank_avg": 0.30859410762786865, "step": 1475, "valid_targets_mean": 3838.2, "valid_targets_min": 1093 }, { "epoch": 2.6475849731663685, "grad_norm": 0.6069047010077838, "learning_rate": 3.1308140175869216e-05, "loss": 0.2978, "loss_nan_ranks": 0, "loss_rank_avg": 0.29912006855010986, "step": 1480, "valid_targets_mean": 3958.1, "valid_targets_min": 1677 }, { "epoch": 2.6565295169946332, "grad_norm": 0.5738673372037972, "learning_rate": 3.123443449410211e-05, "loss": 0.291, "loss_nan_ranks": 0, "loss_rank_avg": 0.29722023010253906, "step": 1485, "valid_targets_mean": 3427.4, "valid_targets_min": 527 }, { "epoch": 2.665474060822898, "grad_norm": 0.5133193729173582, "learning_rate": 3.1160505219336594e-05, "loss": 0.3037, "loss_nan_ranks": 0, "loss_rank_avg": 0.26430267095565796, "step": 1490, "valid_targets_mean": 4530.4, "valid_targets_min": 1263 }, { "epoch": 2.6744186046511627, "grad_norm": 0.5734809599747189, "learning_rate": 3.108635382294787e-05, "loss": 0.2919, "loss_nan_ranks": 0, "loss_rank_avg": 0.2972019910812378, "step": 1495, "valid_targets_mean": 3677.4, "valid_targets_min": 1602 }, { "epoch": 2.683363148479428, "grad_norm": 0.5428678152914708, "learning_rate": 3.101198178073189e-05, "loss": 0.2907, "loss_nan_ranks": 0, "loss_rank_avg": 0.2788999080657959, "step": 1500, "valid_targets_mean": 4050.4, "valid_targets_min": 1841 }, { "epoch": 2.6923076923076925, "grad_norm": 0.5346131939463955, "learning_rate": 3.093739057287603e-05, "loss": 0.2943, "loss_nan_ranks": 0, "loss_rank_avg": 0.3178672790527344, "step": 1505, "valid_targets_mean": 4216.1, "valid_targets_min": 2013 }, { "epoch": 2.701252236135957, "grad_norm": 0.5546663057017248, "learning_rate": 3.086258168392957e-05, "loss": 0.2927, "loss_nan_ranks": 0, "loss_rank_avg": 0.2941766381263733, "step": 1510, "valid_targets_mean": 4037.4, "valid_targets_min": 2094 }, { "epoch": 2.710196779964222, "grad_norm": 0.6007631310576768, "learning_rate": 3.0787556602774195e-05, "loss": 0.2995, "loss_nan_ranks": 0, "loss_rank_avg": 0.3104172348976135, "step": 1515, "valid_targets_mean": 3226.3, "valid_targets_min": 699 }, { "epoch": 2.7191413237924866, "grad_norm": 0.5246652173150378, "learning_rate": 3.071231682259437e-05, "loss": 0.2993, "loss_nan_ranks": 0, "loss_rank_avg": 0.31006383895874023, "step": 1520, "valid_targets_mean": 3979.1, "valid_targets_min": 1929 }, { "epoch": 2.7280858676207513, "grad_norm": 0.4917003682982894, "learning_rate": 3.063686384084756e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.3010290265083313, "step": 1525, "valid_targets_mean": 4885.2, "valid_targets_min": 1695 }, { "epoch": 2.737030411449016, "grad_norm": 0.5164120363148196, "learning_rate": 3.05611991592345e-05, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.28511500358581543, "step": 1530, "valid_targets_mean": 4332.8, "valid_targets_min": 2130 }, { "epoch": 2.7459749552772807, "grad_norm": 0.546710521171786, "learning_rate": 3.0485324283669288e-05, "loss": 0.2976, "loss_nan_ranks": 0, "loss_rank_avg": 0.2977195382118225, "step": 1535, "valid_targets_mean": 3932.6, "valid_targets_min": 835 }, { "epoch": 2.7549194991055455, "grad_norm": 0.4987699796804533, "learning_rate": 3.0409240724249334e-05, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.28613370656967163, "step": 1540, "valid_targets_mean": 4534.4, "valid_targets_min": 932 }, { "epoch": 2.76386404293381, "grad_norm": 0.5318282523003093, "learning_rate": 3.033294999522545e-05, "loss": 0.291, "loss_nan_ranks": 0, "loss_rank_avg": 0.29021310806274414, "step": 1545, "valid_targets_mean": 4185.5, "valid_targets_min": 1805 }, { "epoch": 2.772808586762075, "grad_norm": 0.5878956920224669, "learning_rate": 3.0256453614971594e-05, "loss": 0.3034, "loss_nan_ranks": 0, "loss_rank_avg": 0.2993810772895813, "step": 1550, "valid_targets_mean": 3415.2, "valid_targets_min": 715 }, { "epoch": 2.78175313059034, "grad_norm": 0.5178111135961665, "learning_rate": 3.017975310595469e-05, "loss": 0.3122, "loss_nan_ranks": 0, "loss_rank_avg": 0.32516568899154663, "step": 1555, "valid_targets_mean": 4719.7, "valid_targets_min": 2013 }, { "epoch": 2.7906976744186047, "grad_norm": 0.5581315425684471, "learning_rate": 3.0102849994704343e-05, "loss": 0.3007, "loss_nan_ranks": 0, "loss_rank_avg": 0.2962647080421448, "step": 1560, "valid_targets_mean": 3870.3, "valid_targets_min": 1774 }, { "epoch": 2.7996422182468694, "grad_norm": 0.6256471631470097, "learning_rate": 3.0025745811782444e-05, "loss": 0.3041, "loss_nan_ranks": 0, "loss_rank_avg": 0.29967325925827026, "step": 1565, "valid_targets_mean": 3177.1, "valid_targets_min": 772 }, { "epoch": 2.808586762075134, "grad_norm": 0.5320691282381641, "learning_rate": 2.994844209175269e-05, "loss": 0.2977, "loss_nan_ranks": 0, "loss_rank_avg": 0.331190824508667, "step": 1570, "valid_targets_mean": 4638.9, "valid_targets_min": 1626 }, { "epoch": 2.817531305903399, "grad_norm": 0.6752470008469027, "learning_rate": 2.987094037315008e-05, "loss": 0.2964, "loss_nan_ranks": 0, "loss_rank_avg": 0.3196222186088562, "step": 1575, "valid_targets_mean": 2458.3, "valid_targets_min": 658 }, { "epoch": 2.8264758497316635, "grad_norm": 0.5531523191801033, "learning_rate": 2.9793242198450258e-05, "loss": 0.2781, "loss_nan_ranks": 0, "loss_rank_avg": 0.28398263454437256, "step": 1580, "valid_targets_mean": 4128.9, "valid_targets_min": 1775 }, { "epoch": 2.8354203935599287, "grad_norm": 0.5237471309819827, "learning_rate": 2.9715349114038825e-05, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.2685989737510681, "step": 1585, "valid_targets_mean": 5779.9, "valid_targets_min": 1305 }, { "epoch": 2.8443649373881934, "grad_norm": 0.47372842550809013, "learning_rate": 2.9637262670180597e-05, "loss": 0.2924, "loss_nan_ranks": 0, "loss_rank_avg": 0.29568806290626526, "step": 1590, "valid_targets_mean": 4608.0, "valid_targets_min": 607 }, { "epoch": 2.853309481216458, "grad_norm": 0.5192555722225825, "learning_rate": 2.955898442098869e-05, "loss": 0.2932, "loss_nan_ranks": 0, "loss_rank_avg": 0.28541460633277893, "step": 1595, "valid_targets_mean": 4063.2, "valid_targets_min": 919 }, { "epoch": 2.862254025044723, "grad_norm": 0.5309547559574028, "learning_rate": 2.948051592439363e-05, "loss": 0.2887, "loss_nan_ranks": 0, "loss_rank_avg": 0.31091922521591187, "step": 1600, "valid_targets_mean": 3888.9, "valid_targets_min": 823 }, { "epoch": 2.8711985688729875, "grad_norm": 0.5461932654893836, "learning_rate": 2.9401858742112334e-05, "loss": 0.2952, "loss_nan_ranks": 0, "loss_rank_avg": 0.30643460154533386, "step": 1605, "valid_targets_mean": 3989.2, "valid_targets_min": 1666 }, { "epoch": 2.8801431127012522, "grad_norm": 0.5151199812668427, "learning_rate": 2.9323014439617044e-05, "loss": 0.2969, "loss_nan_ranks": 0, "loss_rank_avg": 0.3191748559474945, "step": 1610, "valid_targets_mean": 4541.9, "valid_targets_min": 2209 }, { "epoch": 2.889087656529517, "grad_norm": 0.452227709754697, "learning_rate": 2.924398458610414e-05, "loss": 0.2677, "loss_nan_ranks": 0, "loss_rank_avg": 0.23286093771457672, "step": 1615, "valid_targets_mean": 4696.9, "valid_targets_min": 2143 }, { "epoch": 2.8980322003577816, "grad_norm": 0.5294903977491242, "learning_rate": 2.9164770754462926e-05, "loss": 0.2983, "loss_nan_ranks": 0, "loss_rank_avg": 0.27453750371932983, "step": 1620, "valid_targets_mean": 4409.6, "valid_targets_min": 2448 }, { "epoch": 2.9069767441860463, "grad_norm": 0.5116227108871184, "learning_rate": 2.9085374521244333e-05, "loss": 0.2839, "loss_nan_ranks": 0, "loss_rank_avg": 0.2921096682548523, "step": 1625, "valid_targets_mean": 4203.6, "valid_targets_min": 774 }, { "epoch": 2.915921288014311, "grad_norm": 0.8886084421935505, "learning_rate": 2.900579746662954e-05, "loss": 0.2994, "loss_nan_ranks": 0, "loss_rank_avg": 0.2785966992378235, "step": 1630, "valid_targets_mean": 4256.9, "valid_targets_min": 1439 }, { "epoch": 2.9248658318425758, "grad_norm": 0.5165202216086147, "learning_rate": 2.8926041174398496e-05, "loss": 0.2903, "loss_nan_ranks": 0, "loss_rank_avg": 0.2874126434326172, "step": 1635, "valid_targets_mean": 3910.6, "valid_targets_min": 1567 }, { "epoch": 2.933810375670841, "grad_norm": 0.5227694759657353, "learning_rate": 2.8846107231898445e-05, "loss": 0.2982, "loss_nan_ranks": 0, "loss_rank_avg": 0.2759662866592407, "step": 1640, "valid_targets_mean": 3917.8, "valid_targets_min": 928 }, { "epoch": 2.9427549194991056, "grad_norm": 0.610425871678501, "learning_rate": 2.8765997230012295e-05, "loss": 0.2952, "loss_nan_ranks": 0, "loss_rank_avg": 0.28333795070648193, "step": 1645, "valid_targets_mean": 4170.1, "valid_targets_min": 2193 }, { "epoch": 2.9516994633273703, "grad_norm": 0.46116236306935077, "learning_rate": 2.868571276312698e-05, "loss": 0.2866, "loss_nan_ranks": 0, "loss_rank_avg": 0.28075987100601196, "step": 1650, "valid_targets_mean": 4360.5, "valid_targets_min": 1737 }, { "epoch": 2.960644007155635, "grad_norm": 0.5095418283669151, "learning_rate": 2.860525542910171e-05, "loss": 0.2839, "loss_nan_ranks": 0, "loss_rank_avg": 0.2718711495399475, "step": 1655, "valid_targets_mean": 3928.2, "valid_targets_min": 1604 }, { "epoch": 2.9695885509838997, "grad_norm": 0.5085610495904306, "learning_rate": 2.852462682923619e-05, "loss": 0.2815, "loss_nan_ranks": 0, "loss_rank_avg": 0.2917214334011078, "step": 1660, "valid_targets_mean": 3901.8, "valid_targets_min": 1275 }, { "epoch": 2.9785330948121644, "grad_norm": 0.5658892685832217, "learning_rate": 2.844382856823872e-05, "loss": 0.2934, "loss_nan_ranks": 0, "loss_rank_avg": 0.29110509157180786, "step": 1665, "valid_targets_mean": 3285.5, "valid_targets_min": 690 }, { "epoch": 2.9874776386404296, "grad_norm": 0.6573066368722159, "learning_rate": 2.8362862254194298e-05, "loss": 0.29, "loss_nan_ranks": 0, "loss_rank_avg": 0.28502312302589417, "step": 1670, "valid_targets_mean": 4089.2, "valid_targets_min": 787 }, { "epoch": 2.9964221824686943, "grad_norm": 0.5079392607819926, "learning_rate": 2.8281729498532574e-05, "loss": 0.312, "loss_nan_ranks": 0, "loss_rank_avg": 0.3002755045890808, "step": 1675, "valid_targets_mean": 4365.2, "valid_targets_min": 1049 }, { "epoch": 3.005366726296959, "grad_norm": 0.5393232205748715, "learning_rate": 2.8200431915995805e-05, "loss": 0.2826, "loss_nan_ranks": 0, "loss_rank_avg": 0.28886353969573975, "step": 1680, "valid_targets_mean": 3904.8, "valid_targets_min": 863 }, { "epoch": 3.0143112701252237, "grad_norm": 0.5476424824827836, "learning_rate": 2.8118971124606712e-05, "loss": 0.2629, "loss_nan_ranks": 0, "loss_rank_avg": 0.2710658311843872, "step": 1685, "valid_targets_mean": 4062.5, "valid_targets_min": 2017 }, { "epoch": 3.0232558139534884, "grad_norm": 0.606499437576894, "learning_rate": 2.8037348745636274e-05, "loss": 0.2872, "loss_nan_ranks": 0, "loss_rank_avg": 0.2897275388240814, "step": 1690, "valid_targets_mean": 3168.9, "valid_targets_min": 1034 }, { "epoch": 3.032200357781753, "grad_norm": 0.5222073176909986, "learning_rate": 2.7955566403571464e-05, "loss": 0.2845, "loss_nan_ranks": 0, "loss_rank_avg": 0.26425305008888245, "step": 1695, "valid_targets_mean": 4216.6, "valid_targets_min": 1906 }, { "epoch": 3.041144901610018, "grad_norm": 0.533081866038887, "learning_rate": 2.78736257260829e-05, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.2789760231971741, "step": 1700, "valid_targets_mean": 4355.0, "valid_targets_min": 1674 }, { "epoch": 3.0500894454382825, "grad_norm": 0.5395830050252504, "learning_rate": 2.7791528343992494e-05, "loss": 0.2914, "loss_nan_ranks": 0, "loss_rank_avg": 0.2874540090560913, "step": 1705, "valid_targets_mean": 3905.8, "valid_targets_min": 1662 }, { "epoch": 3.0590339892665472, "grad_norm": 0.5327375583639009, "learning_rate": 2.7709275891240936e-05, "loss": 0.2751, "loss_nan_ranks": 0, "loss_rank_avg": 0.2773253917694092, "step": 1710, "valid_targets_mean": 3790.8, "valid_targets_min": 1228 }, { "epoch": 3.067978533094812, "grad_norm": 0.5332213202740119, "learning_rate": 2.7626870004855236e-05, "loss": 0.2732, "loss_nan_ranks": 0, "loss_rank_avg": 0.2752811312675476, "step": 1715, "valid_targets_mean": 4314.0, "valid_targets_min": 2290 }, { "epoch": 3.076923076923077, "grad_norm": 0.5771000275440432, "learning_rate": 2.7544312324916088e-05, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.3129065930843353, "step": 1720, "valid_targets_mean": 3639.2, "valid_targets_min": 1703 }, { "epoch": 3.085867620751342, "grad_norm": 0.4926160303249595, "learning_rate": 2.7461604494525257e-05, "loss": 0.2681, "loss_nan_ranks": 0, "loss_rank_avg": 0.27431702613830566, "step": 1725, "valid_targets_mean": 4959.2, "valid_targets_min": 1500 }, { "epoch": 3.0948121645796065, "grad_norm": 0.5440762244035418, "learning_rate": 2.7378748159772888e-05, "loss": 0.2668, "loss_nan_ranks": 0, "loss_rank_avg": 0.2572042942047119, "step": 1730, "valid_targets_mean": 3845.3, "valid_targets_min": 867 }, { "epoch": 3.103756708407871, "grad_norm": 0.5468975063253847, "learning_rate": 2.7295744969704725e-05, "loss": 0.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.2830193340778351, "step": 1735, "valid_targets_mean": 3994.4, "valid_targets_min": 793 }, { "epoch": 3.112701252236136, "grad_norm": 0.5247791983633943, "learning_rate": 2.7212596576289264e-05, "loss": 0.2749, "loss_nan_ranks": 0, "loss_rank_avg": 0.25497889518737793, "step": 1740, "valid_targets_mean": 3932.6, "valid_targets_min": 867 }, { "epoch": 3.1216457960644006, "grad_norm": 0.5097180897051293, "learning_rate": 2.712930463438496e-05, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.2678571343421936, "step": 1745, "valid_targets_mean": 4393.1, "valid_targets_min": 1763 }, { "epoch": 3.1305903398926653, "grad_norm": 0.5054371550866157, "learning_rate": 2.7045870801707194e-05, "loss": 0.2761, "loss_nan_ranks": 0, "loss_rank_avg": 0.2683069109916687, "step": 1750, "valid_targets_mean": 4437.9, "valid_targets_min": 1725 }, { "epoch": 3.13953488372093, "grad_norm": 0.5389786007076532, "learning_rate": 2.6962296738795344e-05, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.29220160841941833, "step": 1755, "valid_targets_mean": 4123.8, "valid_targets_min": 579 }, { "epoch": 3.148479427549195, "grad_norm": 0.5762090201207496, "learning_rate": 2.687858410897971e-05, "loss": 0.2636, "loss_nan_ranks": 0, "loss_rank_avg": 0.25318244099617004, "step": 1760, "valid_targets_mean": 3570.9, "valid_targets_min": 743 }, { "epoch": 3.15742397137746, "grad_norm": 0.5279696697699028, "learning_rate": 2.679473457834842e-05, "loss": 0.2916, "loss_nan_ranks": 0, "loss_rank_avg": 0.29287105798721313, "step": 1765, "valid_targets_mean": 4093.7, "valid_targets_min": 2342 }, { "epoch": 3.1663685152057246, "grad_norm": 0.6183882195312416, "learning_rate": 2.6710749815714262e-05, "loss": 0.2707, "loss_nan_ranks": 0, "loss_rank_avg": 0.26889514923095703, "step": 1770, "valid_targets_mean": 3194.8, "valid_targets_min": 676 }, { "epoch": 3.1753130590339893, "grad_norm": 0.5656736312850078, "learning_rate": 2.6626631492581475e-05, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.28966403007507324, "step": 1775, "valid_targets_mean": 3782.7, "valid_targets_min": 1258 }, { "epoch": 3.184257602862254, "grad_norm": 0.5484222792379775, "learning_rate": 2.654238128311249e-05, "loss": 0.2845, "loss_nan_ranks": 0, "loss_rank_avg": 0.2807530164718628, "step": 1780, "valid_targets_mean": 3794.1, "valid_targets_min": 1944 }, { "epoch": 3.1932021466905187, "grad_norm": 0.5453822622258856, "learning_rate": 2.645800086409458e-05, "loss": 0.2761, "loss_nan_ranks": 0, "loss_rank_avg": 0.2747189402580261, "step": 1785, "valid_targets_mean": 4427.3, "valid_targets_min": 1608 }, { "epoch": 3.2021466905187834, "grad_norm": 0.5001051263184161, "learning_rate": 2.637349191490654e-05, "loss": 0.2796, "loss_nan_ranks": 0, "loss_rank_avg": 0.2797410488128662, "step": 1790, "valid_targets_mean": 4777.8, "valid_targets_min": 2640 }, { "epoch": 3.211091234347048, "grad_norm": 0.5575267617456836, "learning_rate": 2.6288856117485216e-05, "loss": 0.2896, "loss_nan_ranks": 0, "loss_rank_avg": 0.298971951007843, "step": 1795, "valid_targets_mean": 4380.4, "valid_targets_min": 1213 }, { "epoch": 3.220035778175313, "grad_norm": 0.5382921298878789, "learning_rate": 2.6204095156292048e-05, "loss": 0.2644, "loss_nan_ranks": 0, "loss_rank_avg": 0.26511919498443604, "step": 1800, "valid_targets_mean": 4108.1, "valid_targets_min": 2044 }, { "epoch": 3.228980322003578, "grad_norm": 0.5252112327673899, "learning_rate": 2.6119210718279538e-05, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.28953590989112854, "step": 1805, "valid_targets_mean": 4361.9, "valid_targets_min": 1299 }, { "epoch": 3.2379248658318427, "grad_norm": 0.5410954452724649, "learning_rate": 2.60342044928577e-05, "loss": 0.2808, "loss_nan_ranks": 0, "loss_rank_avg": 0.30843818187713623, "step": 1810, "valid_targets_mean": 4546.8, "valid_targets_min": 1329 }, { "epoch": 3.2468694096601074, "grad_norm": 0.581674111347238, "learning_rate": 2.5949078171860395e-05, "loss": 0.2845, "loss_nan_ranks": 0, "loss_rank_avg": 0.30058762431144714, "step": 1815, "valid_targets_mean": 3899.8, "valid_targets_min": 763 }, { "epoch": 3.255813953488372, "grad_norm": 0.5237279678403152, "learning_rate": 2.5863833449511706e-05, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.27064049243927, "step": 1820, "valid_targets_mean": 4455.4, "valid_targets_min": 1818 }, { "epoch": 3.264758497316637, "grad_norm": 0.5533963196851126, "learning_rate": 2.5778472022392184e-05, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.2702397108078003, "step": 1825, "valid_targets_mean": 4271.4, "valid_targets_min": 2002 }, { "epoch": 3.2737030411449015, "grad_norm": 0.5313362157055852, "learning_rate": 2.5692995589405087e-05, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.2803131341934204, "step": 1830, "valid_targets_mean": 4208.0, "valid_targets_min": 1639 }, { "epoch": 3.282647584973166, "grad_norm": 0.5541192810579373, "learning_rate": 2.5607405851742578e-05, "loss": 0.2786, "loss_nan_ranks": 0, "loss_rank_avg": 0.2655271291732788, "step": 1835, "valid_targets_mean": 4423.6, "valid_targets_min": 1631 }, { "epoch": 3.2915921288014314, "grad_norm": 0.581829811898252, "learning_rate": 2.5521704512851884e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.28082770109176636, "step": 1840, "valid_targets_mean": 3964.4, "valid_targets_min": 1481 }, { "epoch": 3.300536672629696, "grad_norm": 0.5564304499542477, "learning_rate": 2.5435893278401328e-05, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.2610231637954712, "step": 1845, "valid_targets_mean": 3748.6, "valid_targets_min": 1052 }, { "epoch": 3.309481216457961, "grad_norm": 0.5890948907758241, "learning_rate": 2.534997385624647e-05, "loss": 0.2651, "loss_nan_ranks": 0, "loss_rank_avg": 0.2398790717124939, "step": 1850, "valid_targets_mean": 3603.0, "valid_targets_min": 552 }, { "epoch": 3.3184257602862255, "grad_norm": 0.563595381422207, "learning_rate": 2.5263947956396043e-05, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.2689689099788666, "step": 1855, "valid_targets_mean": 3884.8, "valid_targets_min": 922 }, { "epoch": 3.32737030411449, "grad_norm": 0.5202754657752621, "learning_rate": 2.5177817290977967e-05, "loss": 0.275, "loss_nan_ranks": 0, "loss_rank_avg": 0.2853309214115143, "step": 1860, "valid_targets_mean": 4258.4, "valid_targets_min": 1557 }, { "epoch": 3.336314847942755, "grad_norm": 0.5125955462826816, "learning_rate": 2.5091583574205247e-05, "loss": 0.2813, "loss_nan_ranks": 0, "loss_rank_avg": 0.26263585686683655, "step": 1865, "valid_targets_mean": 4235.4, "valid_targets_min": 2097 }, { "epoch": 3.3452593917710196, "grad_norm": 0.5366296714092318, "learning_rate": 2.5005248522341868e-05, "loss": 0.2741, "loss_nan_ranks": 0, "loss_rank_avg": 0.2572114169597626, "step": 1870, "valid_targets_mean": 3658.3, "valid_targets_min": 1843 }, { "epoch": 3.3542039355992843, "grad_norm": 0.5473866663101812, "learning_rate": 2.4918813853668632e-05, "loss": 0.2807, "loss_nan_ranks": 0, "loss_rank_avg": 0.2796470522880554, "step": 1875, "valid_targets_mean": 3708.9, "valid_targets_min": 1482 }, { "epoch": 3.363148479427549, "grad_norm": 0.5566454634749927, "learning_rate": 2.483228128844896e-05, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.2780247926712036, "step": 1880, "valid_targets_mean": 3811.8, "valid_targets_min": 842 }, { "epoch": 3.3720930232558137, "grad_norm": 0.5573845593232436, "learning_rate": 2.4745652548894654e-05, "loss": 0.273, "loss_nan_ranks": 0, "loss_rank_avg": 0.2704911231994629, "step": 1885, "valid_targets_mean": 4766.7, "valid_targets_min": 2080 }, { "epoch": 3.381037567084079, "grad_norm": 0.5104062442322098, "learning_rate": 2.4658929359131634e-05, "loss": 0.273, "loss_nan_ranks": 0, "loss_rank_avg": 0.2546011209487915, "step": 1890, "valid_targets_mean": 4313.2, "valid_targets_min": 993 }, { "epoch": 3.3899821109123436, "grad_norm": 0.6120011359863383, "learning_rate": 2.4572113445165603e-05, "loss": 0.2944, "loss_nan_ranks": 0, "loss_rank_avg": 0.29367899894714355, "step": 1895, "valid_targets_mean": 3432.7, "valid_targets_min": 758 }, { "epoch": 3.3989266547406083, "grad_norm": 0.5470654579653317, "learning_rate": 2.4485206534847706e-05, "loss": 0.2786, "loss_nan_ranks": 0, "loss_rank_avg": 0.2764478921890259, "step": 1900, "valid_targets_mean": 3888.6, "valid_targets_min": 1597 }, { "epoch": 3.407871198568873, "grad_norm": 0.5631697298734966, "learning_rate": 2.439821035784014e-05, "loss": 0.2801, "loss_nan_ranks": 0, "loss_rank_avg": 0.29474952816963196, "step": 1905, "valid_targets_mean": 3846.1, "valid_targets_min": 1665 }, { "epoch": 3.4168157423971377, "grad_norm": 0.522999992256365, "learning_rate": 2.431112664558173e-05, "loss": 0.2704, "loss_nan_ranks": 0, "loss_rank_avg": 0.2620839476585388, "step": 1910, "valid_targets_mean": 3582.1, "valid_targets_min": 1304 }, { "epoch": 3.4257602862254024, "grad_norm": 0.49262352099697787, "learning_rate": 2.4223957131253467e-05, "loss": 0.2743, "loss_nan_ranks": 0, "loss_rank_avg": 0.26315534114837646, "step": 1915, "valid_targets_mean": 4538.1, "valid_targets_min": 2028 }, { "epoch": 3.434704830053667, "grad_norm": 0.5515685545090246, "learning_rate": 2.4136703549744028e-05, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.2935299873352051, "step": 1920, "valid_targets_mean": 4080.0, "valid_targets_min": 794 }, { "epoch": 3.4436493738819323, "grad_norm": 0.48476650247349296, "learning_rate": 2.4049367637615215e-05, "loss": 0.2964, "loss_nan_ranks": 0, "loss_rank_avg": 0.2544916272163391, "step": 1925, "valid_targets_mean": 4508.7, "valid_targets_min": 1366 }, { "epoch": 3.452593917710197, "grad_norm": 0.4860033907502521, "learning_rate": 2.396195113306742e-05, "loss": 0.2764, "loss_nan_ranks": 0, "loss_rank_avg": 0.2550594210624695, "step": 1930, "valid_targets_mean": 4433.0, "valid_targets_min": 1985 }, { "epoch": 3.4615384615384617, "grad_norm": 0.5353229674635286, "learning_rate": 2.3874455775905036e-05, "loss": 0.2666, "loss_nan_ranks": 0, "loss_rank_avg": 0.2665395736694336, "step": 1935, "valid_targets_mean": 3745.3, "valid_targets_min": 937 }, { "epoch": 3.4704830053667264, "grad_norm": 0.5901472498319702, "learning_rate": 2.3786883307501794e-05, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.29798996448516846, "step": 1940, "valid_targets_mean": 4030.6, "valid_targets_min": 1812 }, { "epoch": 3.479427549194991, "grad_norm": 0.5296365133279529, "learning_rate": 2.3699235470766147e-05, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.2898460030555725, "step": 1945, "valid_targets_mean": 4661.3, "valid_targets_min": 2092 }, { "epoch": 3.488372093023256, "grad_norm": 0.6738643909015106, "learning_rate": 2.3611514010106564e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.2727169990539551, "step": 1950, "valid_targets_mean": 4183.0, "valid_targets_min": 1207 }, { "epoch": 3.4973166368515205, "grad_norm": 0.5074455770952165, "learning_rate": 2.35237206713968e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.24378815293312073, "step": 1955, "valid_targets_mean": 4246.9, "valid_targets_min": 1394 }, { "epoch": 3.506261180679785, "grad_norm": 0.5374442471219851, "learning_rate": 2.3435857201941172e-05, "loss": 0.2717, "loss_nan_ranks": 0, "loss_rank_avg": 0.27619755268096924, "step": 1960, "valid_targets_mean": 3896.1, "valid_targets_min": 1301 }, { "epoch": 3.51520572450805, "grad_norm": 0.5087843696552686, "learning_rate": 2.3347925350439765e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.2813979387283325, "step": 1965, "valid_targets_mean": 3997.4, "valid_targets_min": 1369 }, { "epoch": 3.5241502683363146, "grad_norm": 0.5980560849762698, "learning_rate": 2.3259926866953636e-05, "loss": 0.2801, "loss_nan_ranks": 0, "loss_rank_avg": 0.28663375973701477, "step": 1970, "valid_targets_mean": 3297.6, "valid_targets_min": 1305 }, { "epoch": 3.5330948121645798, "grad_norm": 0.5193924325842352, "learning_rate": 2.3171863502869993e-05, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.26521211862564087, "step": 1975, "valid_targets_mean": 4117.4, "valid_targets_min": 2056 }, { "epoch": 3.5420393559928445, "grad_norm": 0.5449182986186685, "learning_rate": 2.3083737010867316e-05, "loss": 0.2765, "loss_nan_ranks": 0, "loss_rank_avg": 0.26807746291160583, "step": 1980, "valid_targets_mean": 3758.1, "valid_targets_min": 1563 }, { "epoch": 3.550983899821109, "grad_norm": 0.6191157830270809, "learning_rate": 2.2995549144880487e-05, "loss": 0.2805, "loss_nan_ranks": 0, "loss_rank_avg": 0.31274452805519104, "step": 1985, "valid_targets_mean": 3152.6, "valid_targets_min": 710 }, { "epoch": 3.559928443649374, "grad_norm": 0.4986923272606033, "learning_rate": 2.290730166006589e-05, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.27044352889060974, "step": 1990, "valid_targets_mean": 4526.8, "valid_targets_min": 1712 }, { "epoch": 3.5688729874776386, "grad_norm": 0.5291098132220836, "learning_rate": 2.2818996312766474e-05, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.28628769516944885, "step": 1995, "valid_targets_mean": 4237.6, "valid_targets_min": 1300 }, { "epoch": 3.5778175313059033, "grad_norm": 0.5395780033336437, "learning_rate": 2.2730634860476778e-05, "loss": 0.2837, "loss_nan_ranks": 0, "loss_rank_avg": 0.2602778673171997, "step": 2000, "valid_targets_mean": 3754.7, "valid_targets_min": 2238 }, { "epoch": 3.586762075134168, "grad_norm": 0.5654796524167398, "learning_rate": 2.264221906180798e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.26922616362571716, "step": 2005, "valid_targets_mean": 3893.6, "valid_targets_min": 1565 }, { "epoch": 3.595706618962433, "grad_norm": 0.5747944159759851, "learning_rate": 2.255375067645289e-05, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.29051297903060913, "step": 2010, "valid_targets_mean": 3719.8, "valid_targets_min": 1764 }, { "epoch": 3.604651162790698, "grad_norm": 1.076215188277447, "learning_rate": 2.2465231465150902e-05, "loss": 0.2711, "loss_nan_ranks": 0, "loss_rank_avg": 0.2821960151195526, "step": 2015, "valid_targets_mean": 4530.9, "valid_targets_min": 1666 }, { "epoch": 3.6135957066189626, "grad_norm": 0.5041678901004969, "learning_rate": 2.2376663189653002e-05, "loss": 0.2773, "loss_nan_ranks": 0, "loss_rank_avg": 0.25614356994628906, "step": 2020, "valid_targets_mean": 4557.1, "valid_targets_min": 2257 }, { "epoch": 3.6225402504472273, "grad_norm": 0.49697468351907303, "learning_rate": 2.2288047612686655e-05, "loss": 0.2639, "loss_nan_ranks": 0, "loss_rank_avg": 0.2509356737136841, "step": 2025, "valid_targets_mean": 4656.5, "valid_targets_min": 2178 }, { "epoch": 3.631484794275492, "grad_norm": 0.5593780074340731, "learning_rate": 2.219938649792074e-05, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.2787664532661438, "step": 2030, "valid_targets_mean": 3585.8, "valid_targets_min": 725 }, { "epoch": 3.6404293381037567, "grad_norm": 0.6058445555907487, "learning_rate": 2.2110681609930458e-05, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.28542840480804443, "step": 2035, "valid_targets_mean": 3754.0, "valid_targets_min": 1893 }, { "epoch": 3.6493738819320214, "grad_norm": 0.6592434752132575, "learning_rate": 2.2021934714162212e-05, "loss": 0.2771, "loss_nan_ranks": 0, "loss_rank_avg": 0.30062779784202576, "step": 2040, "valid_targets_mean": 3522.3, "valid_targets_min": 527 }, { "epoch": 3.658318425760286, "grad_norm": 0.511485872021097, "learning_rate": 2.1933147576898447e-05, "loss": 0.2728, "loss_nan_ranks": 0, "loss_rank_avg": 0.25937914848327637, "step": 2045, "valid_targets_mean": 3873.6, "valid_targets_min": 1491 }, { "epoch": 3.667262969588551, "grad_norm": 0.5594642686607454, "learning_rate": 2.1844321965222525e-05, "loss": 0.2825, "loss_nan_ranks": 0, "loss_rank_avg": 0.3036922216415405, "step": 2050, "valid_targets_mean": 3970.2, "valid_targets_min": 1673 }, { "epoch": 3.6762075134168155, "grad_norm": 0.5162375365075016, "learning_rate": 2.1755459646983545e-05, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.27681976556777954, "step": 2055, "valid_targets_mean": 4571.4, "valid_targets_min": 1171 }, { "epoch": 3.6851520572450807, "grad_norm": 0.507537692969965, "learning_rate": 2.1666562390761147e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.2693493664264679, "step": 2060, "valid_targets_mean": 5078.4, "valid_targets_min": 1264 }, { "epoch": 3.6940966010733454, "grad_norm": 0.5780198663275775, "learning_rate": 2.1577631965830324e-05, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.2515581250190735, "step": 2065, "valid_targets_mean": 3473.2, "valid_targets_min": 1525 }, { "epoch": 3.70304114490161, "grad_norm": 0.5015533752033411, "learning_rate": 2.1488670142126234e-05, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.2759404182434082, "step": 2070, "valid_targets_mean": 4662.1, "valid_targets_min": 1440 }, { "epoch": 3.7119856887298748, "grad_norm": 0.518248052496532, "learning_rate": 2.13996786902089e-05, "loss": 0.274, "loss_nan_ranks": 0, "loss_rank_avg": 0.27556905150413513, "step": 2075, "valid_targets_mean": 4112.4, "valid_targets_min": 2299 }, { "epoch": 3.7209302325581395, "grad_norm": 0.53651912472871, "learning_rate": 2.1310659381228066e-05, "loss": 0.2846, "loss_nan_ranks": 0, "loss_rank_avg": 0.2784693241119385, "step": 2080, "valid_targets_mean": 3839.6, "valid_targets_min": 1588 }, { "epoch": 3.729874776386404, "grad_norm": 0.5764048848203882, "learning_rate": 2.122161398688788e-05, "loss": 0.2903, "loss_nan_ranks": 0, "loss_rank_avg": 0.28273123502731323, "step": 2085, "valid_targets_mean": 3669.2, "valid_targets_min": 741 }, { "epoch": 3.738819320214669, "grad_norm": 0.4820289047101863, "learning_rate": 2.1132544279411655e-05, "loss": 0.2747, "loss_nan_ranks": 0, "loss_rank_avg": 0.26568305492401123, "step": 2090, "valid_targets_mean": 4602.2, "valid_targets_min": 786 }, { "epoch": 3.747763864042934, "grad_norm": 0.6120891450370751, "learning_rate": 2.1043452031506578e-05, "loss": 0.2807, "loss_nan_ranks": 0, "loss_rank_avg": 0.2671006917953491, "step": 2095, "valid_targets_mean": 3208.0, "valid_targets_min": 1621 }, { "epoch": 3.7567084078711988, "grad_norm": 0.4891187435236056, "learning_rate": 2.0954339016328485e-05, "loss": 0.2781, "loss_nan_ranks": 0, "loss_rank_avg": 0.25922301411628723, "step": 2100, "valid_targets_mean": 4271.0, "valid_targets_min": 1612 }, { "epoch": 3.7656529516994635, "grad_norm": 0.5464092724861203, "learning_rate": 2.08652070074465e-05, "loss": 0.2805, "loss_nan_ranks": 0, "loss_rank_avg": 0.3047419786453247, "step": 2105, "valid_targets_mean": 3791.9, "valid_targets_min": 1102 }, { "epoch": 3.774597495527728, "grad_norm": 0.6364819542700682, "learning_rate": 2.077605777880778e-05, "loss": 0.2681, "loss_nan_ranks": 0, "loss_rank_avg": 0.31326138973236084, "step": 2110, "valid_targets_mean": 3016.8, "valid_targets_min": 748 }, { "epoch": 3.783542039355993, "grad_norm": 0.5001257137373921, "learning_rate": 2.0686893104702198e-05, "loss": 0.2589, "loss_nan_ranks": 0, "loss_rank_avg": 0.2531580328941345, "step": 2115, "valid_targets_mean": 4102.5, "valid_targets_min": 1660 }, { "epoch": 3.7924865831842576, "grad_norm": 0.474779949675362, "learning_rate": 2.0597714759727028e-05, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.2678177058696747, "step": 2120, "valid_targets_mean": 4861.8, "valid_targets_min": 1696 }, { "epoch": 3.8014311270125223, "grad_norm": 0.46813381967025147, "learning_rate": 2.050852451875163e-05, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.27863186597824097, "step": 2125, "valid_targets_mean": 4995.9, "valid_targets_min": 715 }, { "epoch": 3.810375670840787, "grad_norm": 0.5646539409857256, "learning_rate": 2.041932415688212e-05, "loss": 0.2749, "loss_nan_ranks": 0, "loss_rank_avg": 0.2734571099281311, "step": 2130, "valid_targets_mean": 4401.4, "valid_targets_min": 1873 }, { "epoch": 3.8193202146690517, "grad_norm": 0.5405176564877853, "learning_rate": 2.0330115449426054e-05, "loss": 0.2792, "loss_nan_ranks": 0, "loss_rank_avg": 0.30330121517181396, "step": 2135, "valid_targets_mean": 4075.5, "valid_targets_min": 988 }, { "epoch": 3.8282647584973164, "grad_norm": 0.5063431046009021, "learning_rate": 2.0240900171857064e-05, "loss": 0.2892, "loss_nan_ranks": 0, "loss_rank_avg": 0.29637011885643005, "step": 2140, "valid_targets_mean": 4556.2, "valid_targets_min": 1850 }, { "epoch": 3.8372093023255816, "grad_norm": 0.6148280852194663, "learning_rate": 2.0151680099779574e-05, "loss": 0.2795, "loss_nan_ranks": 0, "loss_rank_avg": 0.2594483494758606, "step": 2145, "valid_targets_mean": 3378.6, "valid_targets_min": 943 }, { "epoch": 3.8461538461538463, "grad_norm": 0.5460464073665912, "learning_rate": 2.0062457008893408e-05, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.25146251916885376, "step": 2150, "valid_targets_mean": 3959.3, "valid_targets_min": 1579 }, { "epoch": 3.855098389982111, "grad_norm": 0.5034957296053513, "learning_rate": 1.9973232674958487e-05, "loss": 0.2698, "loss_nan_ranks": 0, "loss_rank_avg": 0.25639331340789795, "step": 2155, "valid_targets_mean": 4098.7, "valid_targets_min": 1449 }, { "epoch": 3.8640429338103757, "grad_norm": 0.566801459570412, "learning_rate": 1.9884008873759446e-05, "loss": 0.2751, "loss_nan_ranks": 0, "loss_rank_avg": 0.29593968391418457, "step": 2160, "valid_targets_mean": 3769.4, "valid_targets_min": 474 }, { "epoch": 3.8729874776386404, "grad_norm": 0.5224664015779718, "learning_rate": 1.979478738107035e-05, "loss": 0.2669, "loss_nan_ranks": 0, "loss_rank_avg": 0.2669827938079834, "step": 2165, "valid_targets_mean": 4153.2, "valid_targets_min": 1824 }, { "epoch": 3.881932021466905, "grad_norm": 0.5346475973128151, "learning_rate": 1.9705569972619295e-05, "loss": 0.2837, "loss_nan_ranks": 0, "loss_rank_avg": 0.28263264894485474, "step": 2170, "valid_targets_mean": 3984.6, "valid_targets_min": 1518 }, { "epoch": 3.89087656529517, "grad_norm": 0.5482896143276372, "learning_rate": 1.961635842405311e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.27248382568359375, "step": 2175, "valid_targets_mean": 4330.0, "valid_targets_min": 1711 }, { "epoch": 3.899821109123435, "grad_norm": 0.48204226172382336, "learning_rate": 1.9527154510901972e-05, "loss": 0.2734, "loss_nan_ranks": 0, "loss_rank_avg": 0.25980862975120544, "step": 2180, "valid_targets_mean": 4406.8, "valid_targets_min": 1855 }, { "epoch": 3.9087656529516996, "grad_norm": 0.4210041453535078, "learning_rate": 1.9437960008544126e-05, "loss": 0.2578, "loss_nan_ranks": 0, "loss_rank_avg": 0.2111448049545288, "step": 2185, "valid_targets_mean": 5192.1, "valid_targets_min": 2200 }, { "epoch": 3.9177101967799643, "grad_norm": 0.5637363734690357, "learning_rate": 1.9348776692170494e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.2881026566028595, "step": 2190, "valid_targets_mean": 3882.8, "valid_targets_min": 558 }, { "epoch": 3.926654740608229, "grad_norm": 0.48316017438181486, "learning_rate": 1.9259606336749374e-05, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.2716853618621826, "step": 2195, "valid_targets_mean": 4683.8, "valid_targets_min": 1674 }, { "epoch": 3.9355992844364938, "grad_norm": 0.45317704598781144, "learning_rate": 1.9170450716991122e-05, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.236902117729187, "step": 2200, "valid_targets_mean": 4864.1, "valid_targets_min": 2033 }, { "epoch": 3.9445438282647585, "grad_norm": 0.56647472453608, "learning_rate": 1.90813116073128e-05, "loss": 0.2896, "loss_nan_ranks": 0, "loss_rank_avg": 0.30802735686302185, "step": 2205, "valid_targets_mean": 3714.6, "valid_targets_min": 823 }, { "epoch": 3.953488372093023, "grad_norm": 0.5508322430994914, "learning_rate": 1.899219078180289e-05, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.29120323061943054, "step": 2210, "valid_targets_mean": 3726.9, "valid_targets_min": 1807 }, { "epoch": 3.962432915921288, "grad_norm": 0.5708136652371602, "learning_rate": 1.8903090014185984e-05, "loss": 0.2706, "loss_nan_ranks": 0, "loss_rank_avg": 0.26580384373664856, "step": 2215, "valid_targets_mean": 3621.6, "valid_targets_min": 1470 }, { "epoch": 3.9713774597495526, "grad_norm": 0.5942416912075751, "learning_rate": 1.881401107778744e-05, "loss": 0.2802, "loss_nan_ranks": 0, "loss_rank_avg": 0.30616092681884766, "step": 2220, "valid_targets_mean": 3367.2, "valid_targets_min": 777 }, { "epoch": 3.9803220035778173, "grad_norm": 0.5144304612582596, "learning_rate": 1.8724955745498147e-05, "loss": 0.2689, "loss_nan_ranks": 0, "loss_rank_avg": 0.2784048318862915, "step": 2225, "valid_targets_mean": 4234.6, "valid_targets_min": 1729 }, { "epoch": 3.9892665474060824, "grad_norm": 0.5300804516751338, "learning_rate": 1.863592578973921e-05, "loss": 0.2769, "loss_nan_ranks": 0, "loss_rank_avg": 0.27351003885269165, "step": 2230, "valid_targets_mean": 3583.5, "valid_targets_min": 1324 }, { "epoch": 3.998211091234347, "grad_norm": 0.5329781559722259, "learning_rate": 1.854692298242667e-05, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.24892058968544006, "step": 2235, "valid_targets_mean": 3651.9, "valid_targets_min": 1519 }, { "epoch": 4.007155635062611, "grad_norm": 0.4900604244331859, "learning_rate": 1.8457949094936265e-05, "loss": 0.2479, "loss_nan_ranks": 0, "loss_rank_avg": 0.2408735752105713, "step": 2240, "valid_targets_mean": 4293.0, "valid_targets_min": 1617 }, { "epoch": 4.016100178890877, "grad_norm": 0.49977219265912204, "learning_rate": 1.8369005898068136e-05, "loss": 0.25, "loss_nan_ranks": 0, "loss_rank_avg": 0.26399219036102295, "step": 2245, "valid_targets_mean": 5123.9, "valid_targets_min": 667 }, { "epoch": 4.025044722719142, "grad_norm": 0.5502105291911087, "learning_rate": 1.8280095162011617e-05, "loss": 0.2608, "loss_nan_ranks": 0, "loss_rank_avg": 0.28108128905296326, "step": 2250, "valid_targets_mean": 4024.1, "valid_targets_min": 747 }, { "epoch": 4.033989266547406, "grad_norm": 0.5835364945002972, "learning_rate": 1.819121865630998e-05, "loss": 0.2627, "loss_nan_ranks": 0, "loss_rank_avg": 0.25397148728370667, "step": 2255, "valid_targets_mean": 3106.8, "valid_targets_min": 1424 }, { "epoch": 4.042933810375671, "grad_norm": 0.5736849669987507, "learning_rate": 1.8102378149825242e-05, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.25006911158561707, "step": 2260, "valid_targets_mean": 4338.4, "valid_targets_min": 1212 }, { "epoch": 4.051878354203936, "grad_norm": 0.578856261130234, "learning_rate": 1.801357541070294e-05, "loss": 0.2561, "loss_nan_ranks": 0, "loss_rank_avg": 0.2498929500579834, "step": 2265, "valid_targets_mean": 3711.7, "valid_targets_min": 1454 }, { "epoch": 4.0608228980322005, "grad_norm": 0.570026305308228, "learning_rate": 1.7924812206336956e-05, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.24680036306381226, "step": 2270, "valid_targets_mean": 3502.1, "valid_targets_min": 766 }, { "epoch": 4.069767441860465, "grad_norm": 0.5017381451878832, "learning_rate": 1.7836090303334312e-05, "loss": 0.2587, "loss_nan_ranks": 0, "loss_rank_avg": 0.24516400694847107, "step": 2275, "valid_targets_mean": 4885.2, "valid_targets_min": 1056 }, { "epoch": 4.07871198568873, "grad_norm": 0.6571441759078382, "learning_rate": 1.7747411467480058e-05, "loss": 0.2619, "loss_nan_ranks": 0, "loss_rank_avg": 0.25563162565231323, "step": 2280, "valid_targets_mean": 4010.9, "valid_targets_min": 1636 }, { "epoch": 4.087656529516995, "grad_norm": 0.5157227921600919, "learning_rate": 1.7658777463702076e-05, "loss": 0.2611, "loss_nan_ranks": 0, "loss_rank_avg": 0.26061367988586426, "step": 2285, "valid_targets_mean": 4204.8, "valid_targets_min": 1436 }, { "epoch": 4.096601073345259, "grad_norm": 0.5245851983426554, "learning_rate": 1.7570190056035996e-05, "loss": 0.2598, "loss_nan_ranks": 0, "loss_rank_avg": 0.23559322953224182, "step": 2290, "valid_targets_mean": 4053.4, "valid_targets_min": 722 }, { "epoch": 4.105545617173524, "grad_norm": 0.5917926110353966, "learning_rate": 1.7481651007590054e-05, "loss": 0.2706, "loss_nan_ranks": 0, "loss_rank_avg": 0.25014737248420715, "step": 2295, "valid_targets_mean": 3289.2, "valid_targets_min": 699 }, { "epoch": 4.114490161001789, "grad_norm": 0.5026025456498621, "learning_rate": 1.7393162080510045e-05, "loss": 0.2712, "loss_nan_ranks": 0, "loss_rank_avg": 0.2548500895500183, "step": 2300, "valid_targets_mean": 4602.9, "valid_targets_min": 1525 }, { "epoch": 4.1234347048300535, "grad_norm": 0.5164574844544229, "learning_rate": 1.7304725035944194e-05, "loss": 0.2549, "loss_nan_ranks": 0, "loss_rank_avg": 0.2356826364994049, "step": 2305, "valid_targets_mean": 4163.1, "valid_targets_min": 1691 }, { "epoch": 4.132379248658318, "grad_norm": 0.48824332711112567, "learning_rate": 1.7216341634008168e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.25585299730300903, "step": 2310, "valid_targets_mean": 5345.3, "valid_targets_min": 2336 }, { "epoch": 4.141323792486583, "grad_norm": 0.5908232354996049, "learning_rate": 1.7128013633749978e-05, "loss": 0.2713, "loss_nan_ranks": 0, "loss_rank_avg": 0.26593607664108276, "step": 2315, "valid_targets_mean": 4050.5, "valid_targets_min": 684 }, { "epoch": 4.150268336314848, "grad_norm": 0.5495386431735231, "learning_rate": 1.7039742793115025e-05, "loss": 0.2688, "loss_nan_ranks": 0, "loss_rank_avg": 0.2615734040737152, "step": 2320, "valid_targets_mean": 3975.1, "valid_targets_min": 2183 }, { "epoch": 4.159212880143112, "grad_norm": 0.6242915835353913, "learning_rate": 1.6951530868911097e-05, "loss": 0.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.2717490792274475, "step": 2325, "valid_targets_mean": 3084.0, "valid_targets_min": 737 }, { "epoch": 4.168157423971378, "grad_norm": 0.5070664833456054, "learning_rate": 1.6863379616773388e-05, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.2583721876144409, "step": 2330, "valid_targets_mean": 4625.7, "valid_targets_min": 1817 }, { "epoch": 4.177101967799643, "grad_norm": 0.5582812233226788, "learning_rate": 1.6775290791129567e-05, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.2620850205421448, "step": 2335, "valid_targets_mean": 3869.9, "valid_targets_min": 1570 }, { "epoch": 4.186046511627907, "grad_norm": 0.584227709585007, "learning_rate": 1.668726614516488e-05, "loss": 0.2689, "loss_nan_ranks": 0, "loss_rank_avg": 0.25571852922439575, "step": 2340, "valid_targets_mean": 3331.9, "valid_targets_min": 1615 }, { "epoch": 4.194991055456172, "grad_norm": 0.5175133185961949, "learning_rate": 1.6599307430787216e-05, "loss": 0.256, "loss_nan_ranks": 0, "loss_rank_avg": 0.2526220977306366, "step": 2345, "valid_targets_mean": 4406.4, "valid_targets_min": 1662 }, { "epoch": 4.203935599284437, "grad_norm": 0.49289171535932735, "learning_rate": 1.6511416398592264e-05, "loss": 0.2705, "loss_nan_ranks": 0, "loss_rank_avg": 0.2843324840068817, "step": 2350, "valid_targets_mean": 5134.6, "valid_targets_min": 995 }, { "epoch": 4.212880143112701, "grad_norm": 0.5356859083954757, "learning_rate": 1.64235947978287e-05, "loss": 0.2669, "loss_nan_ranks": 0, "loss_rank_avg": 0.28424036502838135, "step": 2355, "valid_targets_mean": 4424.1, "valid_targets_min": 1810 }, { "epoch": 4.221824686940966, "grad_norm": 0.513042991430007, "learning_rate": 1.6335844376363295e-05, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.2585211396217346, "step": 2360, "valid_targets_mean": 5082.6, "valid_targets_min": 907 }, { "epoch": 4.230769230769231, "grad_norm": 0.5695128355206176, "learning_rate": 1.6248166880646225e-05, "loss": 0.2557, "loss_nan_ranks": 0, "loss_rank_avg": 0.2641540467739105, "step": 2365, "valid_targets_mean": 3779.7, "valid_targets_min": 1253 }, { "epoch": 4.2397137745974955, "grad_norm": 0.6023295149757434, "learning_rate": 1.6160564055676235e-05, "loss": 0.259, "loss_nan_ranks": 0, "loss_rank_avg": 0.2857375144958496, "step": 2370, "valid_targets_mean": 2948.9, "valid_targets_min": 720 }, { "epoch": 4.24865831842576, "grad_norm": 0.5098827801538092, "learning_rate": 1.6073037644965938e-05, "loss": 0.2548, "loss_nan_ranks": 0, "loss_rank_avg": 0.23553355038166046, "step": 2375, "valid_targets_mean": 4315.9, "valid_targets_min": 1473 }, { "epoch": 4.257602862254025, "grad_norm": 0.5243491333274759, "learning_rate": 1.5985589390507117e-05, "loss": 0.2627, "loss_nan_ranks": 0, "loss_rank_avg": 0.27872568368911743, "step": 2380, "valid_targets_mean": 4803.7, "valid_targets_min": 842 }, { "epoch": 4.26654740608229, "grad_norm": 0.5241756061317848, "learning_rate": 1.589822103273607e-05, "loss": 0.2633, "loss_nan_ranks": 0, "loss_rank_avg": 0.2604633867740631, "step": 2385, "valid_targets_mean": 3930.9, "valid_targets_min": 835 }, { "epoch": 4.275491949910554, "grad_norm": 0.4948005196786464, "learning_rate": 1.5810934310498922e-05, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.28036582469940186, "step": 2390, "valid_targets_mean": 4740.4, "valid_targets_min": 1665 }, { "epoch": 4.284436493738819, "grad_norm": 0.5212209771223362, "learning_rate": 1.5723730961017082e-05, "loss": 0.2593, "loss_nan_ranks": 0, "loss_rank_avg": 0.28980493545532227, "step": 2395, "valid_targets_mean": 4507.4, "valid_targets_min": 1489 }, { "epoch": 4.293381037567084, "grad_norm": 0.5309847222961126, "learning_rate": 1.5636612719852615e-05, "loss": 0.2732, "loss_nan_ranks": 0, "loss_rank_avg": 0.2707955837249756, "step": 2400, "valid_targets_mean": 4071.7, "valid_targets_min": 2048 }, { "epoch": 4.3023255813953485, "grad_norm": 0.6436096499085671, "learning_rate": 1.5549581320873715e-05, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.27491945028305054, "step": 2405, "valid_targets_mean": 3519.8, "valid_targets_min": 483 }, { "epoch": 4.311270125223613, "grad_norm": 0.6837292335134912, "learning_rate": 1.5462638496220223e-05, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.2572469413280487, "step": 2410, "valid_targets_mean": 3385.1, "valid_targets_min": 787 }, { "epoch": 4.320214669051879, "grad_norm": 0.5148506938846231, "learning_rate": 1.537578597626912e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.2704946994781494, "step": 2415, "valid_targets_mean": 4277.2, "valid_targets_min": 1140 }, { "epoch": 4.3291592128801435, "grad_norm": 0.5488881906738768, "learning_rate": 1.528902548960009e-05, "loss": 0.2697, "loss_nan_ranks": 0, "loss_rank_avg": 0.26252859830856323, "step": 2420, "valid_targets_mean": 4134.1, "valid_targets_min": 697 }, { "epoch": 4.338103756708408, "grad_norm": 0.728874058237292, "learning_rate": 1.5202358762961155e-05, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.2942860424518585, "step": 2425, "valid_targets_mean": 2536.9, "valid_targets_min": 629 }, { "epoch": 4.347048300536673, "grad_norm": 0.542241600208826, "learning_rate": 1.511578752123426e-05, "loss": 0.2574, "loss_nan_ranks": 0, "loss_rank_avg": 0.2418219894170761, "step": 2430, "valid_targets_mean": 3832.9, "valid_targets_min": 1764 }, { "epoch": 4.355992844364938, "grad_norm": 0.5211187289766209, "learning_rate": 1.5029313487400958e-05, "loss": 0.2681, "loss_nan_ranks": 0, "loss_rank_avg": 0.27209898829460144, "step": 2435, "valid_targets_mean": 4450.8, "valid_targets_min": 1600 }, { "epoch": 4.364937388193202, "grad_norm": 0.519412156562896, "learning_rate": 1.4942938382508147e-05, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.2514136731624603, "step": 2440, "valid_targets_mean": 3935.2, "valid_targets_min": 1225 }, { "epoch": 4.373881932021467, "grad_norm": 0.5552648581770736, "learning_rate": 1.4856663925633776e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.27997347712516785, "step": 2445, "valid_targets_mean": 3901.2, "valid_targets_min": 656 }, { "epoch": 4.382826475849732, "grad_norm": 0.5765361718445776, "learning_rate": 1.4770491833852663e-05, "loss": 0.2663, "loss_nan_ranks": 0, "loss_rank_avg": 0.25308501720428467, "step": 2450, "valid_targets_mean": 3612.2, "valid_targets_min": 1505 }, { "epoch": 4.391771019677996, "grad_norm": 0.4583081364190965, "learning_rate": 1.4684423822202297e-05, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.2737816870212555, "step": 2455, "valid_targets_mean": 5324.3, "valid_targets_min": 1435 }, { "epoch": 4.400715563506261, "grad_norm": 0.5330319752947505, "learning_rate": 1.4598461603648736e-05, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.2785816788673401, "step": 2460, "valid_targets_mean": 3858.1, "valid_targets_min": 646 }, { "epoch": 4.409660107334526, "grad_norm": 0.5365942670180822, "learning_rate": 1.451260688905245e-05, "loss": 0.266, "loss_nan_ranks": 0, "loss_rank_avg": 0.25116056203842163, "step": 2465, "valid_targets_mean": 3929.6, "valid_targets_min": 1495 }, { "epoch": 4.4186046511627906, "grad_norm": 0.5412560763819989, "learning_rate": 1.4426861387134361e-05, "loss": 0.2635, "loss_nan_ranks": 0, "loss_rank_avg": 0.2546349763870239, "step": 2470, "valid_targets_mean": 3853.9, "valid_targets_min": 1665 }, { "epoch": 4.427549194991055, "grad_norm": 0.49146455305384606, "learning_rate": 1.4341226804441766e-05, "loss": 0.2707, "loss_nan_ranks": 0, "loss_rank_avg": 0.284711092710495, "step": 2475, "valid_targets_mean": 4519.9, "valid_targets_min": 2096 }, { "epoch": 4.43649373881932, "grad_norm": 0.5417709539865344, "learning_rate": 1.4255704845314406e-05, "loss": 0.2744, "loss_nan_ranks": 0, "loss_rank_avg": 0.28545889258384705, "step": 2480, "valid_targets_mean": 4169.8, "valid_targets_min": 1480 }, { "epoch": 4.445438282647585, "grad_norm": 0.580103049281134, "learning_rate": 1.4170297211850522e-05, "loss": 0.2597, "loss_nan_ranks": 0, "loss_rank_avg": 0.2692874073982239, "step": 2485, "valid_targets_mean": 3508.5, "valid_targets_min": 1796 }, { "epoch": 4.454382826475849, "grad_norm": 0.518242596266636, "learning_rate": 1.4085005603873004e-05, "loss": 0.2748, "loss_nan_ranks": 0, "loss_rank_avg": 0.27401190996170044, "step": 2490, "valid_targets_mean": 4321.2, "valid_targets_min": 1504 }, { "epoch": 4.463327370304114, "grad_norm": 0.5757017697078726, "learning_rate": 1.3999831718895545e-05, "loss": 0.276, "loss_nan_ranks": 0, "loss_rank_avg": 0.28794726729393005, "step": 2495, "valid_targets_mean": 4045.3, "valid_targets_min": 1123 }, { "epoch": 4.47227191413238, "grad_norm": 0.5507231462190035, "learning_rate": 1.3914777252088851e-05, "loss": 0.2666, "loss_nan_ranks": 0, "loss_rank_avg": 0.28651851415634155, "step": 2500, "valid_targets_mean": 4500.8, "valid_targets_min": 1340 }, { "epoch": 4.481216457960644, "grad_norm": 0.5709744504493519, "learning_rate": 1.3829843896246917e-05, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.2755128741264343, "step": 2505, "valid_targets_mean": 3492.8, "valid_targets_min": 1623 }, { "epoch": 4.490161001788909, "grad_norm": 0.6042383309260438, "learning_rate": 1.3745033341753337e-05, "loss": 0.2687, "loss_nan_ranks": 0, "loss_rank_avg": 0.2556525468826294, "step": 2510, "valid_targets_mean": 3758.3, "valid_targets_min": 1447 }, { "epoch": 4.499105545617174, "grad_norm": 0.5391378624752455, "learning_rate": 1.3660347276547645e-05, "loss": 0.2761, "loss_nan_ranks": 0, "loss_rank_avg": 0.2629320025444031, "step": 2515, "valid_targets_mean": 3977.8, "valid_targets_min": 1561 }, { "epoch": 4.5080500894454385, "grad_norm": 0.5894869456529992, "learning_rate": 1.3575787386091745e-05, "loss": 0.2549, "loss_nan_ranks": 0, "loss_rank_avg": 0.2664399743080139, "step": 2520, "valid_targets_mean": 3450.4, "valid_targets_min": 1805 }, { "epoch": 4.516994633273703, "grad_norm": 0.5927649885745278, "learning_rate": 1.3491355353336338e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.2676470875740051, "step": 2525, "valid_targets_mean": 3550.7, "valid_targets_min": 741 }, { "epoch": 4.525939177101968, "grad_norm": 0.5460664988494238, "learning_rate": 1.3407052858687432e-05, "loss": 0.2693, "loss_nan_ranks": 0, "loss_rank_avg": 0.28948739171028137, "step": 2530, "valid_targets_mean": 4106.0, "valid_targets_min": 1399 }, { "epoch": 4.534883720930233, "grad_norm": 0.547063854344203, "learning_rate": 1.3322881579972934e-05, "loss": 0.2616, "loss_nan_ranks": 0, "loss_rank_avg": 0.2661360502243042, "step": 2535, "valid_targets_mean": 3879.1, "valid_targets_min": 754 }, { "epoch": 4.543828264758497, "grad_norm": 0.5551257878105804, "learning_rate": 1.323884319240921e-05, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.30140677094459534, "step": 2540, "valid_targets_mean": 3945.9, "valid_targets_min": 1303 }, { "epoch": 4.552772808586762, "grad_norm": 0.5712690563559092, "learning_rate": 1.3154939368567771e-05, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.25856685638427734, "step": 2545, "valid_targets_mean": 3441.0, "valid_targets_min": 1512 }, { "epoch": 4.561717352415027, "grad_norm": 0.5434270961027026, "learning_rate": 1.3071171778341975e-05, "loss": 0.2597, "loss_nan_ranks": 0, "loss_rank_avg": 0.25168734788894653, "step": 2550, "valid_targets_mean": 4073.9, "valid_targets_min": 1313 }, { "epoch": 4.5706618962432914, "grad_norm": 0.5497424956791681, "learning_rate": 1.2987542088913801e-05, "loss": 0.2587, "loss_nan_ranks": 0, "loss_rank_avg": 0.24401748180389404, "step": 2555, "valid_targets_mean": 4201.8, "valid_targets_min": 1546 }, { "epoch": 4.579606440071556, "grad_norm": 0.5096054278407313, "learning_rate": 1.290405196472064e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.26317811012268066, "step": 2560, "valid_targets_mean": 4815.1, "valid_targets_min": 1171 }, { "epoch": 4.588550983899821, "grad_norm": 0.5275387474839849, "learning_rate": 1.282070306742222e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.2525607645511627, "step": 2565, "valid_targets_mean": 4492.8, "valid_targets_min": 1887 }, { "epoch": 4.597495527728086, "grad_norm": 0.5924005743194193, "learning_rate": 1.2737497055867482e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.2749042510986328, "step": 2570, "valid_targets_mean": 3256.1, "valid_targets_min": 825 }, { "epoch": 4.60644007155635, "grad_norm": 0.520307087440015, "learning_rate": 1.2654435586061604e-05, "loss": 0.2489, "loss_nan_ranks": 0, "loss_rank_avg": 0.23750732839107513, "step": 2575, "valid_targets_mean": 3960.6, "valid_targets_min": 1329 }, { "epoch": 4.615384615384615, "grad_norm": 0.5616936308653787, "learning_rate": 1.2571520311133012e-05, "loss": 0.2627, "loss_nan_ranks": 0, "loss_rank_avg": 0.26292529702186584, "step": 2580, "valid_targets_mean": 4504.7, "valid_targets_min": 1275 }, { "epoch": 4.624329159212881, "grad_norm": 0.5518910049186732, "learning_rate": 1.2488752881300514e-05, "loss": 0.2539, "loss_nan_ranks": 0, "loss_rank_avg": 0.2535983920097351, "step": 2585, "valid_targets_mean": 3939.8, "valid_targets_min": 1386 }, { "epoch": 4.633273703041145, "grad_norm": 0.5256431179864964, "learning_rate": 1.2406134943840398e-05, "loss": 0.2496, "loss_nan_ranks": 0, "loss_rank_avg": 0.2522655129432678, "step": 2590, "valid_targets_mean": 4140.9, "valid_targets_min": 474 }, { "epoch": 4.64221824686941, "grad_norm": 0.5048588742383056, "learning_rate": 1.232366814305372e-05, "loss": 0.2498, "loss_nan_ranks": 0, "loss_rank_avg": 0.24697677791118622, "step": 2595, "valid_targets_mean": 4505.9, "valid_targets_min": 1820 }, { "epoch": 4.651162790697675, "grad_norm": 0.6135798826851775, "learning_rate": 1.2241354120233527e-05, "loss": 0.2609, "loss_nan_ranks": 0, "loss_rank_avg": 0.27449357509613037, "step": 2600, "valid_targets_mean": 3534.1, "valid_targets_min": 1231 }, { "epoch": 4.660107334525939, "grad_norm": 0.5407420740372647, "learning_rate": 1.2159194513632213e-05, "loss": 0.2619, "loss_nan_ranks": 0, "loss_rank_avg": 0.2621440589427948, "step": 2605, "valid_targets_mean": 3698.6, "valid_targets_min": 625 }, { "epoch": 4.669051878354204, "grad_norm": 0.5784897601072413, "learning_rate": 1.20771909584289e-05, "loss": 0.2683, "loss_nan_ranks": 0, "loss_rank_avg": 0.2809554934501648, "step": 2610, "valid_targets_mean": 4114.5, "valid_targets_min": 1649 }, { "epoch": 4.677996422182469, "grad_norm": 0.5583707405753705, "learning_rate": 1.1995345086696919e-05, "loss": 0.2593, "loss_nan_ranks": 0, "loss_rank_avg": 0.265133798122406, "step": 2615, "valid_targets_mean": 4105.6, "valid_targets_min": 1769 }, { "epoch": 4.6869409660107335, "grad_norm": 0.5899963254378155, "learning_rate": 1.1913658527371284e-05, "loss": 0.2642, "loss_nan_ranks": 0, "loss_rank_avg": 0.2800382077693939, "step": 2620, "valid_targets_mean": 3958.2, "valid_targets_min": 1014 }, { "epoch": 4.695885509838998, "grad_norm": 0.5666305355030801, "learning_rate": 1.1832132906216314e-05, "loss": 0.2681, "loss_nan_ranks": 0, "loss_rank_avg": 0.27610641717910767, "step": 2625, "valid_targets_mean": 3627.1, "valid_targets_min": 734 }, { "epoch": 4.704830053667263, "grad_norm": 0.48544029558526913, "learning_rate": 1.1750769845793268e-05, "loss": 0.2629, "loss_nan_ranks": 0, "loss_rank_avg": 0.25514447689056396, "step": 2630, "valid_targets_mean": 4717.1, "valid_targets_min": 767 }, { "epoch": 4.713774597495528, "grad_norm": 0.5191718129231461, "learning_rate": 1.1669570965428028e-05, "loss": 0.2708, "loss_nan_ranks": 0, "loss_rank_avg": 0.28754234313964844, "step": 2635, "valid_targets_mean": 4340.2, "valid_targets_min": 1685 }, { "epoch": 4.722719141323792, "grad_norm": 0.5824564729383654, "learning_rate": 1.1588537881178902e-05, "loss": 0.2545, "loss_nan_ranks": 0, "loss_rank_avg": 0.259286105632782, "step": 2640, "valid_targets_mean": 3709.2, "valid_targets_min": 1083 }, { "epoch": 4.731663685152057, "grad_norm": 0.6199061316983084, "learning_rate": 1.150767220580444e-05, "loss": 0.2628, "loss_nan_ranks": 0, "loss_rank_avg": 0.264919638633728, "step": 2645, "valid_targets_mean": 3604.6, "valid_targets_min": 1544 }, { "epoch": 4.740608228980322, "grad_norm": 0.4746750054946057, "learning_rate": 1.1426975548731329e-05, "loss": 0.2587, "loss_nan_ranks": 0, "loss_rank_avg": 0.21649254858493805, "step": 2650, "valid_targets_mean": 4358.8, "valid_targets_min": 1497 }, { "epoch": 4.7495527728085865, "grad_norm": 0.6094545797228554, "learning_rate": 1.1346449516022395e-05, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.26640570163726807, "step": 2655, "valid_targets_mean": 3034.4, "valid_targets_min": 529 }, { "epoch": 4.758497316636851, "grad_norm": 0.5341381722241784, "learning_rate": 1.1266095710344611e-05, "loss": 0.261, "loss_nan_ranks": 0, "loss_rank_avg": 0.2599736154079437, "step": 2660, "valid_targets_mean": 4056.6, "valid_targets_min": 748 }, { "epoch": 4.767441860465116, "grad_norm": 0.5450354818964038, "learning_rate": 1.1185915730937209e-05, "loss": 0.2554, "loss_nan_ranks": 0, "loss_rank_avg": 0.2556326985359192, "step": 2665, "valid_targets_mean": 3869.1, "valid_targets_min": 1724 }, { "epoch": 4.7763864042933815, "grad_norm": 0.5823841949915403, "learning_rate": 1.1105911173579831e-05, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.2735878527164459, "step": 2670, "valid_targets_mean": 3594.8, "valid_targets_min": 1608 }, { "epoch": 4.785330948121646, "grad_norm": 0.5282126999205208, "learning_rate": 1.1026083630560814e-05, "loss": 0.2526, "loss_nan_ranks": 0, "loss_rank_avg": 0.26514312624931335, "step": 2675, "valid_targets_mean": 4371.6, "valid_targets_min": 1156 }, { "epoch": 4.794275491949911, "grad_norm": 0.5463930991787092, "learning_rate": 1.0946434690645446e-05, "loss": 0.2611, "loss_nan_ranks": 0, "loss_rank_avg": 0.2594326138496399, "step": 2680, "valid_targets_mean": 4857.9, "valid_targets_min": 2646 }, { "epoch": 4.803220035778176, "grad_norm": 0.4924897165473573, "learning_rate": 1.08669659390444e-05, "loss": 0.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.2588515281677246, "step": 2685, "valid_targets_mean": 4642.6, "valid_targets_min": 2325 }, { "epoch": 4.81216457960644, "grad_norm": 0.4976503303623363, "learning_rate": 1.0787678957382124e-05, "loss": 0.2516, "loss_nan_ranks": 0, "loss_rank_avg": 0.268010675907135, "step": 2690, "valid_targets_mean": 4382.6, "valid_targets_min": 1666 }, { "epoch": 4.821109123434705, "grad_norm": 0.5302669946862639, "learning_rate": 1.0708575323665422e-05, "loss": 0.2561, "loss_nan_ranks": 0, "loss_rank_avg": 0.25757157802581787, "step": 2695, "valid_targets_mean": 3814.4, "valid_targets_min": 1832 }, { "epoch": 4.83005366726297, "grad_norm": 0.546113045209434, "learning_rate": 1.062965661225201e-05, "loss": 0.2636, "loss_nan_ranks": 0, "loss_rank_avg": 0.2852606773376465, "step": 2700, "valid_targets_mean": 4466.5, "valid_targets_min": 1706 }, { "epoch": 4.838998211091234, "grad_norm": 0.508464282119227, "learning_rate": 1.0550924393819204e-05, "loss": 0.2638, "loss_nan_ranks": 0, "loss_rank_avg": 0.2477300763130188, "step": 2705, "valid_targets_mean": 4274.6, "valid_targets_min": 1461 }, { "epoch": 4.847942754919499, "grad_norm": 0.5908025845080628, "learning_rate": 1.0472380235332631e-05, "loss": 0.2632, "loss_nan_ranks": 0, "loss_rank_avg": 0.26860788464546204, "step": 2710, "valid_targets_mean": 3469.6, "valid_targets_min": 1287 }, { "epoch": 4.856887298747764, "grad_norm": 0.49449536043979037, "learning_rate": 1.0394025700015064e-05, "loss": 0.2601, "loss_nan_ranks": 0, "loss_rank_avg": 0.2539494037628174, "step": 2715, "valid_targets_mean": 5158.5, "valid_targets_min": 1956 }, { "epoch": 4.8658318425760285, "grad_norm": 0.5211386908969953, "learning_rate": 1.0315862347315314e-05, "loss": 0.263, "loss_nan_ranks": 0, "loss_rank_avg": 0.26820501685142517, "step": 2720, "valid_targets_mean": 4476.4, "valid_targets_min": 1901 }, { "epoch": 4.874776386404293, "grad_norm": 0.5544257720104306, "learning_rate": 1.0237891732877202e-05, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.2941119372844696, "step": 2725, "valid_targets_mean": 4002.2, "valid_targets_min": 1560 }, { "epoch": 4.883720930232558, "grad_norm": 0.5465940219798077, "learning_rate": 1.0160115408508533e-05, "loss": 0.2693, "loss_nan_ranks": 0, "loss_rank_avg": 0.26257503032684326, "step": 2730, "valid_targets_mean": 3682.9, "valid_targets_min": 950 }, { "epoch": 4.892665474060823, "grad_norm": 0.5476342559629205, "learning_rate": 1.008253492215031e-05, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.2684975862503052, "step": 2735, "valid_targets_mean": 4095.6, "valid_targets_min": 1925 }, { "epoch": 4.901610017889087, "grad_norm": 0.5180846052234739, "learning_rate": 1.0005151817845853e-05, "loss": 0.2729, "loss_nan_ranks": 0, "loss_rank_avg": 0.2808322012424469, "step": 2740, "valid_targets_mean": 4175.7, "valid_targets_min": 2464 }, { "epoch": 4.910554561717352, "grad_norm": 0.5936981738189633, "learning_rate": 9.927967635710087e-06, "loss": 0.2516, "loss_nan_ranks": 0, "loss_rank_avg": 0.24229755997657776, "step": 2745, "valid_targets_mean": 4147.9, "valid_targets_min": 914 }, { "epoch": 4.919499105545617, "grad_norm": 0.5464370878938494, "learning_rate": 9.850983911898913e-06, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.24679221212863922, "step": 2750, "valid_targets_mean": 3841.9, "valid_targets_min": 877 }, { "epoch": 4.928443649373882, "grad_norm": 0.5334187085612581, "learning_rate": 9.774202178578592e-06, "loss": 0.2531, "loss_nan_ranks": 0, "loss_rank_avg": 0.2615172863006592, "step": 2755, "valid_targets_mean": 3857.0, "valid_targets_min": 622 }, { "epoch": 4.937388193202147, "grad_norm": 0.5666627948297285, "learning_rate": 9.69762396389529e-06, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.2589084804058075, "step": 2760, "valid_targets_mean": 3624.9, "valid_targets_min": 1519 }, { "epoch": 4.946332737030412, "grad_norm": 0.5273284504363817, "learning_rate": 9.621250791944659e-06, "loss": 0.2627, "loss_nan_ranks": 0, "loss_rank_avg": 0.2510490417480469, "step": 2765, "valid_targets_mean": 5004.1, "valid_targets_min": 1979 }, { "epoch": 4.9552772808586765, "grad_norm": 0.6220423946842822, "learning_rate": 9.545084182741476e-06, "loss": 0.2723, "loss_nan_ranks": 0, "loss_rank_avg": 0.2961236536502838, "step": 2770, "valid_targets_mean": 3909.4, "valid_targets_min": 657 }, { "epoch": 4.964221824686941, "grad_norm": 0.6418856659491654, "learning_rate": 9.469125652189403e-06, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.28539496660232544, "step": 2775, "valid_targets_mean": 3030.6, "valid_targets_min": 575 }, { "epoch": 4.973166368515206, "grad_norm": 0.5309277403670316, "learning_rate": 9.393376712050847e-06, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.2643331289291382, "step": 2780, "valid_targets_mean": 4088.8, "valid_targets_min": 848 }, { "epoch": 4.982110912343471, "grad_norm": 0.6124698201076337, "learning_rate": 9.317838869916835e-06, "loss": 0.2632, "loss_nan_ranks": 0, "loss_rank_avg": 0.28254374861717224, "step": 2785, "valid_targets_mean": 3677.6, "valid_targets_min": 1521 }, { "epoch": 4.991055456171735, "grad_norm": 0.7441462785686875, "learning_rate": 9.242513629177033e-06, "loss": 0.261, "loss_nan_ranks": 0, "loss_rank_avg": 0.27683040499687195, "step": 2790, "valid_targets_mean": 3313.4, "valid_targets_min": 627 }, { "epoch": 5.0, "grad_norm": 0.5230399259211697, "learning_rate": 9.167402488989784e-06, "loss": 0.2555, "loss_nan_ranks": 0, "loss_rank_avg": 0.25869959592819214, "step": 2795, "valid_targets_mean": 3854.7, "valid_targets_min": 743 }, { "epoch": 5.008944543828265, "grad_norm": 0.5549552542784999, "learning_rate": 9.092506944252344e-06, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.2471010535955429, "step": 2800, "valid_targets_mean": 4048.8, "valid_targets_min": 1320 }, { "epoch": 5.017889087656529, "grad_norm": 0.5147728124256338, "learning_rate": 9.017828485571044e-06, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.23798583447933197, "step": 2805, "valid_targets_mean": 4106.8, "valid_targets_min": 937 }, { "epoch": 5.026833631484794, "grad_norm": 0.5315317178738851, "learning_rate": 8.943368599231706e-06, "loss": 0.2644, "loss_nan_ranks": 0, "loss_rank_avg": 0.2732792794704437, "step": 2810, "valid_targets_mean": 4333.1, "valid_targets_min": 2013 }, { "epoch": 5.035778175313059, "grad_norm": 0.5729446923576372, "learning_rate": 8.869128767169986e-06, "loss": 0.2424, "loss_nan_ranks": 0, "loss_rank_avg": 0.2487604320049286, "step": 2815, "valid_targets_mean": 4101.1, "valid_targets_min": 1705 }, { "epoch": 5.0447227191413235, "grad_norm": 0.5034079404779742, "learning_rate": 8.79511046694194e-06, "loss": 0.2608, "loss_nan_ranks": 0, "loss_rank_avg": 0.26576727628707886, "step": 2820, "valid_targets_mean": 5089.2, "valid_targets_min": 2511 }, { "epoch": 5.053667262969588, "grad_norm": 0.6023654856445056, "learning_rate": 8.721315171694591e-06, "loss": 0.2452, "loss_nan_ranks": 0, "loss_rank_avg": 0.25126317143440247, "step": 2825, "valid_targets_mean": 3496.4, "valid_targets_min": 690 }, { "epoch": 5.062611806797853, "grad_norm": 0.6689786638114392, "learning_rate": 8.647744350136612e-06, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.24577105045318604, "step": 2830, "valid_targets_mean": 2972.4, "valid_targets_min": 732 }, { "epoch": 5.071556350626118, "grad_norm": 0.5438242397653636, "learning_rate": 8.574399466509085e-06, "loss": 0.2551, "loss_nan_ranks": 0, "loss_rank_avg": 0.26564639806747437, "step": 2835, "valid_targets_mean": 3876.6, "valid_targets_min": 1618 }, { "epoch": 5.080500894454383, "grad_norm": 0.6404762750457129, "learning_rate": 8.501281980556369e-06, "loss": 0.2638, "loss_nan_ranks": 0, "loss_rank_avg": 0.2322574257850647, "step": 2840, "valid_targets_mean": 3335.4, "valid_targets_min": 1755 }, { "epoch": 5.089445438282648, "grad_norm": 0.5158771438098722, "learning_rate": 8.428393347497057e-06, "loss": 0.2549, "loss_nan_ranks": 0, "loss_rank_avg": 0.2659394145011902, "step": 2845, "valid_targets_mean": 4493.7, "valid_targets_min": 2239 }, { "epoch": 5.098389982110913, "grad_norm": 0.563631894055807, "learning_rate": 8.355735017995011e-06, "loss": 0.2518, "loss_nan_ranks": 0, "loss_rank_avg": 0.23874777555465698, "step": 2850, "valid_targets_mean": 3666.8, "valid_targets_min": 754 }, { "epoch": 5.107334525939177, "grad_norm": 0.5264091725894624, "learning_rate": 8.283308438130458e-06, "loss": 0.2557, "loss_nan_ranks": 0, "loss_rank_avg": 0.28656524419784546, "step": 2855, "valid_targets_mean": 4860.7, "valid_targets_min": 1880 }, { "epoch": 5.116279069767442, "grad_norm": 0.5531684984629897, "learning_rate": 8.211115049371266e-06, "loss": 0.2478, "loss_nan_ranks": 0, "loss_rank_avg": 0.25294798612594604, "step": 2860, "valid_targets_mean": 4066.2, "valid_targets_min": 634 }, { "epoch": 5.125223613595707, "grad_norm": 0.5887989735486293, "learning_rate": 8.13915628854419e-06, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.27043190598487854, "step": 2865, "valid_targets_mean": 3563.4, "valid_targets_min": 737 }, { "epoch": 5.1341681574239715, "grad_norm": 0.6198216758291454, "learning_rate": 8.067433587806336e-06, "loss": 0.2588, "loss_nan_ranks": 0, "loss_rank_avg": 0.2664569318294525, "step": 2870, "valid_targets_mean": 3196.0, "valid_targets_min": 646 }, { "epoch": 5.143112701252236, "grad_norm": 0.49039197556547504, "learning_rate": 7.995948374616628e-06, "loss": 0.2449, "loss_nan_ranks": 0, "loss_rank_avg": 0.24738174676895142, "step": 2875, "valid_targets_mean": 4813.1, "valid_targets_min": 1748 }, { "epoch": 5.152057245080501, "grad_norm": 0.5124249703499617, "learning_rate": 7.924702071707386e-06, "loss": 0.2482, "loss_nan_ranks": 0, "loss_rank_avg": 0.22936435043811798, "step": 2880, "valid_targets_mean": 4589.9, "valid_targets_min": 669 }, { "epoch": 5.161001788908766, "grad_norm": 0.5356467322668551, "learning_rate": 7.853696097056037e-06, "loss": 0.2582, "loss_nan_ranks": 0, "loss_rank_avg": 0.264324426651001, "step": 2885, "valid_targets_mean": 4108.2, "valid_targets_min": 1605 }, { "epoch": 5.16994633273703, "grad_norm": 0.5087262397528598, "learning_rate": 7.782931863856888e-06, "loss": 0.248, "loss_nan_ranks": 0, "loss_rank_avg": 0.23341549932956696, "step": 2890, "valid_targets_mean": 4439.1, "valid_targets_min": 1726 }, { "epoch": 5.178890876565295, "grad_norm": 0.5549321487561256, "learning_rate": 7.71241078049298e-06, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.25444790720939636, "step": 2895, "valid_targets_mean": 4032.2, "valid_targets_min": 1642 }, { "epoch": 5.18783542039356, "grad_norm": 0.5352806321855557, "learning_rate": 7.642134250508069e-06, "loss": 0.2452, "loss_nan_ranks": 0, "loss_rank_avg": 0.24765413999557495, "step": 2900, "valid_targets_mean": 4077.3, "valid_targets_min": 1757 }, { "epoch": 5.196779964221824, "grad_norm": 0.5518211501366974, "learning_rate": 7.57210367257871e-06, "loss": 0.2655, "loss_nan_ranks": 0, "loss_rank_avg": 0.24627630412578583, "step": 2905, "valid_targets_mean": 4041.1, "valid_targets_min": 1350 }, { "epoch": 5.205724508050089, "grad_norm": 0.5517560537112484, "learning_rate": 7.502320440486399e-06, "loss": 0.2516, "loss_nan_ranks": 0, "loss_rank_avg": 0.27135342359542847, "step": 2910, "valid_targets_mean": 4264.5, "valid_targets_min": 1184 }, { "epoch": 5.214669051878354, "grad_norm": 0.5509625444275201, "learning_rate": 7.4327859430898445e-06, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.2660328149795532, "step": 2915, "valid_targets_mean": 4360.2, "valid_targets_min": 1551 }, { "epoch": 5.2236135957066185, "grad_norm": 0.5264725135537257, "learning_rate": 7.363501564297302e-06, "loss": 0.2503, "loss_nan_ranks": 0, "loss_rank_avg": 0.2478117048740387, "step": 2920, "valid_targets_mean": 4145.1, "valid_targets_min": 1811 }, { "epoch": 5.232558139534884, "grad_norm": 0.5015055063053451, "learning_rate": 7.294468683039058e-06, "loss": 0.2595, "loss_nan_ranks": 0, "loss_rank_avg": 0.24327683448791504, "step": 2925, "valid_targets_mean": 4711.1, "valid_targets_min": 714 }, { "epoch": 5.241502683363149, "grad_norm": 0.5747369854441176, "learning_rate": 7.225688673239981e-06, "loss": 0.2512, "loss_nan_ranks": 0, "loss_rank_avg": 0.24569492042064667, "step": 2930, "valid_targets_mean": 4338.2, "valid_targets_min": 687 }, { "epoch": 5.2504472271914135, "grad_norm": 0.558577994633376, "learning_rate": 7.1571629037921804e-06, "loss": 0.2526, "loss_nan_ranks": 0, "loss_rank_avg": 0.28280454874038696, "step": 2935, "valid_targets_mean": 4211.2, "valid_targets_min": 2352 }, { "epoch": 5.259391771019678, "grad_norm": 0.6144056807907267, "learning_rate": 7.088892738527731e-06, "loss": 0.2608, "loss_nan_ranks": 0, "loss_rank_avg": 0.2709640562534332, "step": 2940, "valid_targets_mean": 4119.1, "valid_targets_min": 1206 }, { "epoch": 5.268336314847943, "grad_norm": 0.5107272318888509, "learning_rate": 7.020879536191571e-06, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.26789391040802, "step": 2945, "valid_targets_mean": 4640.5, "valid_targets_min": 1448 }, { "epoch": 5.277280858676208, "grad_norm": 0.5541009190577022, "learning_rate": 6.953124650414447e-06, "loss": 0.2512, "loss_nan_ranks": 0, "loss_rank_avg": 0.2534041404724121, "step": 2950, "valid_targets_mean": 4751.1, "valid_targets_min": 1213 }, { "epoch": 5.286225402504472, "grad_norm": 0.6514472569289943, "learning_rate": 6.885629429685943e-06, "loss": 0.2599, "loss_nan_ranks": 0, "loss_rank_avg": 0.2853846251964569, "step": 2955, "valid_targets_mean": 4381.8, "valid_targets_min": 1086 }, { "epoch": 5.295169946332737, "grad_norm": 0.5988322541910981, "learning_rate": 6.818395217327696e-06, "loss": 0.2577, "loss_nan_ranks": 0, "loss_rank_avg": 0.25575023889541626, "step": 2960, "valid_targets_mean": 3193.8, "valid_targets_min": 1521 }, { "epoch": 5.304114490161002, "grad_norm": 0.5670506850205758, "learning_rate": 6.751423351466604e-06, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.23857812583446503, "step": 2965, "valid_targets_mean": 4116.7, "valid_targets_min": 2343 }, { "epoch": 5.3130590339892665, "grad_norm": 0.5218993251194615, "learning_rate": 6.684715165008242e-06, "loss": 0.2511, "loss_nan_ranks": 0, "loss_rank_avg": 0.24250607192516327, "step": 2970, "valid_targets_mean": 4213.7, "valid_targets_min": 712 }, { "epoch": 5.322003577817531, "grad_norm": 0.5569832821022914, "learning_rate": 6.618271985610316e-06, "loss": 0.2516, "loss_nan_ranks": 0, "loss_rank_avg": 0.2601429224014282, "step": 2975, "valid_targets_mean": 4093.6, "valid_targets_min": 1465 }, { "epoch": 5.330948121645796, "grad_norm": 0.5257447628225279, "learning_rate": 6.552095135656211e-06, "loss": 0.252, "loss_nan_ranks": 0, "loss_rank_avg": 0.22466397285461426, "step": 2980, "valid_targets_mean": 4426.8, "valid_targets_min": 1498 }, { "epoch": 5.339892665474061, "grad_norm": 0.5288226075745489, "learning_rate": 6.486185932228732e-06, "loss": 0.2495, "loss_nan_ranks": 0, "loss_rank_avg": 0.23786196112632751, "step": 2985, "valid_targets_mean": 4234.4, "valid_targets_min": 947 }, { "epoch": 5.348837209302325, "grad_norm": 0.5316983597863091, "learning_rate": 6.420545687083823e-06, "loss": 0.2453, "loss_nan_ranks": 0, "loss_rank_avg": 0.2561112642288208, "step": 2990, "valid_targets_mean": 4393.5, "valid_targets_min": 1639 }, { "epoch": 5.35778175313059, "grad_norm": 0.6336255850890024, "learning_rate": 6.355175706624521e-06, "loss": 0.2516, "loss_nan_ranks": 0, "loss_rank_avg": 0.24200129508972168, "step": 2995, "valid_targets_mean": 2892.8, "valid_targets_min": 1724 }, { "epoch": 5.366726296958855, "grad_norm": 0.5790999887623745, "learning_rate": 6.290077291874923e-06, "loss": 0.2472, "loss_nan_ranks": 0, "loss_rank_avg": 0.25445109605789185, "step": 3000, "valid_targets_mean": 3687.9, "valid_targets_min": 1561 }, { "epoch": 5.375670840787119, "grad_norm": 0.6224285293408105, "learning_rate": 6.225251738454281e-06, "loss": 0.2558, "loss_nan_ranks": 0, "loss_rank_avg": 0.2375735342502594, "step": 3005, "valid_targets_mean": 3882.3, "valid_targets_min": 1924 }, { "epoch": 5.384615384615385, "grad_norm": 0.5037477615762228, "learning_rate": 6.160700336551246e-06, "loss": 0.2484, "loss_nan_ranks": 0, "loss_rank_avg": 0.22593946754932404, "step": 3010, "valid_targets_mean": 4476.9, "valid_targets_min": 1419 }, { "epoch": 5.39355992844365, "grad_norm": 0.5857014550270156, "learning_rate": 6.096424370898186e-06, "loss": 0.2563, "loss_nan_ranks": 0, "loss_rank_avg": 0.26964280009269714, "step": 3015, "valid_targets_mean": 3775.2, "valid_targets_min": 942 }, { "epoch": 5.402504472271914, "grad_norm": 0.5658229988053839, "learning_rate": 6.032425120745586e-06, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.2709835171699524, "step": 3020, "valid_targets_mean": 3667.1, "valid_targets_min": 1957 }, { "epoch": 5.411449016100179, "grad_norm": 0.5988261907445214, "learning_rate": 5.968703859836615e-06, "loss": 0.2562, "loss_nan_ranks": 0, "loss_rank_avg": 0.2751755118370056, "step": 3025, "valid_targets_mean": 3496.3, "valid_targets_min": 671 }, { "epoch": 5.420393559928444, "grad_norm": 0.5141241348502327, "learning_rate": 5.905261856381779e-06, "loss": 0.257, "loss_nan_ranks": 0, "loss_rank_avg": 0.2791970372200012, "step": 3030, "valid_targets_mean": 4357.8, "valid_targets_min": 1171 }, { "epoch": 5.4293381037567086, "grad_norm": 0.5498788228367728, "learning_rate": 5.8421003730336635e-06, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.2511694133281708, "step": 3035, "valid_targets_mean": 3824.6, "valid_targets_min": 1185 }, { "epoch": 5.438282647584973, "grad_norm": 0.6029343448549779, "learning_rate": 5.77922066686182e-06, "loss": 0.2482, "loss_nan_ranks": 0, "loss_rank_avg": 0.243141770362854, "step": 3040, "valid_targets_mean": 3373.0, "valid_targets_min": 823 }, { "epoch": 5.447227191413238, "grad_norm": 0.5131367304880754, "learning_rate": 5.716623989327723e-06, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.2467704713344574, "step": 3045, "valid_targets_mean": 4253.5, "valid_targets_min": 1483 }, { "epoch": 5.456171735241503, "grad_norm": 0.5805462950603849, "learning_rate": 5.654311586259882e-06, "loss": 0.25, "loss_nan_ranks": 0, "loss_rank_avg": 0.23988988995552063, "step": 3050, "valid_targets_mean": 4065.0, "valid_targets_min": 2083 }, { "epoch": 5.465116279069767, "grad_norm": 0.5715523149741332, "learning_rate": 5.592284697829049e-06, "loss": 0.2435, "loss_nan_ranks": 0, "loss_rank_avg": 0.2494080364704132, "step": 3055, "valid_targets_mean": 3334.1, "valid_targets_min": 734 }, { "epoch": 5.474060822898032, "grad_norm": 0.5721433275869938, "learning_rate": 5.5305445585235315e-06, "loss": 0.2598, "loss_nan_ranks": 0, "loss_rank_avg": 0.28742748498916626, "step": 3060, "valid_targets_mean": 3750.8, "valid_targets_min": 1385 }, { "epoch": 5.483005366726297, "grad_norm": 0.5114459072142161, "learning_rate": 5.469092397124609e-06, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.2271006852388382, "step": 3065, "valid_targets_mean": 4397.1, "valid_targets_min": 1489 }, { "epoch": 5.4919499105545615, "grad_norm": 0.5521229518692201, "learning_rate": 5.407929436682098e-06, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.25235363841056824, "step": 3070, "valid_targets_mean": 4136.6, "valid_targets_min": 1627 }, { "epoch": 5.500894454382826, "grad_norm": 0.5402233613552551, "learning_rate": 5.347056894490006e-06, "loss": 0.2514, "loss_nan_ranks": 0, "loss_rank_avg": 0.2618515193462372, "step": 3075, "valid_targets_mean": 4445.6, "valid_targets_min": 1844 }, { "epoch": 5.509838998211091, "grad_norm": 0.5533934913144476, "learning_rate": 5.286475982062283e-06, "loss": 0.2572, "loss_nan_ranks": 0, "loss_rank_avg": 0.26157045364379883, "step": 3080, "valid_targets_mean": 4031.0, "valid_targets_min": 1056 }, { "epoch": 5.518783542039356, "grad_norm": 0.5110038510091776, "learning_rate": 5.226187905108746e-06, "loss": 0.2628, "loss_nan_ranks": 0, "loss_rank_avg": 0.2799553871154785, "step": 3085, "valid_targets_mean": 4822.0, "valid_targets_min": 1524 }, { "epoch": 5.52772808586762, "grad_norm": 0.6041299965242917, "learning_rate": 5.166193863511046e-06, "loss": 0.2478, "loss_nan_ranks": 0, "loss_rank_avg": 0.25382912158966064, "step": 3090, "valid_targets_mean": 4463.2, "valid_targets_min": 1625 }, { "epoch": 5.536672629695886, "grad_norm": 0.523055625256692, "learning_rate": 5.106495051298815e-06, "loss": 0.2601, "loss_nan_ranks": 0, "loss_rank_avg": 0.26213690638542175, "step": 3095, "valid_targets_mean": 4872.1, "valid_targets_min": 1339 }, { "epoch": 5.545617173524151, "grad_norm": 0.689189142486139, "learning_rate": 5.047092656625887e-06, "loss": 0.2464, "loss_nan_ranks": 0, "loss_rank_avg": 0.22535747289657593, "step": 3100, "valid_targets_mean": 4960.2, "valid_targets_min": 1725 }, { "epoch": 5.554561717352415, "grad_norm": 0.5703961451507539, "learning_rate": 4.98798786174667e-06, "loss": 0.2567, "loss_nan_ranks": 0, "loss_rank_avg": 0.23777396976947784, "step": 3105, "valid_targets_mean": 3530.8, "valid_targets_min": 1099 }, { "epoch": 5.56350626118068, "grad_norm": 0.5659413248498028, "learning_rate": 4.9291818429925585e-06, "loss": 0.2503, "loss_nan_ranks": 0, "loss_rank_avg": 0.2758846580982208, "step": 3110, "valid_targets_mean": 3740.4, "valid_targets_min": 1606 }, { "epoch": 5.572450805008945, "grad_norm": 0.6859304017050197, "learning_rate": 4.8706757707486075e-06, "loss": 0.2556, "loss_nan_ranks": 0, "loss_rank_avg": 0.24378885328769684, "step": 3115, "valid_targets_mean": 4183.4, "valid_targets_min": 1253 }, { "epoch": 5.5813953488372094, "grad_norm": 0.8010245971038674, "learning_rate": 4.812470809430179e-06, "loss": 0.2506, "loss_nan_ranks": 0, "loss_rank_avg": 0.2438773214817047, "step": 3120, "valid_targets_mean": 4535.4, "valid_targets_min": 1654 }, { "epoch": 5.590339892665474, "grad_norm": 0.48380553908118173, "learning_rate": 4.754568117459788e-06, "loss": 0.2514, "loss_nan_ranks": 0, "loss_rank_avg": 0.23566769063472748, "step": 3125, "valid_targets_mean": 4967.9, "valid_targets_min": 2282 }, { "epoch": 5.599284436493739, "grad_norm": 0.555628362724338, "learning_rate": 4.69696884724403e-06, "loss": 0.2587, "loss_nan_ranks": 0, "loss_rank_avg": 0.26789629459381104, "step": 3130, "valid_targets_mean": 3930.6, "valid_targets_min": 1612 }, { "epoch": 5.608228980322004, "grad_norm": 0.5726463627079651, "learning_rate": 4.639674145150679e-06, "loss": 0.2703, "loss_nan_ranks": 0, "loss_rank_avg": 0.27078795433044434, "step": 3135, "valid_targets_mean": 4010.0, "valid_targets_min": 2215 }, { "epoch": 5.617173524150268, "grad_norm": 0.5160136519489497, "learning_rate": 4.582685151485826e-06, "loss": 0.254, "loss_nan_ranks": 0, "loss_rank_avg": 0.2637634873390198, "step": 3140, "valid_targets_mean": 4663.4, "valid_targets_min": 1675 }, { "epoch": 5.626118067978533, "grad_norm": 0.5831172100665993, "learning_rate": 4.526003000471238e-06, "loss": 0.252, "loss_nan_ranks": 0, "loss_rank_avg": 0.25619733333587646, "step": 3145, "valid_targets_mean": 3704.6, "valid_targets_min": 1062 }, { "epoch": 5.635062611806798, "grad_norm": 0.5228549236039476, "learning_rate": 4.469628820221723e-06, "loss": 0.2481, "loss_nan_ranks": 0, "loss_rank_avg": 0.25507116317749023, "step": 3150, "valid_targets_mean": 4272.4, "valid_targets_min": 1740 }, { "epoch": 5.644007155635062, "grad_norm": 0.5442853215358627, "learning_rate": 4.4135637327227365e-06, "loss": 0.2489, "loss_nan_ranks": 0, "loss_rank_avg": 0.24775390326976776, "step": 3155, "valid_targets_mean": 4432.6, "valid_targets_min": 2006 }, { "epoch": 5.652951699463327, "grad_norm": 0.6205216192517241, "learning_rate": 4.357808853808014e-06, "loss": 0.2484, "loss_nan_ranks": 0, "loss_rank_avg": 0.26101428270339966, "step": 3160, "valid_targets_mean": 3737.1, "valid_targets_min": 644 }, { "epoch": 5.661896243291592, "grad_norm": 0.5132795398550757, "learning_rate": 4.302365293137383e-06, "loss": 0.2558, "loss_nan_ranks": 0, "loss_rank_avg": 0.2703346014022827, "step": 3165, "valid_targets_mean": 4475.0, "valid_targets_min": 1557 }, { "epoch": 5.6708407871198565, "grad_norm": 0.5446296655760452, "learning_rate": 4.247234154174649e-06, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.261799693107605, "step": 3170, "valid_targets_mean": 4172.8, "valid_targets_min": 823 }, { "epoch": 5.679785330948121, "grad_norm": 0.5219059793104994, "learning_rate": 4.192416534165666e-06, "loss": 0.2551, "loss_nan_ranks": 0, "loss_rank_avg": 0.2537573277950287, "step": 3175, "valid_targets_mean": 4267.9, "valid_targets_min": 579 }, { "epoch": 5.688729874776387, "grad_norm": 0.5461673557485848, "learning_rate": 4.137913524116488e-06, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.2290881723165512, "step": 3180, "valid_targets_mean": 4211.2, "valid_targets_min": 818 }, { "epoch": 5.6976744186046515, "grad_norm": 0.517997717225711, "learning_rate": 4.083726208771653e-06, "loss": 0.2514, "loss_nan_ranks": 0, "loss_rank_avg": 0.25634273886680603, "step": 3185, "valid_targets_mean": 4610.6, "valid_targets_min": 1674 }, { "epoch": 5.706618962432916, "grad_norm": 0.5213271875253821, "learning_rate": 4.0298556665925996e-06, "loss": 0.2611, "loss_nan_ranks": 0, "loss_rank_avg": 0.27138853073120117, "step": 3190, "valid_targets_mean": 4529.8, "valid_targets_min": 1865 }, { "epoch": 5.715563506261181, "grad_norm": 0.546634737650849, "learning_rate": 3.976302969736183e-06, "loss": 0.2587, "loss_nan_ranks": 0, "loss_rank_avg": 0.2496567666530609, "step": 3195, "valid_targets_mean": 3815.2, "valid_targets_min": 932 }, { "epoch": 5.724508050089446, "grad_norm": 0.5258705612970683, "learning_rate": 3.923069184033357e-06, "loss": 0.2509, "loss_nan_ranks": 0, "loss_rank_avg": 0.23271816968917847, "step": 3200, "valid_targets_mean": 4088.2, "valid_targets_min": 2116 }, { "epoch": 5.73345259391771, "grad_norm": 0.5867279766106626, "learning_rate": 3.870155368967963e-06, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.25471609830856323, "step": 3205, "valid_targets_mean": 3395.8, "valid_targets_min": 1808 }, { "epoch": 5.742397137745975, "grad_norm": 0.5656851680671992, "learning_rate": 3.8175625776556354e-06, "loss": 0.2578, "loss_nan_ranks": 0, "loss_rank_avg": 0.26453453302383423, "step": 3210, "valid_targets_mean": 4103.0, "valid_targets_min": 786 }, { "epoch": 5.75134168157424, "grad_norm": 0.5284899901213221, "learning_rate": 3.76529185682283e-06, "loss": 0.2562, "loss_nan_ranks": 0, "loss_rank_avg": 0.24859002232551575, "step": 3215, "valid_targets_mean": 4613.4, "valid_targets_min": 1303 }, { "epoch": 5.7602862254025045, "grad_norm": 0.5635253947920319, "learning_rate": 3.7133442467860215e-06, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.24023880064487457, "step": 3220, "valid_targets_mean": 3926.2, "valid_targets_min": 822 }, { "epoch": 5.769230769230769, "grad_norm": 0.6683290106994736, "learning_rate": 3.6617207814309686e-06, "loss": 0.2535, "loss_nan_ranks": 0, "loss_rank_avg": 0.24666255712509155, "step": 3225, "valid_targets_mean": 3464.2, "valid_targets_min": 1681 }, { "epoch": 5.778175313059034, "grad_norm": 0.5711365259269587, "learning_rate": 3.610422488192169e-06, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.22737815976142883, "step": 3230, "valid_targets_mean": 3654.8, "valid_targets_min": 1601 }, { "epoch": 5.787119856887299, "grad_norm": 0.5262566407141166, "learning_rate": 3.559450388032355e-06, "loss": 0.2405, "loss_nan_ranks": 0, "loss_rank_avg": 0.23528073728084564, "step": 3235, "valid_targets_mean": 4000.4, "valid_targets_min": 1795 }, { "epoch": 5.796064400715563, "grad_norm": 0.5857070524704964, "learning_rate": 3.508805495422247e-06, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.25850462913513184, "step": 3240, "valid_targets_mean": 3548.4, "valid_targets_min": 2027 }, { "epoch": 5.805008944543828, "grad_norm": 0.5422739378299365, "learning_rate": 3.4584888183203134e-06, "loss": 0.2454, "loss_nan_ranks": 0, "loss_rank_avg": 0.23234635591506958, "step": 3245, "valid_targets_mean": 3974.6, "valid_targets_min": 1831 }, { "epoch": 5.813953488372093, "grad_norm": 0.5467138164186622, "learning_rate": 3.4085013581527295e-06, "loss": 0.2502, "loss_nan_ranks": 0, "loss_rank_avg": 0.25337696075439453, "step": 3250, "valid_targets_mean": 3679.7, "valid_targets_min": 1793 }, { "epoch": 5.822898032200357, "grad_norm": 0.5923423600872293, "learning_rate": 3.3588441097934223e-06, "loss": 0.2552, "loss_nan_ranks": 0, "loss_rank_avg": 0.27606481313705444, "step": 3255, "valid_targets_mean": 4041.6, "valid_targets_min": 1902 }, { "epoch": 5.831842576028622, "grad_norm": 0.544712722817465, "learning_rate": 3.30951806154431e-06, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.24701544642448425, "step": 3260, "valid_targets_mean": 4252.6, "valid_targets_min": 1603 }, { "epoch": 5.840787119856888, "grad_norm": 0.5682646260679644, "learning_rate": 3.260524195115595e-06, "loss": 0.2527, "loss_nan_ranks": 0, "loss_rank_avg": 0.2743680477142334, "step": 3265, "valid_targets_mean": 4033.4, "valid_targets_min": 1567 }, { "epoch": 5.849731663685152, "grad_norm": 0.5053561115203649, "learning_rate": 3.2118634856062546e-06, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.25195997953414917, "step": 3270, "valid_targets_mean": 4670.6, "valid_targets_min": 1711 }, { "epoch": 5.858676207513417, "grad_norm": 0.5720698542136006, "learning_rate": 3.163536901484601e-06, "loss": 0.2579, "loss_nan_ranks": 0, "loss_rank_avg": 0.25598081946372986, "step": 3275, "valid_targets_mean": 3693.4, "valid_targets_min": 850 }, { "epoch": 5.867620751341682, "grad_norm": 0.5504159278631617, "learning_rate": 3.115545404569045e-06, "loss": 0.2491, "loss_nan_ranks": 0, "loss_rank_avg": 0.2605506181716919, "step": 3280, "valid_targets_mean": 3985.3, "valid_targets_min": 1494 }, { "epoch": 5.8765652951699465, "grad_norm": 0.5073092549610757, "learning_rate": 3.0678899500089244e-06, "loss": 0.2593, "loss_nan_ranks": 0, "loss_rank_avg": 0.28743916749954224, "step": 3285, "valid_targets_mean": 5028.8, "valid_targets_min": 2241 }, { "epoch": 5.885509838998211, "grad_norm": 0.5340456565641353, "learning_rate": 3.0205714862655135e-06, "loss": 0.2539, "loss_nan_ranks": 0, "loss_rank_avg": 0.2738155722618103, "step": 3290, "valid_targets_mean": 4406.5, "valid_targets_min": 1014 }, { "epoch": 5.894454382826476, "grad_norm": 0.5891360814807866, "learning_rate": 2.973590955093124e-06, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.26489949226379395, "step": 3295, "valid_targets_mean": 3631.4, "valid_targets_min": 1316 }, { "epoch": 5.903398926654741, "grad_norm": 0.606826380313794, "learning_rate": 2.9269492915203735e-06, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.28875553607940674, "step": 3300, "valid_targets_mean": 3582.3, "valid_targets_min": 748 }, { "epoch": 5.912343470483005, "grad_norm": 0.5117519052350044, "learning_rate": 2.880647423831591e-06, "loss": 0.2548, "loss_nan_ranks": 0, "loss_rank_avg": 0.2642664909362793, "step": 3305, "valid_targets_mean": 5080.2, "valid_targets_min": 747 }, { "epoch": 5.92128801431127, "grad_norm": 0.5806379654175979, "learning_rate": 2.8346862735483215e-06, "loss": 0.2522, "loss_nan_ranks": 0, "loss_rank_avg": 0.2645312547683716, "step": 3310, "valid_targets_mean": 3762.3, "valid_targets_min": 1805 }, { "epoch": 5.930232558139535, "grad_norm": 0.5311509065424678, "learning_rate": 2.789066755410994e-06, "loss": 0.2488, "loss_nan_ranks": 0, "loss_rank_avg": 0.2585093379020691, "step": 3315, "valid_targets_mean": 4278.2, "valid_targets_min": 1326 }, { "epoch": 5.9391771019677995, "grad_norm": 0.5936285800316835, "learning_rate": 2.7437897773607102e-06, "loss": 0.2559, "loss_nan_ranks": 0, "loss_rank_avg": 0.26041656732559204, "step": 3320, "valid_targets_mean": 3442.7, "valid_targets_min": 1502 }, { "epoch": 5.948121645796064, "grad_norm": 0.5459969266201287, "learning_rate": 2.698856240521173e-06, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.25794172286987305, "step": 3325, "valid_targets_mean": 4014.2, "valid_targets_min": 1551 }, { "epoch": 5.957066189624329, "grad_norm": 0.5630581255206843, "learning_rate": 2.6542670391807667e-06, "loss": 0.2533, "loss_nan_ranks": 0, "loss_rank_avg": 0.24545322358608246, "step": 3330, "valid_targets_mean": 3481.9, "valid_targets_min": 1557 }, { "epoch": 5.966010733452594, "grad_norm": 0.5799194413488256, "learning_rate": 2.610023060774749e-06, "loss": 0.2549, "loss_nan_ranks": 0, "loss_rank_avg": 0.2724427580833435, "step": 3335, "valid_targets_mean": 3878.4, "valid_targets_min": 702 }, { "epoch": 5.974955277280858, "grad_norm": 0.5740945458943522, "learning_rate": 2.566125185867576e-06, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.23313261568546295, "step": 3340, "valid_targets_mean": 3677.9, "valid_targets_min": 923 }, { "epoch": 5.983899821109123, "grad_norm": 0.4939353323910504, "learning_rate": 2.5225742881354043e-06, "loss": 0.2455, "loss_nan_ranks": 0, "loss_rank_avg": 0.23637865483760834, "step": 3345, "valid_targets_mean": 5144.5, "valid_targets_min": 2196 }, { "epoch": 5.992844364937389, "grad_norm": 0.5709249769648037, "learning_rate": 2.479371234348682e-06, "loss": 0.2718, "loss_nan_ranks": 0, "loss_rank_avg": 0.2716667056083679, "step": 3350, "valid_targets_mean": 4413.6, "valid_targets_min": 1591 }, { "epoch": 6.001788908765653, "grad_norm": 0.49922306688966933, "learning_rate": 2.4365168843549e-06, "loss": 0.2583, "loss_nan_ranks": 0, "loss_rank_avg": 0.24928270280361176, "step": 3355, "valid_targets_mean": 4612.2, "valid_targets_min": 1207 }, { "epoch": 6.010733452593918, "grad_norm": 0.5555093196620423, "learning_rate": 2.3940120910614774e-06, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.2676859498023987, "step": 3360, "valid_targets_mean": 3853.4, "valid_targets_min": 1449 }, { "epoch": 6.019677996422183, "grad_norm": 0.5566602842743498, "learning_rate": 2.351857700418807e-06, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.2452341467142105, "step": 3365, "valid_targets_mean": 4434.4, "valid_targets_min": 777 }, { "epoch": 6.028622540250447, "grad_norm": 0.5088695531600443, "learning_rate": 2.310054551403391e-06, "loss": 0.2387, "loss_nan_ranks": 0, "loss_rank_avg": 0.2538371682167053, "step": 3370, "valid_targets_mean": 4775.4, "valid_targets_min": 1902 }, { "epoch": 6.037567084078712, "grad_norm": 0.5558924991251052, "learning_rate": 2.2686034760011656e-06, "loss": 0.2435, "loss_nan_ranks": 0, "loss_rank_avg": 0.23813003301620483, "step": 3375, "valid_targets_mean": 3898.2, "valid_targets_min": 1674 }, { "epoch": 6.046511627906977, "grad_norm": 0.5591093005835225, "learning_rate": 2.2275052991909218e-06, "loss": 0.2417, "loss_nan_ranks": 0, "loss_rank_avg": 0.21672865748405457, "step": 3380, "valid_targets_mean": 4234.8, "valid_targets_min": 671 }, { "epoch": 6.0554561717352415, "grad_norm": 0.5260886376788583, "learning_rate": 2.186760838927897e-06, "loss": 0.2507, "loss_nan_ranks": 0, "loss_rank_avg": 0.22722241282463074, "step": 3385, "valid_targets_mean": 4410.5, "valid_targets_min": 575 }, { "epoch": 6.064400715563506, "grad_norm": 0.5613980727726008, "learning_rate": 2.146370906127506e-06, "loss": 0.2408, "loss_nan_ranks": 0, "loss_rank_avg": 0.2486397624015808, "step": 3390, "valid_targets_mean": 3953.5, "valid_targets_min": 1297 }, { "epoch": 6.073345259391771, "grad_norm": 0.5718364438676335, "learning_rate": 2.1063363046491813e-06, "loss": 0.2404, "loss_nan_ranks": 0, "loss_rank_avg": 0.24342885613441467, "step": 3395, "valid_targets_mean": 4326.2, "valid_targets_min": 1784 }, { "epoch": 6.082289803220036, "grad_norm": 0.5484733914155208, "learning_rate": 2.0666578312803942e-06, "loss": 0.2488, "loss_nan_ranks": 0, "loss_rank_avg": 0.23995618522167206, "step": 3400, "valid_targets_mean": 4243.8, "valid_targets_min": 1656 }, { "epoch": 6.0912343470483, "grad_norm": 0.6076003177346635, "learning_rate": 2.0273362757207726e-06, "loss": 0.2529, "loss_nan_ranks": 0, "loss_rank_avg": 0.2636367678642273, "step": 3405, "valid_targets_mean": 3371.1, "valid_targets_min": 700 }, { "epoch": 6.100178890876565, "grad_norm": 0.5364865052473711, "learning_rate": 1.988372420566416e-06, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.2631525993347168, "step": 3410, "valid_targets_mean": 4552.2, "valid_targets_min": 527 }, { "epoch": 6.10912343470483, "grad_norm": 0.5382573273538706, "learning_rate": 1.9497670412942835e-06, "loss": 0.2434, "loss_nan_ranks": 0, "loss_rank_avg": 0.25336796045303345, "step": 3415, "valid_targets_mean": 4031.2, "valid_targets_min": 1500 }, { "epoch": 6.1180679785330945, "grad_norm": 0.5332393694448714, "learning_rate": 1.9115209062467954e-06, "loss": 0.248, "loss_nan_ranks": 0, "loss_rank_avg": 0.25488486886024475, "step": 3420, "valid_targets_mean": 4084.2, "valid_targets_min": 1073 }, { "epoch": 6.127012522361359, "grad_norm": 0.5822463874616248, "learning_rate": 1.8736347766165086e-06, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.25610625743865967, "step": 3425, "valid_targets_mean": 3508.5, "valid_targets_min": 644 }, { "epoch": 6.135957066189624, "grad_norm": 0.516320931889104, "learning_rate": 1.8361094064309993e-06, "loss": 0.2523, "loss_nan_ranks": 0, "loss_rank_avg": 0.26783958077430725, "step": 3430, "valid_targets_mean": 4032.3, "valid_targets_min": 1287 }, { "epoch": 6.1449016100178895, "grad_norm": 0.5331137313762538, "learning_rate": 1.7989455425378266e-06, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.2545079290866852, "step": 3435, "valid_targets_mean": 4148.0, "valid_targets_min": 1830 }, { "epoch": 6.153846153846154, "grad_norm": 0.511372820106071, "learning_rate": 1.7621439245896943e-06, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.25283390283584595, "step": 3440, "valid_targets_mean": 4522.1, "valid_targets_min": 1614 }, { "epoch": 6.162790697674419, "grad_norm": 0.642569852208313, "learning_rate": 1.7257052850296996e-06, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.24894089996814728, "step": 3445, "valid_targets_mean": 3752.3, "valid_targets_min": 697 }, { "epoch": 6.171735241502684, "grad_norm": 0.5666144603072086, "learning_rate": 1.6896303490767829e-06, "loss": 0.2418, "loss_nan_ranks": 0, "loss_rank_avg": 0.24932259321212769, "step": 3450, "valid_targets_mean": 3750.7, "valid_targets_min": 1707 }, { "epoch": 6.180679785330948, "grad_norm": 0.5143915126274258, "learning_rate": 1.6539198347112884e-06, "loss": 0.245, "loss_nan_ranks": 0, "loss_rank_avg": 0.2590116560459137, "step": 3455, "valid_targets_mean": 4465.8, "valid_targets_min": 1477 }, { "epoch": 6.189624329159213, "grad_norm": 0.5657080432140568, "learning_rate": 1.6185744526606706e-06, "loss": 0.2248, "loss_nan_ranks": 0, "loss_rank_avg": 0.22567050158977509, "step": 3460, "valid_targets_mean": 4094.5, "valid_targets_min": 1981 }, { "epoch": 6.198568872987478, "grad_norm": 0.6089266321722668, "learning_rate": 1.583594906385335e-06, "loss": 0.2516, "loss_nan_ranks": 0, "loss_rank_avg": 0.2387622594833374, "step": 3465, "valid_targets_mean": 4029.4, "valid_targets_min": 1928 }, { "epoch": 6.207513416815742, "grad_norm": 0.4852359479822391, "learning_rate": 1.548981892064665e-06, "loss": 0.2574, "loss_nan_ranks": 0, "loss_rank_avg": 0.24283546209335327, "step": 3470, "valid_targets_mean": 5261.4, "valid_targets_min": 1062 }, { "epoch": 6.216457960644007, "grad_norm": 0.4537685331486559, "learning_rate": 1.5147360985831516e-06, "loss": 0.2465, "loss_nan_ranks": 0, "loss_rank_avg": 0.21774128079414368, "step": 3475, "valid_targets_mean": 5369.9, "valid_targets_min": 3175 }, { "epoch": 6.225402504472272, "grad_norm": 0.5236024964731602, "learning_rate": 1.4808582075166778e-06, "loss": 0.2487, "loss_nan_ranks": 0, "loss_rank_avg": 0.25047406554222107, "step": 3480, "valid_targets_mean": 4213.7, "valid_targets_min": 1750 }, { "epoch": 6.2343470483005365, "grad_norm": 0.594758118058126, "learning_rate": 1.447348893118965e-06, "loss": 0.2446, "loss_nan_ranks": 0, "loss_rank_avg": 0.2589150667190552, "step": 3485, "valid_targets_mean": 3918.9, "valid_targets_min": 2197 }, { "epoch": 6.243291592128801, "grad_norm": 0.5390376277621793, "learning_rate": 1.4142088223081408e-06, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.24606183171272278, "step": 3490, "valid_targets_mean": 4628.6, "valid_targets_min": 2230 }, { "epoch": 6.252236135957066, "grad_norm": 0.515173541243895, "learning_rate": 1.3814386546534864e-06, "loss": 0.253, "loss_nan_ranks": 0, "loss_rank_avg": 0.2567700147628784, "step": 3495, "valid_targets_mean": 4171.9, "valid_targets_min": 1779 }, { "epoch": 6.261180679785331, "grad_norm": 0.5308974195526618, "learning_rate": 1.3490390423622856e-06, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.22043094038963318, "step": 3500, "valid_targets_mean": 4421.9, "valid_targets_min": 1412 }, { "epoch": 6.270125223613595, "grad_norm": 0.5045875631623113, "learning_rate": 1.3170106302668616e-06, "loss": 0.2455, "loss_nan_ranks": 0, "loss_rank_avg": 0.23024529218673706, "step": 3505, "valid_targets_mean": 4453.3, "valid_targets_min": 1660 }, { "epoch": 6.27906976744186, "grad_norm": 0.5448476578553636, "learning_rate": 1.2853540558117272e-06, "loss": 0.2454, "loss_nan_ranks": 0, "loss_rank_avg": 0.24999341368675232, "step": 3510, "valid_targets_mean": 4241.5, "valid_targets_min": 1712 }, { "epoch": 6.288014311270125, "grad_norm": 0.5759478717126266, "learning_rate": 1.254069949040917e-06, "loss": 0.254, "loss_nan_ranks": 0, "loss_rank_avg": 0.25016283988952637, "step": 3515, "valid_targets_mean": 3847.2, "valid_targets_min": 669 }, { "epoch": 6.29695885509839, "grad_norm": 0.542415226047018, "learning_rate": 1.2231589325854354e-06, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.2293107956647873, "step": 3520, "valid_targets_mean": 4337.9, "valid_targets_min": 1502 }, { "epoch": 6.305903398926655, "grad_norm": 0.5091719583649115, "learning_rate": 1.1926216216508735e-06, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.25717687606811523, "step": 3525, "valid_targets_mean": 4432.9, "valid_targets_min": 737 }, { "epoch": 6.31484794275492, "grad_norm": 0.4941207542833962, "learning_rate": 1.162458624005145e-06, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.24258843064308167, "step": 3530, "valid_targets_mean": 4559.1, "valid_targets_min": 1824 }, { "epoch": 6.3237924865831845, "grad_norm": 0.5967014559288393, "learning_rate": 1.1326705399664207e-06, "loss": 0.2451, "loss_nan_ranks": 0, "loss_rank_avg": 0.23474426567554474, "step": 3535, "valid_targets_mean": 3250.2, "valid_targets_min": 1600 }, { "epoch": 6.332737030411449, "grad_norm": 0.5207543513220922, "learning_rate": 1.103257962391151e-06, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.24193906784057617, "step": 3540, "valid_targets_mean": 4304.2, "valid_targets_min": 763 }, { "epoch": 6.341681574239714, "grad_norm": 0.5920796448944554, "learning_rate": 1.0742214766622938e-06, "loss": 0.2523, "loss_nan_ranks": 0, "loss_rank_avg": 0.2564089596271515, "step": 3545, "valid_targets_mean": 3882.9, "valid_targets_min": 579 }, { "epoch": 6.350626118067979, "grad_norm": 0.5232360068927403, "learning_rate": 1.0455616606776363e-06, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.2539476156234741, "step": 3550, "valid_targets_mean": 3925.2, "valid_targets_min": 805 }, { "epoch": 6.359570661896243, "grad_norm": 0.4866461666276335, "learning_rate": 1.0172790848383141e-06, "loss": 0.2435, "loss_nan_ranks": 0, "loss_rank_avg": 0.24338996410369873, "step": 3555, "valid_targets_mean": 4900.0, "valid_targets_min": 2526 }, { "epoch": 6.368515205724508, "grad_norm": 0.5299824855199575, "learning_rate": 9.893743120374543e-07, "loss": 0.2465, "loss_nan_ranks": 0, "loss_rank_avg": 0.24363267421722412, "step": 3560, "valid_targets_mean": 3905.7, "valid_targets_min": 1083 }, { "epoch": 6.377459749552773, "grad_norm": 0.5642560950283441, "learning_rate": 9.618478976489709e-07, "loss": 0.2517, "loss_nan_ranks": 0, "loss_rank_avg": 0.23905110359191895, "step": 3565, "valid_targets_mean": 4138.6, "valid_targets_min": 856 }, { "epoch": 6.386404293381037, "grad_norm": 0.5115018928118804, "learning_rate": 9.347003895165052e-07, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.26956266164779663, "step": 3570, "valid_targets_mean": 5040.1, "valid_targets_min": 1505 }, { "epoch": 6.395348837209302, "grad_norm": 0.5710236424221047, "learning_rate": 9.079323279425245e-07, "loss": 0.2532, "loss_nan_ranks": 0, "loss_rank_avg": 0.2561646103858948, "step": 3575, "valid_targets_mean": 4197.1, "valid_targets_min": 1158 }, { "epoch": 6.404293381037567, "grad_norm": 0.5054247186866906, "learning_rate": 8.815442456775835e-07, "loss": 0.249, "loss_nan_ranks": 0, "loss_rank_avg": 0.25438791513442993, "step": 3580, "valid_targets_mean": 4520.4, "valid_targets_min": 1430 }, { "epoch": 6.4132379248658316, "grad_norm": 0.5325941678660696, "learning_rate": 8.555366679097043e-07, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.24359354376792908, "step": 3585, "valid_targets_mean": 4353.4, "valid_targets_min": 1339 }, { "epoch": 6.422182468694096, "grad_norm": 0.5189637715129809, "learning_rate": 8.29910112253931e-07, "loss": 0.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.2488621473312378, "step": 3590, "valid_targets_mean": 4283.8, "valid_targets_min": 2266 }, { "epoch": 6.431127012522361, "grad_norm": 0.5866424542601351, "learning_rate": 8.046650887420227e-07, "loss": 0.2456, "loss_nan_ranks": 0, "loss_rank_avg": 0.26135364174842834, "step": 3595, "valid_targets_mean": 3206.2, "valid_targets_min": 1617 }, { "epoch": 6.440071556350626, "grad_norm": 0.5499318781593886, "learning_rate": 7.798020998123101e-07, "loss": 0.2471, "loss_nan_ranks": 0, "loss_rank_avg": 0.2563382685184479, "step": 3600, "valid_targets_mean": 4393.6, "valid_targets_min": 710 }, { "epoch": 6.449016100178891, "grad_norm": 0.5310211310663512, "learning_rate": 7.55321640299691e-07, "loss": 0.248, "loss_nan_ranks": 0, "loss_rank_avg": 0.25477510690689087, "step": 3605, "valid_targets_mean": 4263.4, "valid_targets_min": 2011 }, { "epoch": 6.457960644007156, "grad_norm": 0.560059078942515, "learning_rate": 7.312241974257861e-07, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.2293008267879486, "step": 3610, "valid_targets_mean": 3617.6, "valid_targets_min": 1590 }, { "epoch": 6.466905187835421, "grad_norm": 0.5267478780824102, "learning_rate": 7.075102507892295e-07, "loss": 0.247, "loss_nan_ranks": 0, "loss_rank_avg": 0.23703113198280334, "step": 3615, "valid_targets_mean": 4467.4, "valid_targets_min": 1654 }, { "epoch": 6.475849731663685, "grad_norm": 0.5537266130087152, "learning_rate": 6.841802723561408e-07, "loss": 0.2325, "loss_nan_ranks": 0, "loss_rank_avg": 0.241033136844635, "step": 3620, "valid_targets_mean": 4434.5, "valid_targets_min": 680 }, { "epoch": 6.48479427549195, "grad_norm": 0.5258675827998067, "learning_rate": 6.612347264507257e-07, "loss": 0.2569, "loss_nan_ranks": 0, "loss_rank_avg": 0.23057600855827332, "step": 3625, "valid_targets_mean": 4508.6, "valid_targets_min": 1675 }, { "epoch": 6.493738819320215, "grad_norm": 0.6060163526427282, "learning_rate": 6.386740697460281e-07, "loss": 0.2582, "loss_nan_ranks": 0, "loss_rank_avg": 0.266754686832428, "step": 3630, "valid_targets_mean": 3405.2, "valid_targets_min": 1494 }, { "epoch": 6.5026833631484795, "grad_norm": 1.243756853379082, "learning_rate": 6.164987512548415e-07, "loss": 0.2425, "loss_nan_ranks": 0, "loss_rank_avg": 0.24251213669776917, "step": 3635, "valid_targets_mean": 4815.0, "valid_targets_min": 748 }, { "epoch": 6.511627906976744, "grad_norm": 0.4905512612650833, "learning_rate": 5.947092123207854e-07, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.2418278455734253, "step": 3640, "valid_targets_mean": 4851.4, "valid_targets_min": 1723 }, { "epoch": 6.520572450805009, "grad_norm": 0.6977038416301831, "learning_rate": 5.733058866095143e-07, "loss": 0.2439, "loss_nan_ranks": 0, "loss_rank_avg": 0.25958025455474854, "step": 3645, "valid_targets_mean": 3321.6, "valid_targets_min": 864 }, { "epoch": 6.529516994633274, "grad_norm": 0.5620237411481044, "learning_rate": 5.522892001000801e-07, "loss": 0.247, "loss_nan_ranks": 0, "loss_rank_avg": 0.25899815559387207, "step": 3650, "valid_targets_mean": 3941.6, "valid_targets_min": 645 }, { "epoch": 6.538461538461538, "grad_norm": 0.5931969111624182, "learning_rate": 5.316595710764594e-07, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.2590034008026123, "step": 3655, "valid_targets_mean": 3292.1, "valid_targets_min": 1140 }, { "epoch": 6.547406082289803, "grad_norm": 0.5619298957004911, "learning_rate": 5.114174101192282e-07, "loss": 0.2551, "loss_nan_ranks": 0, "loss_rank_avg": 0.25470370054244995, "step": 3660, "valid_targets_mean": 4170.2, "valid_targets_min": 1529 }, { "epoch": 6.556350626118068, "grad_norm": 0.5338888004490264, "learning_rate": 4.915631200973958e-07, "loss": 0.2489, "loss_nan_ranks": 0, "loss_rank_avg": 0.23330549895763397, "step": 3665, "valid_targets_mean": 4152.4, "valid_targets_min": 1548 }, { "epoch": 6.565295169946332, "grad_norm": 0.5029110114373035, "learning_rate": 4.7209709616038214e-07, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.2532098591327667, "step": 3670, "valid_targets_mean": 4623.9, "valid_targets_min": 1504 }, { "epoch": 6.574239713774597, "grad_norm": 0.5553623774184658, "learning_rate": 4.5301972573014163e-07, "loss": 0.2498, "loss_nan_ranks": 0, "loss_rank_avg": 0.25203073024749756, "step": 3675, "valid_targets_mean": 4177.2, "valid_targets_min": 954 }, { "epoch": 6.583184257602863, "grad_norm": 0.5645036118540637, "learning_rate": 4.3433138849347854e-07, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.25823813676834106, "step": 3680, "valid_targets_mean": 4475.9, "valid_targets_min": 2315 }, { "epoch": 6.592128801431127, "grad_norm": 0.5703760997362556, "learning_rate": 4.1603245639446845e-07, "loss": 0.2475, "loss_nan_ranks": 0, "loss_rank_avg": 0.24437285959720612, "step": 3685, "valid_targets_mean": 4044.4, "valid_targets_min": 1603 }, { "epoch": 6.601073345259392, "grad_norm": 0.5422079585581118, "learning_rate": 3.981232936270596e-07, "loss": 0.2324, "loss_nan_ranks": 0, "loss_rank_avg": 0.23096385598182678, "step": 3690, "valid_targets_mean": 4084.5, "valid_targets_min": 2212 }, { "epoch": 6.610017889087657, "grad_norm": 0.560268180958077, "learning_rate": 3.806042566278345e-07, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.3074514865875244, "step": 3695, "valid_targets_mean": 4345.9, "valid_targets_min": 1526 }, { "epoch": 6.618962432915922, "grad_norm": 0.5139061022298529, "learning_rate": 3.6347569406890213e-07, "loss": 0.2439, "loss_nan_ranks": 0, "loss_rank_avg": 0.24795208871364594, "step": 3700, "valid_targets_mean": 4453.6, "valid_targets_min": 2173 }, { "epoch": 6.627906976744186, "grad_norm": 0.5732304901299363, "learning_rate": 3.467379468509746e-07, "loss": 0.2512, "loss_nan_ranks": 0, "loss_rank_avg": 0.2507464289665222, "step": 3705, "valid_targets_mean": 3565.4, "valid_targets_min": 1726 }, { "epoch": 6.636851520572451, "grad_norm": 0.5275323599021355, "learning_rate": 3.3039134809656594e-07, "loss": 0.238, "loss_nan_ranks": 0, "loss_rank_avg": 0.25029295682907104, "step": 3710, "valid_targets_mean": 4312.4, "valid_targets_min": 1826 }, { "epoch": 6.645796064400716, "grad_norm": 0.5142402557074688, "learning_rate": 3.144362231433706e-07, "loss": 0.2442, "loss_nan_ranks": 0, "loss_rank_avg": 0.24940407276153564, "step": 3715, "valid_targets_mean": 4422.9, "valid_targets_min": 747 }, { "epoch": 6.65474060822898, "grad_norm": 0.5730417596248877, "learning_rate": 2.9887288953778903e-07, "loss": 0.2564, "loss_nan_ranks": 0, "loss_rank_avg": 0.2630217671394348, "step": 3720, "valid_targets_mean": 4032.0, "valid_targets_min": 1372 }, { "epoch": 6.663685152057245, "grad_norm": 0.554437674633871, "learning_rate": 2.8370165702860553e-07, "loss": 0.2451, "loss_nan_ranks": 0, "loss_rank_avg": 0.26767322421073914, "step": 3725, "valid_targets_mean": 4060.4, "valid_targets_min": 1319 }, { "epoch": 6.67262969588551, "grad_norm": 0.5716086807724999, "learning_rate": 2.6892282756082246e-07, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.23963013291358948, "step": 3730, "valid_targets_mean": 3399.0, "valid_targets_min": 691 }, { "epoch": 6.6815742397137745, "grad_norm": 0.5079641007584742, "learning_rate": 2.545366952696582e-07, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.2464374452829361, "step": 3735, "valid_targets_mean": 4499.1, "valid_targets_min": 1971 }, { "epoch": 6.690518783542039, "grad_norm": 0.9402640194261683, "learning_rate": 2.405435464746786e-07, "loss": 0.264, "loss_nan_ranks": 0, "loss_rank_avg": 0.27681803703308105, "step": 3740, "valid_targets_mean": 3995.8, "valid_targets_min": 656 }, { "epoch": 6.699463327370304, "grad_norm": 0.5895147291124684, "learning_rate": 2.2694365967411258e-07, "loss": 0.2572, "loss_nan_ranks": 0, "loss_rank_avg": 0.26021093130111694, "step": 3745, "valid_targets_mean": 3512.1, "valid_targets_min": 922 }, { "epoch": 6.708407871198569, "grad_norm": 0.5247512021335333, "learning_rate": 2.137373055393055e-07, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.2672116756439209, "step": 3750, "valid_targets_mean": 4461.2, "valid_targets_min": 1031 }, { "epoch": 6.717352415026833, "grad_norm": 0.5648115569047794, "learning_rate": 2.009247469093234e-07, "loss": 0.2372, "loss_nan_ranks": 0, "loss_rank_avg": 0.24653485417366028, "step": 3755, "valid_targets_mean": 3891.8, "valid_targets_min": 1329 }, { "epoch": 6.726296958855098, "grad_norm": 0.5935904883224387, "learning_rate": 1.8850623878573505e-07, "loss": 0.2541, "loss_nan_ranks": 0, "loss_rank_avg": 0.2428642213344574, "step": 3760, "valid_targets_mean": 3706.3, "valid_targets_min": 931 }, { "epoch": 6.735241502683364, "grad_norm": 0.5282006716958451, "learning_rate": 1.7648202832752924e-07, "loss": 0.2583, "loss_nan_ranks": 0, "loss_rank_avg": 0.22287273406982422, "step": 3765, "valid_targets_mean": 4499.3, "valid_targets_min": 1662 }, { "epoch": 6.7441860465116275, "grad_norm": 0.5697571140348834, "learning_rate": 1.6485235484619665e-07, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.25361984968185425, "step": 3770, "valid_targets_mean": 3464.8, "valid_targets_min": 1843 }, { "epoch": 6.753130590339893, "grad_norm": 0.561107497561089, "learning_rate": 1.5361744980096905e-07, "loss": 0.2382, "loss_nan_ranks": 0, "loss_rank_avg": 0.23007211089134216, "step": 3775, "valid_targets_mean": 3861.9, "valid_targets_min": 1742 }, { "epoch": 6.762075134168158, "grad_norm": 0.5240522175257502, "learning_rate": 1.427775367942097e-07, "loss": 0.2564, "loss_nan_ranks": 0, "loss_rank_avg": 0.25991159677505493, "step": 3780, "valid_targets_mean": 4519.6, "valid_targets_min": 1936 }, { "epoch": 6.7710196779964225, "grad_norm": 0.5553928938449468, "learning_rate": 1.3233283156696142e-07, "loss": 0.2437, "loss_nan_ranks": 0, "loss_rank_avg": 0.2548370659351349, "step": 3785, "valid_targets_mean": 3997.4, "valid_targets_min": 621 }, { "epoch": 6.779964221824687, "grad_norm": 0.5074568016914366, "learning_rate": 1.222835419946633e-07, "loss": 0.252, "loss_nan_ranks": 0, "loss_rank_avg": 0.23944196105003357, "step": 3790, "valid_targets_mean": 5238.7, "valid_targets_min": 2620 }, { "epoch": 6.788908765652952, "grad_norm": 0.5333184632049403, "learning_rate": 1.1262986808300291e-07, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.25998786091804504, "step": 3795, "valid_targets_mean": 4385.2, "valid_targets_min": 1617 }, { "epoch": 6.797853309481217, "grad_norm": 0.5068220624841174, "learning_rate": 1.0337200196393505e-07, "loss": 0.2577, "loss_nan_ranks": 0, "loss_rank_avg": 0.25370797514915466, "step": 3800, "valid_targets_mean": 4350.8, "valid_targets_min": 1473 }, { "epoch": 6.806797853309481, "grad_norm": 0.5340749980997674, "learning_rate": 9.451012789186476e-08, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.24803949892520905, "step": 3805, "valid_targets_mean": 4403.3, "valid_targets_min": 784 }, { "epoch": 6.815742397137746, "grad_norm": 0.5465845662554875, "learning_rate": 8.604442223998144e-08, "loss": 0.2621, "loss_nan_ranks": 0, "loss_rank_avg": 0.28449052572250366, "step": 3810, "valid_targets_mean": 4181.7, "valid_targets_min": 1019 }, { "epoch": 6.824686940966011, "grad_norm": 0.5740109665058152, "learning_rate": 7.797505349673496e-08, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.24289534986019135, "step": 3815, "valid_targets_mean": 3507.5, "valid_targets_min": 1523 }, { "epoch": 6.833631484794275, "grad_norm": 0.532987766803314, "learning_rate": 7.030218226250051e-08, "loss": 0.251, "loss_nan_ranks": 0, "loss_rank_avg": 0.24493467807769775, "step": 3820, "valid_targets_mean": 4069.8, "valid_targets_min": 795 }, { "epoch": 6.84257602862254, "grad_norm": 0.6131271407710378, "learning_rate": 6.302596124636573e-08, "loss": 0.2555, "loss_nan_ranks": 0, "loss_rank_avg": 0.2517031729221344, "step": 3825, "valid_targets_mean": 4256.1, "valid_targets_min": 741 }, { "epoch": 6.851520572450805, "grad_norm": 0.5260881026648205, "learning_rate": 5.6146535263106314e-08, "loss": 0.249, "loss_nan_ranks": 0, "loss_rank_avg": 0.22869578003883362, "step": 3830, "valid_targets_mean": 4011.5, "valid_targets_min": 1329 }, { "epoch": 6.8604651162790695, "grad_norm": 0.6127050009448671, "learning_rate": 4.966404123029289e-08, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.2303614318370819, "step": 3835, "valid_targets_mean": 4033.9, "valid_targets_min": 1573 }, { "epoch": 6.869409660107334, "grad_norm": 0.5818917098959172, "learning_rate": 4.357860816557091e-08, "loss": 0.2611, "loss_nan_ranks": 0, "loss_rank_avg": 0.2567775249481201, "step": 3840, "valid_targets_mean": 3792.1, "valid_targets_min": 529 }, { "epoch": 6.878354203935599, "grad_norm": 0.5360181923150845, "learning_rate": 3.789035718408718e-08, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.24667097628116608, "step": 3845, "valid_targets_mean": 3941.6, "valid_targets_min": 1016 }, { "epoch": 6.8872987477638645, "grad_norm": 0.596035881473606, "learning_rate": 3.259940149609175e-08, "loss": 0.2522, "loss_nan_ranks": 0, "loss_rank_avg": 0.278276652097702, "step": 3850, "valid_targets_mean": 3848.6, "valid_targets_min": 884 }, { "epoch": 6.896243291592128, "grad_norm": 0.5426279598087133, "learning_rate": 2.7705846404670888e-08, "loss": 0.2362, "loss_nan_ranks": 0, "loss_rank_avg": 0.25362810492515564, "step": 3855, "valid_targets_mean": 3896.8, "valid_targets_min": 1947 }, { "epoch": 6.905187835420394, "grad_norm": 0.5217040663626972, "learning_rate": 2.3209789303657582e-08, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.24874532222747803, "step": 3860, "valid_targets_mean": 4455.1, "valid_targets_min": 1374 }, { "epoch": 6.914132379248659, "grad_norm": 0.6253844624269363, "learning_rate": 1.9111319675699792e-08, "loss": 0.2447, "loss_nan_ranks": 0, "loss_rank_avg": 0.24061639606952667, "step": 3865, "valid_targets_mean": 4007.6, "valid_targets_min": 1409 }, { "epoch": 6.923076923076923, "grad_norm": 0.600953932839311, "learning_rate": 1.5410519090461872e-08, "loss": 0.2478, "loss_nan_ranks": 0, "loss_rank_avg": 0.25711876153945923, "step": 3870, "valid_targets_mean": 3362.2, "valid_targets_min": 995 }, { "epoch": 6.932021466905188, "grad_norm": 0.5660567298832868, "learning_rate": 1.210746120302142e-08, "loss": 0.2463, "loss_nan_ranks": 0, "loss_rank_avg": 0.2501237392425537, "step": 3875, "valid_targets_mean": 3972.0, "valid_targets_min": 2149 }, { "epoch": 6.940966010733453, "grad_norm": 0.6014456216364971, "learning_rate": 9.202211752386003e-09, "loss": 0.2541, "loss_nan_ranks": 0, "loss_rank_avg": 0.25210267305374146, "step": 3880, "valid_targets_mean": 4391.4, "valid_targets_min": 1615 }, { "epoch": 6.9499105545617175, "grad_norm": 0.5988847243290031, "learning_rate": 6.694828560200872e-09, "loss": 0.2572, "loss_nan_ranks": 0, "loss_rank_avg": 0.2896597385406494, "step": 3885, "valid_targets_mean": 4030.7, "valid_targets_min": 1853 }, { "epoch": 6.958855098389982, "grad_norm": 0.5395682499202165, "learning_rate": 4.585361529581001e-09, "loss": 0.2411, "loss_nan_ranks": 0, "loss_rank_avg": 0.2411486953496933, "step": 3890, "valid_targets_mean": 4078.4, "valid_targets_min": 822 }, { "epoch": 6.967799642218247, "grad_norm": 0.6335748048992399, "learning_rate": 2.87385264413631e-09, "loss": 0.2559, "loss_nan_ranks": 0, "loss_rank_avg": 0.2603016793727875, "step": 3895, "valid_targets_mean": 2954.7, "valid_targets_min": 911 }, { "epoch": 6.976744186046512, "grad_norm": 0.5727655803906435, "learning_rate": 1.560335967114579e-09, "loss": 0.2541, "loss_nan_ranks": 0, "loss_rank_avg": 0.25090134143829346, "step": 3900, "valid_targets_mean": 4419.8, "valid_targets_min": 1517 }, { "epoch": 6.985688729874776, "grad_norm": 0.5157971974589199, "learning_rate": 6.4483764074863e-10, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.2580246329307556, "step": 3905, "valid_targets_mean": 4267.4, "valid_targets_min": 1483 }, { "epoch": 6.994633273703041, "grad_norm": 0.5412701822718862, "learning_rate": 1.273758857145424e-10, "loss": 0.2505, "loss_nan_ranks": 0, "loss_rank_avg": 0.2360781729221344, "step": 3910, "valid_targets_mean": 3865.5, "valid_targets_min": 653 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.23571906983852386, "step": 3913, "total_flos": 1325319151616000.0, "train_loss": 0.29724271997234386, "train_runtime": 27386.6627, "train_samples_per_second": 2.285, "train_steps_per_second": 0.143, "valid_targets_mean": 3601.1, "valid_targets_min": 1303 } ], "logging_steps": 5, "max_steps": 3913, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1325319151616000.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }