{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4606, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.007598784194528876, "grad_norm": 16.54100795724015, "learning_rate": 3.4707158351409984e-07, "loss": 0.6415, "loss_nan_ranks": 0, "loss_rank_avg": 0.6890859603881836, "step": 5, "valid_targets_mean": 4029.6, "valid_targets_min": 742 }, { "epoch": 0.015197568389057751, "grad_norm": 17.760320126405695, "learning_rate": 7.809110629067245e-07, "loss": 0.6735, "loss_nan_ranks": 0, "loss_rank_avg": 0.6768203973770142, "step": 10, "valid_targets_mean": 4724.0, "valid_targets_min": 333 }, { "epoch": 0.022796352583586626, "grad_norm": 14.700502278309516, "learning_rate": 1.2147505422993492e-06, "loss": 0.6621, "loss_nan_ranks": 0, "loss_rank_avg": 0.6386404633522034, "step": 15, "valid_targets_mean": 4853.7, "valid_targets_min": 1059 }, { "epoch": 0.030395136778115502, "grad_norm": 12.016024137339164, "learning_rate": 1.6485900216919743e-06, "loss": 0.6268, "loss_nan_ranks": 0, "loss_rank_avg": 0.6092511415481567, "step": 20, "valid_targets_mean": 5505.4, "valid_targets_min": 2608 }, { "epoch": 0.037993920972644375, "grad_norm": 7.202624222295684, "learning_rate": 2.0824295010845986e-06, "loss": 0.5318, "loss_nan_ranks": 0, "loss_rank_avg": 0.4805890917778015, "step": 25, "valid_targets_mean": 4894.8, "valid_targets_min": 746 }, { "epoch": 0.04559270516717325, "grad_norm": 5.248039681477442, "learning_rate": 2.516268980477224e-06, "loss": 0.5034, "loss_nan_ranks": 0, "loss_rank_avg": 0.5152153372764587, "step": 30, "valid_targets_mean": 4687.7, "valid_targets_min": 1705 }, { "epoch": 0.05319148936170213, "grad_norm": 2.714176181066118, "learning_rate": 2.950108459869848e-06, "loss": 0.4815, "loss_nan_ranks": 0, "loss_rank_avg": 0.4753047823905945, "step": 35, "valid_targets_mean": 4859.7, "valid_targets_min": 456 }, { "epoch": 0.060790273556231005, "grad_norm": 1.7777692231211755, "learning_rate": 3.383947939262473e-06, "loss": 0.4372, "loss_nan_ranks": 0, "loss_rank_avg": 0.4611857831478119, "step": 40, "valid_targets_mean": 4217.9, "valid_targets_min": 741 }, { "epoch": 0.06838905775075987, "grad_norm": 1.3787959870798525, "learning_rate": 3.817787418655098e-06, "loss": 0.4164, "loss_nan_ranks": 0, "loss_rank_avg": 0.4521799385547638, "step": 45, "valid_targets_mean": 3577.2, "valid_targets_min": 525 }, { "epoch": 0.07598784194528875, "grad_norm": 1.0709482777091444, "learning_rate": 4.251626898047723e-06, "loss": 0.4129, "loss_nan_ranks": 0, "loss_rank_avg": 0.45762407779693604, "step": 50, "valid_targets_mean": 4046.8, "valid_targets_min": 847 }, { "epoch": 0.08358662613981763, "grad_norm": 0.8316164594444523, "learning_rate": 4.685466377440348e-06, "loss": 0.3775, "loss_nan_ranks": 0, "loss_rank_avg": 0.38839221000671387, "step": 55, "valid_targets_mean": 5905.9, "valid_targets_min": 1232 }, { "epoch": 0.0911854103343465, "grad_norm": 0.7446660666424425, "learning_rate": 5.1193058568329725e-06, "loss": 0.3891, "loss_nan_ranks": 0, "loss_rank_avg": 0.34218358993530273, "step": 60, "valid_targets_mean": 4599.2, "valid_targets_min": 554 }, { "epoch": 0.09878419452887538, "grad_norm": 0.8425007884341953, "learning_rate": 5.5531453362255974e-06, "loss": 0.3781, "loss_nan_ranks": 0, "loss_rank_avg": 0.36715853214263916, "step": 65, "valid_targets_mean": 4719.6, "valid_targets_min": 590 }, { "epoch": 0.10638297872340426, "grad_norm": 0.6619149306280321, "learning_rate": 5.986984815618222e-06, "loss": 0.3861, "loss_nan_ranks": 0, "loss_rank_avg": 0.3819279968738556, "step": 70, "valid_targets_mean": 4757.8, "valid_targets_min": 881 }, { "epoch": 0.11398176291793313, "grad_norm": 0.5731111234637317, "learning_rate": 6.420824295010846e-06, "loss": 0.3629, "loss_nan_ranks": 0, "loss_rank_avg": 0.3706345558166504, "step": 75, "valid_targets_mean": 5672.5, "valid_targets_min": 1128 }, { "epoch": 0.12158054711246201, "grad_norm": 0.6080686326455707, "learning_rate": 6.854663774403471e-06, "loss": 0.3312, "loss_nan_ranks": 0, "loss_rank_avg": 0.38144651055336, "step": 80, "valid_targets_mean": 4179.6, "valid_targets_min": 814 }, { "epoch": 0.12917933130699089, "grad_norm": 0.6499495432455763, "learning_rate": 7.288503253796096e-06, "loss": 0.3446, "loss_nan_ranks": 0, "loss_rank_avg": 0.3940460979938507, "step": 85, "valid_targets_mean": 4595.6, "valid_targets_min": 583 }, { "epoch": 0.13677811550151975, "grad_norm": 0.4843533852497594, "learning_rate": 7.722342733188721e-06, "loss": 0.332, "loss_nan_ranks": 0, "loss_rank_avg": 0.3182428181171417, "step": 90, "valid_targets_mean": 5585.4, "valid_targets_min": 740 }, { "epoch": 0.14437689969604864, "grad_norm": 0.6242189491842878, "learning_rate": 8.156182212581345e-06, "loss": 0.3316, "loss_nan_ranks": 0, "loss_rank_avg": 0.3119521737098694, "step": 95, "valid_targets_mean": 5690.2, "valid_targets_min": 792 }, { "epoch": 0.1519756838905775, "grad_norm": 0.5346923069880523, "learning_rate": 8.59002169197397e-06, "loss": 0.3313, "loss_nan_ranks": 0, "loss_rank_avg": 0.31788039207458496, "step": 100, "valid_targets_mean": 4587.9, "valid_targets_min": 767 }, { "epoch": 0.1595744680851064, "grad_norm": 0.5073268077298685, "learning_rate": 9.023861171366595e-06, "loss": 0.3194, "loss_nan_ranks": 0, "loss_rank_avg": 0.3051730990409851, "step": 105, "valid_targets_mean": 5143.8, "valid_targets_min": 823 }, { "epoch": 0.16717325227963525, "grad_norm": 0.5467162692473684, "learning_rate": 9.457700650759219e-06, "loss": 0.3018, "loss_nan_ranks": 0, "loss_rank_avg": 0.32401126623153687, "step": 110, "valid_targets_mean": 5420.0, "valid_targets_min": 674 }, { "epoch": 0.17477203647416414, "grad_norm": 0.5541588789236693, "learning_rate": 9.891540130151845e-06, "loss": 0.3334, "loss_nan_ranks": 0, "loss_rank_avg": 0.3607725501060486, "step": 115, "valid_targets_mean": 5116.0, "valid_targets_min": 569 }, { "epoch": 0.182370820668693, "grad_norm": 0.5403092031436869, "learning_rate": 1.032537960954447e-05, "loss": 0.2937, "loss_nan_ranks": 0, "loss_rank_avg": 0.290938138961792, "step": 120, "valid_targets_mean": 4455.6, "valid_targets_min": 1819 }, { "epoch": 0.1899696048632219, "grad_norm": 0.5924655899271373, "learning_rate": 1.0759219088937095e-05, "loss": 0.3343, "loss_nan_ranks": 0, "loss_rank_avg": 0.31885042786598206, "step": 125, "valid_targets_mean": 3642.6, "valid_targets_min": 401 }, { "epoch": 0.19756838905775076, "grad_norm": 0.49980402806514684, "learning_rate": 1.119305856832972e-05, "loss": 0.2857, "loss_nan_ranks": 0, "loss_rank_avg": 0.2728749215602875, "step": 130, "valid_targets_mean": 4462.3, "valid_targets_min": 585 }, { "epoch": 0.20516717325227962, "grad_norm": 0.5224338478901207, "learning_rate": 1.1626898047722344e-05, "loss": 0.2962, "loss_nan_ranks": 0, "loss_rank_avg": 0.29036590456962585, "step": 135, "valid_targets_mean": 4953.9, "valid_targets_min": 901 }, { "epoch": 0.2127659574468085, "grad_norm": 0.5647977318046398, "learning_rate": 1.2060737527114967e-05, "loss": 0.2992, "loss_nan_ranks": 0, "loss_rank_avg": 0.30531400442123413, "step": 140, "valid_targets_mean": 3919.9, "valid_targets_min": 797 }, { "epoch": 0.22036474164133737, "grad_norm": 0.5768676708119788, "learning_rate": 1.2494577006507593e-05, "loss": 0.3144, "loss_nan_ranks": 0, "loss_rank_avg": 0.3926551342010498, "step": 145, "valid_targets_mean": 4445.3, "valid_targets_min": 595 }, { "epoch": 0.22796352583586627, "grad_norm": 0.46004731662025494, "learning_rate": 1.2928416485900217e-05, "loss": 0.2964, "loss_nan_ranks": 0, "loss_rank_avg": 0.23685210943222046, "step": 150, "valid_targets_mean": 4963.2, "valid_targets_min": 1646 }, { "epoch": 0.23556231003039513, "grad_norm": 0.6456923331623713, "learning_rate": 1.3362255965292842e-05, "loss": 0.2947, "loss_nan_ranks": 0, "loss_rank_avg": 0.32530516386032104, "step": 155, "valid_targets_mean": 3147.6, "valid_targets_min": 713 }, { "epoch": 0.24316109422492402, "grad_norm": 0.5132446277120045, "learning_rate": 1.3796095444685466e-05, "loss": 0.2866, "loss_nan_ranks": 0, "loss_rank_avg": 0.3017147481441498, "step": 160, "valid_targets_mean": 5447.2, "valid_targets_min": 662 }, { "epoch": 0.2507598784194529, "grad_norm": 0.5526604062654956, "learning_rate": 1.4229934924078092e-05, "loss": 0.2781, "loss_nan_ranks": 0, "loss_rank_avg": 0.2687798738479614, "step": 165, "valid_targets_mean": 4341.5, "valid_targets_min": 756 }, { "epoch": 0.25835866261398177, "grad_norm": 0.5293460369161004, "learning_rate": 1.4663774403470716e-05, "loss": 0.2804, "loss_nan_ranks": 0, "loss_rank_avg": 0.28431305289268494, "step": 170, "valid_targets_mean": 6130.4, "valid_targets_min": 1724 }, { "epoch": 0.26595744680851063, "grad_norm": 0.5138145073678304, "learning_rate": 1.5097613882863342e-05, "loss": 0.2892, "loss_nan_ranks": 0, "loss_rank_avg": 0.29994410276412964, "step": 175, "valid_targets_mean": 4394.1, "valid_targets_min": 589 }, { "epoch": 0.2735562310030395, "grad_norm": 0.5043230432581788, "learning_rate": 1.5531453362255964e-05, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.2635194659233093, "step": 180, "valid_targets_mean": 4637.4, "valid_targets_min": 588 }, { "epoch": 0.2811550151975684, "grad_norm": 0.5633614566403176, "learning_rate": 1.5965292841648592e-05, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.349490761756897, "step": 185, "valid_targets_mean": 5181.4, "valid_targets_min": 1743 }, { "epoch": 0.2887537993920973, "grad_norm": 0.5633432190899903, "learning_rate": 1.6399132321041216e-05, "loss": 0.2859, "loss_nan_ranks": 0, "loss_rank_avg": 0.28400588035583496, "step": 190, "valid_targets_mean": 4035.6, "valid_targets_min": 1318 }, { "epoch": 0.29635258358662614, "grad_norm": 0.48584306761961266, "learning_rate": 1.6832971800433843e-05, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.2302139550447464, "step": 195, "valid_targets_mean": 5217.0, "valid_targets_min": 1825 }, { "epoch": 0.303951367781155, "grad_norm": 0.5423337122654377, "learning_rate": 1.7266811279826464e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.2699054479598999, "step": 200, "valid_targets_mean": 4060.4, "valid_targets_min": 824 }, { "epoch": 0.31155015197568386, "grad_norm": 0.583883380975703, "learning_rate": 1.770065075921909e-05, "loss": 0.263, "loss_nan_ranks": 0, "loss_rank_avg": 0.28162840008735657, "step": 205, "valid_targets_mean": 4595.1, "valid_targets_min": 446 }, { "epoch": 0.3191489361702128, "grad_norm": 0.5187106940915953, "learning_rate": 1.8134490238611715e-05, "loss": 0.2586, "loss_nan_ranks": 0, "loss_rank_avg": 0.25653451681137085, "step": 210, "valid_targets_mean": 4721.1, "valid_targets_min": 885 }, { "epoch": 0.32674772036474165, "grad_norm": 0.5079241607768279, "learning_rate": 1.856832971800434e-05, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.257007360458374, "step": 215, "valid_targets_mean": 5210.9, "valid_targets_min": 784 }, { "epoch": 0.3343465045592705, "grad_norm": 0.6159525490464162, "learning_rate": 1.9002169197396964e-05, "loss": 0.2707, "loss_nan_ranks": 0, "loss_rank_avg": 0.3035469651222229, "step": 220, "valid_targets_mean": 4253.7, "valid_targets_min": 670 }, { "epoch": 0.34194528875379937, "grad_norm": 0.618048775817979, "learning_rate": 1.9436008676789588e-05, "loss": 0.2914, "loss_nan_ranks": 0, "loss_rank_avg": 0.3232946991920471, "step": 225, "valid_targets_mean": 3915.6, "valid_targets_min": 686 }, { "epoch": 0.3495440729483283, "grad_norm": 0.4988454732686451, "learning_rate": 1.9869848156182215e-05, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.2464175820350647, "step": 230, "valid_targets_mean": 4478.2, "valid_targets_min": 1934 }, { "epoch": 0.35714285714285715, "grad_norm": 0.5788630961414701, "learning_rate": 2.030368763557484e-05, "loss": 0.2697, "loss_nan_ranks": 0, "loss_rank_avg": 0.25093919038772583, "step": 235, "valid_targets_mean": 4403.9, "valid_targets_min": 2002 }, { "epoch": 0.364741641337386, "grad_norm": 0.5727233609316779, "learning_rate": 2.0737527114967463e-05, "loss": 0.2787, "loss_nan_ranks": 0, "loss_rank_avg": 0.2930532693862915, "step": 240, "valid_targets_mean": 3878.2, "valid_targets_min": 683 }, { "epoch": 0.3723404255319149, "grad_norm": 0.507643333171839, "learning_rate": 2.117136659436009e-05, "loss": 0.2612, "loss_nan_ranks": 0, "loss_rank_avg": 0.26503849029541016, "step": 245, "valid_targets_mean": 5116.3, "valid_targets_min": 1771 }, { "epoch": 0.3799392097264438, "grad_norm": 0.5575549222120635, "learning_rate": 2.160520607375271e-05, "loss": 0.239, "loss_nan_ranks": 0, "loss_rank_avg": 0.24154013395309448, "step": 250, "valid_targets_mean": 4581.1, "valid_targets_min": 446 }, { "epoch": 0.38753799392097266, "grad_norm": 0.5133849867561285, "learning_rate": 2.203904555314534e-05, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.2547852694988251, "step": 255, "valid_targets_mean": 4651.8, "valid_targets_min": 434 }, { "epoch": 0.3951367781155015, "grad_norm": 0.46783460540928934, "learning_rate": 2.2472885032537963e-05, "loss": 0.2714, "loss_nan_ranks": 0, "loss_rank_avg": 0.23877258598804474, "step": 260, "valid_targets_mean": 5490.8, "valid_targets_min": 1221 }, { "epoch": 0.4027355623100304, "grad_norm": 0.5446072363730794, "learning_rate": 2.290672451193059e-05, "loss": 0.2643, "loss_nan_ranks": 0, "loss_rank_avg": 0.23716062307357788, "step": 265, "valid_targets_mean": 4415.1, "valid_targets_min": 567 }, { "epoch": 0.41033434650455924, "grad_norm": 0.5076237944415188, "learning_rate": 2.334056399132321e-05, "loss": 0.2406, "loss_nan_ranks": 0, "loss_rank_avg": 0.2342528998851776, "step": 270, "valid_targets_mean": 4982.2, "valid_targets_min": 867 }, { "epoch": 0.41793313069908816, "grad_norm": 0.5204833234773354, "learning_rate": 2.3774403470715835e-05, "loss": 0.2722, "loss_nan_ranks": 0, "loss_rank_avg": 0.24817609786987305, "step": 275, "valid_targets_mean": 4886.1, "valid_targets_min": 1124 }, { "epoch": 0.425531914893617, "grad_norm": 1.1929428353263904, "learning_rate": 2.4208242950108462e-05, "loss": 0.2534, "loss_nan_ranks": 0, "loss_rank_avg": 0.2741398513317108, "step": 280, "valid_targets_mean": 5717.5, "valid_targets_min": 863 }, { "epoch": 0.4331306990881459, "grad_norm": 0.585914448752194, "learning_rate": 2.464208242950109e-05, "loss": 0.2498, "loss_nan_ranks": 0, "loss_rank_avg": 0.27346092462539673, "step": 285, "valid_targets_mean": 4714.8, "valid_targets_min": 738 }, { "epoch": 0.44072948328267475, "grad_norm": 0.6700936401277653, "learning_rate": 2.507592190889371e-05, "loss": 0.2714, "loss_nan_ranks": 0, "loss_rank_avg": 0.3218214511871338, "step": 290, "valid_targets_mean": 3352.8, "valid_targets_min": 665 }, { "epoch": 0.44832826747720367, "grad_norm": 0.5819949812246825, "learning_rate": 2.5509761388286335e-05, "loss": 0.2454, "loss_nan_ranks": 0, "loss_rank_avg": 0.24475443363189697, "step": 295, "valid_targets_mean": 5024.5, "valid_targets_min": 1008 }, { "epoch": 0.45592705167173253, "grad_norm": 0.5564851893611434, "learning_rate": 2.5943600867678962e-05, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.25335440039634705, "step": 300, "valid_targets_mean": 4271.6, "valid_targets_min": 495 }, { "epoch": 0.4635258358662614, "grad_norm": 0.6776311836920197, "learning_rate": 2.637744034707159e-05, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.26621827483177185, "step": 305, "valid_targets_mean": 4792.2, "valid_targets_min": 585 }, { "epoch": 0.47112462006079026, "grad_norm": 0.5014128476072633, "learning_rate": 2.681127982646421e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.23652535676956177, "step": 310, "valid_targets_mean": 5203.9, "valid_targets_min": 631 }, { "epoch": 0.4787234042553192, "grad_norm": 0.5471285546055437, "learning_rate": 2.7245119305856834e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.2725940942764282, "step": 315, "valid_targets_mean": 4777.1, "valid_targets_min": 1762 }, { "epoch": 0.48632218844984804, "grad_norm": 0.5215837029470914, "learning_rate": 2.7678958785249462e-05, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.2674940228462219, "step": 320, "valid_targets_mean": 4912.2, "valid_targets_min": 1286 }, { "epoch": 0.4939209726443769, "grad_norm": 0.5545464098953832, "learning_rate": 2.8112798264642082e-05, "loss": 0.2555, "loss_nan_ranks": 0, "loss_rank_avg": 0.27066224813461304, "step": 325, "valid_targets_mean": 4713.8, "valid_targets_min": 581 }, { "epoch": 0.5015197568389058, "grad_norm": 0.5291981229160326, "learning_rate": 2.854663774403471e-05, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.27261027693748474, "step": 330, "valid_targets_mean": 5018.4, "valid_targets_min": 825 }, { "epoch": 0.5091185410334347, "grad_norm": 0.5927074347019183, "learning_rate": 2.8980477223427334e-05, "loss": 0.249, "loss_nan_ranks": 0, "loss_rank_avg": 0.23593679070472717, "step": 335, "valid_targets_mean": 4369.9, "valid_targets_min": 852 }, { "epoch": 0.5167173252279635, "grad_norm": 0.5613566212263488, "learning_rate": 2.941431670281996e-05, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.25743183493614197, "step": 340, "valid_targets_mean": 4878.5, "valid_targets_min": 736 }, { "epoch": 0.5243161094224924, "grad_norm": 0.43333351737553155, "learning_rate": 2.9848156182212582e-05, "loss": 0.2418, "loss_nan_ranks": 0, "loss_rank_avg": 0.22708739340305328, "step": 345, "valid_targets_mean": 5272.6, "valid_targets_min": 2600 }, { "epoch": 0.5319148936170213, "grad_norm": 0.5349091750560264, "learning_rate": 3.028199566160521e-05, "loss": 0.2484, "loss_nan_ranks": 0, "loss_rank_avg": 0.2423931062221527, "step": 350, "valid_targets_mean": 4710.4, "valid_targets_min": 1708 }, { "epoch": 0.5395136778115501, "grad_norm": 0.552342573882699, "learning_rate": 3.0715835140997834e-05, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.2209261655807495, "step": 355, "valid_targets_mean": 4220.2, "valid_targets_min": 498 }, { "epoch": 0.547112462006079, "grad_norm": 0.47358599117445827, "learning_rate": 3.114967462039046e-05, "loss": 0.2431, "loss_nan_ranks": 0, "loss_rank_avg": 0.22403742372989655, "step": 360, "valid_targets_mean": 5009.1, "valid_targets_min": 826 }, { "epoch": 0.5547112462006079, "grad_norm": 0.5508791979851065, "learning_rate": 3.158351409978308e-05, "loss": 0.271, "loss_nan_ranks": 0, "loss_rank_avg": 0.2744586765766144, "step": 365, "valid_targets_mean": 4221.0, "valid_targets_min": 658 }, { "epoch": 0.5623100303951368, "grad_norm": 0.4880656851972933, "learning_rate": 3.2017353579175706e-05, "loss": 0.257, "loss_nan_ranks": 0, "loss_rank_avg": 0.2102406919002533, "step": 370, "valid_targets_mean": 5021.4, "valid_targets_min": 422 }, { "epoch": 0.5699088145896657, "grad_norm": 0.5066085991817625, "learning_rate": 3.2451193058568337e-05, "loss": 0.2493, "loss_nan_ranks": 0, "loss_rank_avg": 0.220636785030365, "step": 375, "valid_targets_mean": 4511.9, "valid_targets_min": 904 }, { "epoch": 0.5775075987841946, "grad_norm": 0.7189915330518424, "learning_rate": 3.288503253796096e-05, "loss": 0.2561, "loss_nan_ranks": 0, "loss_rank_avg": 0.2566250264644623, "step": 380, "valid_targets_mean": 4385.5, "valid_targets_min": 551 }, { "epoch": 0.5851063829787234, "grad_norm": 0.548460587196264, "learning_rate": 3.331887201735358e-05, "loss": 0.259, "loss_nan_ranks": 0, "loss_rank_avg": 0.23478102684020996, "step": 385, "valid_targets_mean": 4521.1, "valid_targets_min": 940 }, { "epoch": 0.5927051671732523, "grad_norm": 0.7285447421019886, "learning_rate": 3.375271149674621e-05, "loss": 0.2528, "loss_nan_ranks": 0, "loss_rank_avg": 0.2555179297924042, "step": 390, "valid_targets_mean": 3723.9, "valid_targets_min": 409 }, { "epoch": 0.6003039513677811, "grad_norm": 0.5544467667445715, "learning_rate": 3.418655097613883e-05, "loss": 0.2459, "loss_nan_ranks": 0, "loss_rank_avg": 0.2515088617801666, "step": 395, "valid_targets_mean": 4729.4, "valid_targets_min": 791 }, { "epoch": 0.60790273556231, "grad_norm": 0.53995409546225, "learning_rate": 3.462039045553146e-05, "loss": 0.2477, "loss_nan_ranks": 0, "loss_rank_avg": 0.23457960784435272, "step": 400, "valid_targets_mean": 5069.6, "valid_targets_min": 489 }, { "epoch": 0.6155015197568389, "grad_norm": 0.9196646418934739, "learning_rate": 3.505422993492408e-05, "loss": 0.2449, "loss_nan_ranks": 0, "loss_rank_avg": 0.23785921931266785, "step": 405, "valid_targets_mean": 4393.4, "valid_targets_min": 829 }, { "epoch": 0.6231003039513677, "grad_norm": 0.6099790951053485, "learning_rate": 3.5488069414316705e-05, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.23619459569454193, "step": 410, "valid_targets_mean": 3865.0, "valid_targets_min": 1002 }, { "epoch": 0.6306990881458967, "grad_norm": 0.5925560150305617, "learning_rate": 3.592190889370933e-05, "loss": 0.2534, "loss_nan_ranks": 0, "loss_rank_avg": 0.24648156762123108, "step": 415, "valid_targets_mean": 5077.6, "valid_targets_min": 1028 }, { "epoch": 0.6382978723404256, "grad_norm": 0.5334746742630121, "learning_rate": 3.635574837310195e-05, "loss": 0.2337, "loss_nan_ranks": 0, "loss_rank_avg": 0.21448864042758942, "step": 420, "valid_targets_mean": 4616.1, "valid_targets_min": 574 }, { "epoch": 0.6458966565349544, "grad_norm": 0.5167724016109878, "learning_rate": 3.678958785249458e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.230168879032135, "step": 425, "valid_targets_mean": 4870.9, "valid_targets_min": 921 }, { "epoch": 0.6534954407294833, "grad_norm": 0.5454984899416742, "learning_rate": 3.722342733188721e-05, "loss": 0.2439, "loss_nan_ranks": 0, "loss_rank_avg": 0.262331485748291, "step": 430, "valid_targets_mean": 5432.7, "valid_targets_min": 933 }, { "epoch": 0.6610942249240122, "grad_norm": 0.7273049295570767, "learning_rate": 3.765726681127983e-05, "loss": 0.2398, "loss_nan_ranks": 0, "loss_rank_avg": 0.25644373893737793, "step": 435, "valid_targets_mean": 3536.0, "valid_targets_min": 710 }, { "epoch": 0.668693009118541, "grad_norm": 0.5453606831740409, "learning_rate": 3.8091106290672456e-05, "loss": 0.2312, "loss_nan_ranks": 0, "loss_rank_avg": 0.24661529064178467, "step": 440, "valid_targets_mean": 4021.8, "valid_targets_min": 599 }, { "epoch": 0.6762917933130699, "grad_norm": 0.5397724365767885, "learning_rate": 3.852494577006508e-05, "loss": 0.2536, "loss_nan_ranks": 0, "loss_rank_avg": 0.2421499490737915, "step": 445, "valid_targets_mean": 4597.5, "valid_targets_min": 370 }, { "epoch": 0.6838905775075987, "grad_norm": 0.5764238756332084, "learning_rate": 3.8958785249457704e-05, "loss": 0.2261, "loss_nan_ranks": 0, "loss_rank_avg": 0.2172556221485138, "step": 450, "valid_targets_mean": 5077.4, "valid_targets_min": 1299 }, { "epoch": 0.6914893617021277, "grad_norm": 0.5511870862131859, "learning_rate": 3.939262472885033e-05, "loss": 0.2546, "loss_nan_ranks": 0, "loss_rank_avg": 0.23796507716178894, "step": 455, "valid_targets_mean": 3540.4, "valid_targets_min": 781 }, { "epoch": 0.6990881458966566, "grad_norm": 0.5240137590905279, "learning_rate": 3.982646420824295e-05, "loss": 0.2749, "loss_nan_ranks": 0, "loss_rank_avg": 0.3238080143928528, "step": 460, "valid_targets_mean": 6050.4, "valid_targets_min": 921 }, { "epoch": 0.7066869300911854, "grad_norm": 0.504788443919895, "learning_rate": 3.999994829970777e-05, "loss": 0.2519, "loss_nan_ranks": 0, "loss_rank_avg": 0.2535270154476166, "step": 465, "valid_targets_mean": 4623.6, "valid_targets_min": 642 }, { "epoch": 0.7142857142857143, "grad_norm": 0.6552382106268326, "learning_rate": 3.999963235444541e-05, "loss": 0.249, "loss_nan_ranks": 0, "loss_rank_avg": 0.23992504179477692, "step": 470, "valid_targets_mean": 5108.4, "valid_targets_min": 702 }, { "epoch": 0.7218844984802432, "grad_norm": 0.5338400861286152, "learning_rate": 3.999902919083712e-05, "loss": 0.2426, "loss_nan_ranks": 0, "loss_rank_avg": 0.2298986315727234, "step": 475, "valid_targets_mean": 4551.4, "valid_targets_min": 827 }, { "epoch": 0.729483282674772, "grad_norm": 0.4717163253476549, "learning_rate": 3.999813881754504e-05, "loss": 0.2367, "loss_nan_ranks": 0, "loss_rank_avg": 0.22416530549526215, "step": 480, "valid_targets_mean": 5166.6, "valid_targets_min": 2461 }, { "epoch": 0.7370820668693009, "grad_norm": 0.46569192135259724, "learning_rate": 3.999696124735598e-05, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.20350381731987, "step": 485, "valid_targets_mean": 5345.7, "valid_targets_min": 1890 }, { "epoch": 0.7446808510638298, "grad_norm": 0.42173419222407094, "learning_rate": 3.999549649718124e-05, "loss": 0.2325, "loss_nan_ranks": 0, "loss_rank_avg": 0.21917913854122162, "step": 490, "valid_targets_mean": 6391.4, "valid_targets_min": 3738 }, { "epoch": 0.7522796352583586, "grad_norm": 0.5432626540059464, "learning_rate": 3.999374458805636e-05, "loss": 0.2436, "loss_nan_ranks": 0, "loss_rank_avg": 0.2308879792690277, "step": 495, "valid_targets_mean": 4123.1, "valid_targets_min": 597 }, { "epoch": 0.7598784194528876, "grad_norm": 0.5137145588974806, "learning_rate": 3.999170554514082e-05, "loss": 0.2331, "loss_nan_ranks": 0, "loss_rank_avg": 0.23714055120944977, "step": 500, "valid_targets_mean": 4805.9, "valid_targets_min": 605 }, { "epoch": 0.7674772036474165, "grad_norm": 0.49268000212812557, "learning_rate": 3.998937939771771e-05, "loss": 0.2222, "loss_nan_ranks": 0, "loss_rank_avg": 0.24276787042617798, "step": 505, "valid_targets_mean": 4071.9, "valid_targets_min": 790 }, { "epoch": 0.7750759878419453, "grad_norm": 0.6202296018779553, "learning_rate": 3.998676617919322e-05, "loss": 0.2437, "loss_nan_ranks": 0, "loss_rank_avg": 0.27594321966171265, "step": 510, "valid_targets_mean": 3380.7, "valid_targets_min": 440 }, { "epoch": 0.7826747720364742, "grad_norm": 0.4863803507783552, "learning_rate": 3.9983865927096276e-05, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.24749267101287842, "step": 515, "valid_targets_mean": 5073.1, "valid_targets_min": 777 }, { "epoch": 0.790273556231003, "grad_norm": 0.5836827968647129, "learning_rate": 3.998067868307792e-05, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.23861373960971832, "step": 520, "valid_targets_mean": 5020.6, "valid_targets_min": 570 }, { "epoch": 0.7978723404255319, "grad_norm": 0.5231558404449659, "learning_rate": 3.9977204492910744e-05, "loss": 0.233, "loss_nan_ranks": 0, "loss_rank_avg": 0.22653838992118835, "step": 525, "valid_targets_mean": 4575.4, "valid_targets_min": 565 }, { "epoch": 0.8054711246200608, "grad_norm": 0.5430934870471972, "learning_rate": 3.997344340648822e-05, "loss": 0.2358, "loss_nan_ranks": 0, "loss_rank_avg": 0.22603115439414978, "step": 530, "valid_targets_mean": 4679.3, "valid_targets_min": 937 }, { "epoch": 0.8130699088145896, "grad_norm": 0.5286884499015065, "learning_rate": 3.996939547782399e-05, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.22073689103126526, "step": 535, "valid_targets_mean": 4476.1, "valid_targets_min": 718 }, { "epoch": 0.8206686930091185, "grad_norm": 0.5785998410503295, "learning_rate": 3.996506076505109e-05, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.2660371661186218, "step": 540, "valid_targets_mean": 4106.3, "valid_targets_min": 487 }, { "epoch": 0.8282674772036475, "grad_norm": 0.6951317726718936, "learning_rate": 3.996043933042112e-05, "loss": 0.2367, "loss_nan_ranks": 0, "loss_rank_avg": 0.24442562460899353, "step": 545, "valid_targets_mean": 4844.5, "valid_targets_min": 834 }, { "epoch": 0.8358662613981763, "grad_norm": 0.43506966442749545, "learning_rate": 3.995553124030334e-05, "loss": 0.2214, "loss_nan_ranks": 0, "loss_rank_avg": 0.20776590704917908, "step": 550, "valid_targets_mean": 4980.6, "valid_targets_min": 465 }, { "epoch": 0.8434650455927052, "grad_norm": 0.4706049122050459, "learning_rate": 3.9950336565183725e-05, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.27285271883010864, "step": 555, "valid_targets_mean": 5395.9, "valid_targets_min": 990 }, { "epoch": 0.851063829787234, "grad_norm": 0.49091088519408277, "learning_rate": 3.994485537966394e-05, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.2088671624660492, "step": 560, "valid_targets_mean": 4588.9, "valid_targets_min": 930 }, { "epoch": 0.8586626139817629, "grad_norm": 0.5986083125056836, "learning_rate": 3.993908776246029e-05, "loss": 0.2397, "loss_nan_ranks": 0, "loss_rank_avg": 0.24598953127861023, "step": 565, "valid_targets_mean": 3864.4, "valid_targets_min": 694 }, { "epoch": 0.8662613981762918, "grad_norm": 0.5161879038146385, "learning_rate": 3.993303379640256e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.24257272481918335, "step": 570, "valid_targets_mean": 3828.1, "valid_targets_min": 714 }, { "epoch": 0.8738601823708206, "grad_norm": 0.4991892963677317, "learning_rate": 3.992669356843287e-05, "loss": 0.218, "loss_nan_ranks": 0, "loss_rank_avg": 0.2508493661880493, "step": 575, "valid_targets_mean": 4322.0, "valid_targets_min": 1183 }, { "epoch": 0.8814589665653495, "grad_norm": 0.46377204664593574, "learning_rate": 3.992006716960437e-05, "loss": 0.2293, "loss_nan_ranks": 0, "loss_rank_avg": 0.2126588225364685, "step": 580, "valid_targets_mean": 4726.4, "valid_targets_min": 771 }, { "epoch": 0.8890577507598785, "grad_norm": 0.4484638597015378, "learning_rate": 3.9913154695079983e-05, "loss": 0.2479, "loss_nan_ranks": 0, "loss_rank_avg": 0.2277049422264099, "step": 585, "valid_targets_mean": 5441.6, "valid_targets_min": 672 }, { "epoch": 0.8966565349544073, "grad_norm": 0.473975742493428, "learning_rate": 3.9905956244131e-05, "loss": 0.2406, "loss_nan_ranks": 0, "loss_rank_avg": 0.2310577630996704, "step": 590, "valid_targets_mean": 4966.7, "valid_targets_min": 171 }, { "epoch": 0.9042553191489362, "grad_norm": 0.5269660383414424, "learning_rate": 3.989847192013569e-05, "loss": 0.2439, "loss_nan_ranks": 0, "loss_rank_avg": 0.20536382496356964, "step": 595, "valid_targets_mean": 4305.1, "valid_targets_min": 818 }, { "epoch": 0.9118541033434651, "grad_norm": 0.5290469023785411, "learning_rate": 3.9890701830577784e-05, "loss": 0.2519, "loss_nan_ranks": 0, "loss_rank_avg": 0.19890496134757996, "step": 600, "valid_targets_mean": 3980.8, "valid_targets_min": 911 }, { "epoch": 0.9194528875379939, "grad_norm": 0.44803784041894573, "learning_rate": 3.9882646087044944e-05, "loss": 0.2219, "loss_nan_ranks": 0, "loss_rank_avg": 0.2399585247039795, "step": 605, "valid_targets_mean": 5333.2, "valid_targets_min": 280 }, { "epoch": 0.9270516717325228, "grad_norm": 0.4328101297576573, "learning_rate": 3.987430480522717e-05, "loss": 0.2227, "loss_nan_ranks": 0, "loss_rank_avg": 0.21868915855884552, "step": 610, "valid_targets_mean": 5678.4, "valid_targets_min": 1871 }, { "epoch": 0.9346504559270516, "grad_norm": 0.49304307903824257, "learning_rate": 3.986567810491511e-05, "loss": 0.2557, "loss_nan_ranks": 0, "loss_rank_avg": 0.2420819252729416, "step": 615, "valid_targets_mean": 4536.2, "valid_targets_min": 809 }, { "epoch": 0.9422492401215805, "grad_norm": 0.5700813425381566, "learning_rate": 3.9856766109998376e-05, "loss": 0.2407, "loss_nan_ranks": 0, "loss_rank_avg": 0.21311193704605103, "step": 620, "valid_targets_mean": 4451.4, "valid_targets_min": 593 }, { "epoch": 0.9498480243161094, "grad_norm": 0.6294683305416847, "learning_rate": 3.9847568948463754e-05, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.20918530225753784, "step": 625, "valid_targets_mean": 4797.4, "valid_targets_min": 847 }, { "epoch": 0.9574468085106383, "grad_norm": 0.49380029688075006, "learning_rate": 3.983808675239333e-05, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.2152310311794281, "step": 630, "valid_targets_mean": 4176.9, "valid_targets_min": 692 }, { "epoch": 0.9650455927051672, "grad_norm": 0.5200102205973911, "learning_rate": 3.9828319657962655e-05, "loss": 0.2211, "loss_nan_ranks": 0, "loss_rank_avg": 0.2529393136501312, "step": 635, "valid_targets_mean": 4521.0, "valid_targets_min": 1069 }, { "epoch": 0.9726443768996961, "grad_norm": 0.5009014898507517, "learning_rate": 3.981826780543873e-05, "loss": 0.2398, "loss_nan_ranks": 0, "loss_rank_avg": 0.2124088704586029, "step": 640, "valid_targets_mean": 4639.8, "valid_targets_min": 268 }, { "epoch": 0.9802431610942249, "grad_norm": 0.47854286438275906, "learning_rate": 3.980793133917805e-05, "loss": 0.2284, "loss_nan_ranks": 0, "loss_rank_avg": 0.22133532166481018, "step": 645, "valid_targets_mean": 4939.1, "valid_targets_min": 1059 }, { "epoch": 0.9878419452887538, "grad_norm": 0.44229863697562477, "learning_rate": 3.979731040762446e-05, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.20959582924842834, "step": 650, "valid_targets_mean": 5179.6, "valid_targets_min": 805 }, { "epoch": 0.9954407294832827, "grad_norm": 0.4641726376092792, "learning_rate": 3.97864051633071e-05, "loss": 0.2249, "loss_nan_ranks": 0, "loss_rank_avg": 0.22157493233680725, "step": 655, "valid_targets_mean": 4819.9, "valid_targets_min": 646 }, { "epoch": 1.0030395136778116, "grad_norm": 0.7931644284514437, "learning_rate": 3.977521576283815e-05, "loss": 0.2343, "loss_nan_ranks": 0, "loss_rank_avg": 0.19440427422523499, "step": 660, "valid_targets_mean": 4668.7, "valid_targets_min": 915 }, { "epoch": 1.0106382978723405, "grad_norm": 0.48788029210277306, "learning_rate": 3.9763742366910626e-05, "loss": 0.206, "loss_nan_ranks": 0, "loss_rank_avg": 0.1956978291273117, "step": 665, "valid_targets_mean": 4805.8, "valid_targets_min": 694 }, { "epoch": 1.0182370820668694, "grad_norm": 0.5298990414713055, "learning_rate": 3.975198514029604e-05, "loss": 0.2228, "loss_nan_ranks": 0, "loss_rank_avg": 0.2972638010978699, "step": 670, "valid_targets_mean": 4853.2, "valid_targets_min": 512 }, { "epoch": 1.0258358662613982, "grad_norm": 0.5473369439399378, "learning_rate": 3.9739944251842054e-05, "loss": 0.2088, "loss_nan_ranks": 0, "loss_rank_avg": 0.21648220717906952, "step": 675, "valid_targets_mean": 5254.8, "valid_targets_min": 1077 }, { "epoch": 1.033434650455927, "grad_norm": 0.8965405989782883, "learning_rate": 3.9727619874470066e-05, "loss": 0.2229, "loss_nan_ranks": 0, "loss_rank_avg": 0.24239912629127502, "step": 680, "valid_targets_mean": 4575.9, "valid_targets_min": 847 }, { "epoch": 1.041033434650456, "grad_norm": 0.45053643384905995, "learning_rate": 3.971501218517267e-05, "loss": 0.2202, "loss_nan_ranks": 0, "loss_rank_avg": 0.20542305707931519, "step": 685, "valid_targets_mean": 4701.5, "valid_targets_min": 359 }, { "epoch": 1.0486322188449848, "grad_norm": 0.5355621304269382, "learning_rate": 3.9702121365011194e-05, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.24637873470783234, "step": 690, "valid_targets_mean": 4662.4, "valid_targets_min": 797 }, { "epoch": 1.0562310030395137, "grad_norm": 0.46031160112965963, "learning_rate": 3.968894759911304e-05, "loss": 0.2221, "loss_nan_ranks": 0, "loss_rank_avg": 0.22839926183223724, "step": 695, "valid_targets_mean": 5164.2, "valid_targets_min": 904 }, { "epoch": 1.0638297872340425, "grad_norm": 0.4910433091107382, "learning_rate": 3.9675491076669043e-05, "loss": 0.2247, "loss_nan_ranks": 0, "loss_rank_avg": 0.21850205957889557, "step": 700, "valid_targets_mean": 4950.7, "valid_targets_min": 478 }, { "epoch": 1.0714285714285714, "grad_norm": 0.5876241654950701, "learning_rate": 3.966175199093077e-05, "loss": 0.2152, "loss_nan_ranks": 0, "loss_rank_avg": 0.23394906520843506, "step": 705, "valid_targets_mean": 3169.8, "valid_targets_min": 809 }, { "epoch": 1.0790273556231003, "grad_norm": 0.46432326611030017, "learning_rate": 3.9647730539207715e-05, "loss": 0.2216, "loss_nan_ranks": 0, "loss_rank_avg": 0.2200213074684143, "step": 710, "valid_targets_mean": 5574.2, "valid_targets_min": 2786 }, { "epoch": 1.0866261398176291, "grad_norm": 0.4275229879620877, "learning_rate": 3.963342692286449e-05, "loss": 0.2161, "loss_nan_ranks": 0, "loss_rank_avg": 0.20706182718276978, "step": 715, "valid_targets_mean": 5002.6, "valid_targets_min": 1028 }, { "epoch": 1.094224924012158, "grad_norm": 0.5268786606408785, "learning_rate": 3.9618841347317925e-05, "loss": 0.2099, "loss_nan_ranks": 0, "loss_rank_avg": 0.20836099982261658, "step": 720, "valid_targets_mean": 3824.6, "valid_targets_min": 834 }, { "epoch": 1.1018237082066868, "grad_norm": 0.44352266391750467, "learning_rate": 3.9603974022034117e-05, "loss": 0.2158, "loss_nan_ranks": 0, "loss_rank_avg": 0.1991317719221115, "step": 725, "valid_targets_mean": 5762.8, "valid_targets_min": 2565 }, { "epoch": 1.1094224924012157, "grad_norm": 0.5059377730602702, "learning_rate": 3.9588825160525406e-05, "loss": 0.2101, "loss_nan_ranks": 0, "loss_rank_avg": 0.2332250475883484, "step": 730, "valid_targets_mean": 4394.6, "valid_targets_min": 778 }, { "epoch": 1.1170212765957448, "grad_norm": 0.5277265421398942, "learning_rate": 3.9573394980347354e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.23748330771923065, "step": 735, "valid_targets_mean": 4523.4, "valid_targets_min": 588 }, { "epoch": 1.1246200607902737, "grad_norm": 0.46757311577973365, "learning_rate": 3.9557683703095564e-05, "loss": 0.2074, "loss_nan_ranks": 0, "loss_rank_avg": 0.20653977990150452, "step": 740, "valid_targets_mean": 5119.2, "valid_targets_min": 446 }, { "epoch": 1.1322188449848025, "grad_norm": 0.4423041648030623, "learning_rate": 3.954169155440255e-05, "loss": 0.2234, "loss_nan_ranks": 0, "loss_rank_avg": 0.2072131335735321, "step": 745, "valid_targets_mean": 4472.0, "valid_targets_min": 271 }, { "epoch": 1.1398176291793314, "grad_norm": 0.4428410311750491, "learning_rate": 3.952541876393444e-05, "loss": 0.2206, "loss_nan_ranks": 0, "loss_rank_avg": 0.23159939050674438, "step": 750, "valid_targets_mean": 4634.8, "valid_targets_min": 810 }, { "epoch": 1.1474164133738602, "grad_norm": 0.5243183428010766, "learning_rate": 3.9508865565387745e-05, "loss": 0.2137, "loss_nan_ranks": 0, "loss_rank_avg": 0.22126150131225586, "step": 755, "valid_targets_mean": 4285.5, "valid_targets_min": 702 }, { "epoch": 1.155015197568389, "grad_norm": 0.45761304225615707, "learning_rate": 3.949203219648594e-05, "loss": 0.217, "loss_nan_ranks": 0, "loss_rank_avg": 0.20640668272972107, "step": 760, "valid_targets_mean": 4922.4, "valid_targets_min": 229 }, { "epoch": 1.162613981762918, "grad_norm": 0.4830790302776904, "learning_rate": 3.94749188989761e-05, "loss": 0.2241, "loss_nan_ranks": 0, "loss_rank_avg": 0.2300214022397995, "step": 765, "valid_targets_mean": 4988.9, "valid_targets_min": 2275 }, { "epoch": 1.1702127659574468, "grad_norm": 0.6344964312381591, "learning_rate": 3.945752591862538e-05, "loss": 0.2075, "loss_nan_ranks": 0, "loss_rank_avg": 0.22842663526535034, "step": 770, "valid_targets_mean": 3627.2, "valid_targets_min": 662 }, { "epoch": 1.1778115501519757, "grad_norm": 0.48098689360030655, "learning_rate": 3.943985350521753e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.2292681783437729, "step": 775, "valid_targets_mean": 4028.1, "valid_targets_min": 732 }, { "epoch": 1.1854103343465046, "grad_norm": 0.5336086809835088, "learning_rate": 3.942190191254928e-05, "loss": 0.2216, "loss_nan_ranks": 0, "loss_rank_avg": 0.22446206212043762, "step": 780, "valid_targets_mean": 4275.8, "valid_targets_min": 741 }, { "epoch": 1.1930091185410334, "grad_norm": 0.613832091134627, "learning_rate": 3.9403671398426705e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.2014659196138382, "step": 785, "valid_targets_mean": 5527.8, "valid_targets_min": 2519 }, { "epoch": 1.2006079027355623, "grad_norm": 0.7772463802272693, "learning_rate": 3.938516222466153e-05, "loss": 0.2149, "loss_nan_ranks": 0, "loss_rank_avg": 0.20852729678153992, "step": 790, "valid_targets_mean": 4968.9, "valid_targets_min": 605 }, { "epoch": 1.2082066869300911, "grad_norm": 0.5158401148303159, "learning_rate": 3.936637465706735e-05, "loss": 0.213, "loss_nan_ranks": 0, "loss_rank_avg": 0.25038856267929077, "step": 795, "valid_targets_mean": 4784.4, "valid_targets_min": 655 }, { "epoch": 1.21580547112462, "grad_norm": 1.031320737042501, "learning_rate": 3.934730896545583e-05, "loss": 0.2212, "loss_nan_ranks": 0, "loss_rank_avg": 0.21661558747291565, "step": 800, "valid_targets_mean": 3556.4, "valid_targets_min": 653 }, { "epoch": 1.2234042553191489, "grad_norm": 0.46779923698778514, "learning_rate": 3.932796542363283e-05, "loss": 0.2113, "loss_nan_ranks": 0, "loss_rank_avg": 0.19566161930561066, "step": 805, "valid_targets_mean": 4376.0, "valid_targets_min": 810 }, { "epoch": 1.2310030395136777, "grad_norm": 0.4326481517949445, "learning_rate": 3.930834430939444e-05, "loss": 0.2145, "loss_nan_ranks": 0, "loss_rank_avg": 0.19606706500053406, "step": 810, "valid_targets_mean": 5616.6, "valid_targets_min": 2732 }, { "epoch": 1.2386018237082066, "grad_norm": 0.47029688029877836, "learning_rate": 3.9288445904523063e-05, "loss": 0.219, "loss_nan_ranks": 0, "loss_rank_avg": 0.1963462084531784, "step": 815, "valid_targets_mean": 4256.6, "valid_targets_min": 1593 }, { "epoch": 1.2462006079027357, "grad_norm": 0.4914352971694942, "learning_rate": 3.926827049478329e-05, "loss": 0.2273, "loss_nan_ranks": 0, "loss_rank_avg": 0.2369862049818039, "step": 820, "valid_targets_mean": 5430.8, "valid_targets_min": 465 }, { "epoch": 1.2537993920972643, "grad_norm": 0.4983986981283837, "learning_rate": 3.924781836991783e-05, "loss": 0.2175, "loss_nan_ranks": 0, "loss_rank_avg": 0.2174890637397766, "step": 825, "valid_targets_mean": 4507.7, "valid_targets_min": 801 }, { "epoch": 1.2613981762917934, "grad_norm": 0.4385888971144186, "learning_rate": 3.922708982364337e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.21676486730575562, "step": 830, "valid_targets_mean": 5402.2, "valid_targets_min": 933 }, { "epoch": 1.2689969604863223, "grad_norm": 0.45249778212242275, "learning_rate": 3.920608515364631e-05, "loss": 0.2245, "loss_nan_ranks": 0, "loss_rank_avg": 0.20077060163021088, "step": 835, "valid_targets_mean": 4443.8, "valid_targets_min": 491 }, { "epoch": 1.2765957446808511, "grad_norm": 0.47777362802657686, "learning_rate": 3.9184804661578535e-05, "loss": 0.2268, "loss_nan_ranks": 0, "loss_rank_avg": 0.23784896731376648, "step": 840, "valid_targets_mean": 5061.4, "valid_targets_min": 846 }, { "epoch": 1.28419452887538, "grad_norm": 0.4135085697969651, "learning_rate": 3.9163248653053033e-05, "loss": 0.2066, "loss_nan_ranks": 0, "loss_rank_avg": 0.20635738968849182, "step": 845, "valid_targets_mean": 5489.4, "valid_targets_min": 1148 }, { "epoch": 1.2917933130699089, "grad_norm": 0.4117297091921728, "learning_rate": 3.9141417437639566e-05, "loss": 0.2018, "loss_nan_ranks": 0, "loss_rank_avg": 0.18252739310264587, "step": 850, "valid_targets_mean": 4780.3, "valid_targets_min": 799 }, { "epoch": 1.2993920972644377, "grad_norm": 0.48551756342329966, "learning_rate": 3.911931132886016e-05, "loss": 0.2228, "loss_nan_ranks": 0, "loss_rank_avg": 0.24173299968242645, "step": 855, "valid_targets_mean": 5113.2, "valid_targets_min": 756 }, { "epoch": 1.3069908814589666, "grad_norm": 0.4727140541170104, "learning_rate": 3.9096930644184674e-05, "loss": 0.1978, "loss_nan_ranks": 0, "loss_rank_avg": 0.1915874183177948, "step": 860, "valid_targets_mean": 4394.3, "valid_targets_min": 685 }, { "epoch": 1.3145896656534954, "grad_norm": 0.48025400940036744, "learning_rate": 3.907427570502616e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.2418954074382782, "step": 865, "valid_targets_mean": 3894.8, "valid_targets_min": 502 }, { "epoch": 1.3221884498480243, "grad_norm": 0.4849042187708983, "learning_rate": 3.90513468367363e-05, "loss": 0.2157, "loss_nan_ranks": 0, "loss_rank_avg": 0.2329632043838501, "step": 870, "valid_targets_mean": 4571.7, "valid_targets_min": 1992 }, { "epoch": 1.3297872340425532, "grad_norm": 0.5027508815921192, "learning_rate": 3.9028144368600746e-05, "loss": 0.2072, "loss_nan_ranks": 0, "loss_rank_avg": 0.19249165058135986, "step": 875, "valid_targets_mean": 4092.1, "valid_targets_min": 490 }, { "epoch": 1.337386018237082, "grad_norm": 0.43340094826535847, "learning_rate": 3.900466863383434e-05, "loss": 0.2074, "loss_nan_ranks": 0, "loss_rank_avg": 0.16721683740615845, "step": 880, "valid_targets_mean": 4360.1, "valid_targets_min": 678 }, { "epoch": 1.344984802431611, "grad_norm": 0.42492899268845147, "learning_rate": 3.898091996957638e-05, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.18311715126037598, "step": 885, "valid_targets_mean": 5269.4, "valid_targets_min": 2234 }, { "epoch": 1.3525835866261398, "grad_norm": 0.45185682893053764, "learning_rate": 3.895689871688571e-05, "loss": 0.2277, "loss_nan_ranks": 0, "loss_rank_avg": 0.2394876629114151, "step": 890, "valid_targets_mean": 5222.2, "valid_targets_min": 779 }, { "epoch": 1.3601823708206686, "grad_norm": 0.4595708686629068, "learning_rate": 3.893260522073591e-05, "loss": 0.2037, "loss_nan_ranks": 0, "loss_rank_avg": 0.19897980988025665, "step": 895, "valid_targets_mean": 4327.2, "valid_targets_min": 1913 }, { "epoch": 1.3677811550151975, "grad_norm": 0.5538183693714539, "learning_rate": 3.8908039830010296e-05, "loss": 0.2085, "loss_nan_ranks": 0, "loss_rank_avg": 0.21077513694763184, "step": 900, "valid_targets_mean": 4477.2, "valid_targets_min": 1914 }, { "epoch": 1.3753799392097266, "grad_norm": 0.4826233268835563, "learning_rate": 3.888320289749687e-05, "loss": 0.2167, "loss_nan_ranks": 0, "loss_rank_avg": 0.20590105652809143, "step": 905, "valid_targets_mean": 4855.0, "valid_targets_min": 987 }, { "epoch": 1.3829787234042552, "grad_norm": 0.45816874548401804, "learning_rate": 3.885809477988334e-05, "loss": 0.2051, "loss_nan_ranks": 0, "loss_rank_avg": 0.18594498932361603, "step": 910, "valid_targets_mean": 4613.8, "valid_targets_min": 486 }, { "epoch": 1.3905775075987843, "grad_norm": 0.46458650367475696, "learning_rate": 3.883271583775194e-05, "loss": 0.2166, "loss_nan_ranks": 0, "loss_rank_avg": 0.20757240056991577, "step": 915, "valid_targets_mean": 5135.2, "valid_targets_min": 567 }, { "epoch": 1.3981762917933132, "grad_norm": 0.49573212835944025, "learning_rate": 3.880706643557425e-05, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.20922252535820007, "step": 920, "valid_targets_mean": 4993.9, "valid_targets_min": 1608 }, { "epoch": 1.405775075987842, "grad_norm": 0.5065076653284654, "learning_rate": 3.8781146941705975e-05, "loss": 0.219, "loss_nan_ranks": 0, "loss_rank_avg": 0.22266633808612823, "step": 925, "valid_targets_mean": 3984.9, "valid_targets_min": 663 }, { "epoch": 1.4133738601823709, "grad_norm": 0.46389395621934165, "learning_rate": 3.8754957728381676e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.1952955424785614, "step": 930, "valid_targets_mean": 4305.5, "valid_targets_min": 659 }, { "epoch": 1.4209726443768997, "grad_norm": 0.4244364300260148, "learning_rate": 3.87284991717094e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.19909913837909698, "step": 935, "valid_targets_mean": 5106.8, "valid_targets_min": 692 }, { "epoch": 1.4285714285714286, "grad_norm": 0.48753574099908936, "learning_rate": 3.870177165166526e-05, "loss": 0.2278, "loss_nan_ranks": 0, "loss_rank_avg": 0.22329512238502502, "step": 940, "valid_targets_mean": 4227.9, "valid_targets_min": 960 }, { "epoch": 1.4361702127659575, "grad_norm": 0.46921808961532296, "learning_rate": 3.8674775552088034e-05, "loss": 0.21, "loss_nan_ranks": 0, "loss_rank_avg": 0.1966555416584015, "step": 945, "valid_targets_mean": 4668.8, "valid_targets_min": 1045 }, { "epoch": 1.4437689969604863, "grad_norm": 0.5011462054285303, "learning_rate": 3.864751126067359e-05, "loss": 0.2288, "loss_nan_ranks": 0, "loss_rank_avg": 0.3067967891693115, "step": 950, "valid_targets_mean": 5225.8, "valid_targets_min": 982 }, { "epoch": 1.4513677811550152, "grad_norm": 0.45640279658712546, "learning_rate": 3.861997916896937e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.20878750085830688, "step": 955, "valid_targets_mean": 4429.0, "valid_targets_min": 401 }, { "epoch": 1.458966565349544, "grad_norm": 0.4318101933694944, "learning_rate": 3.859217967236872e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.21009142696857452, "step": 960, "valid_targets_mean": 5187.9, "valid_targets_min": 1245 }, { "epoch": 1.466565349544073, "grad_norm": 0.4639537052196582, "learning_rate": 3.856411317010525e-05, "loss": 0.2253, "loss_nan_ranks": 0, "loss_rank_avg": 0.20182490348815918, "step": 965, "valid_targets_mean": 4228.9, "valid_targets_min": 1395 }, { "epoch": 1.4741641337386018, "grad_norm": 0.5830750830049942, "learning_rate": 3.853578006524711e-05, "loss": 0.2198, "loss_nan_ranks": 0, "loss_rank_avg": 0.25057747960090637, "step": 970, "valid_targets_mean": 3692.9, "valid_targets_min": 853 }, { "epoch": 1.4817629179331306, "grad_norm": 0.6135846306078634, "learning_rate": 3.8507180764691134e-05, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.26475679874420166, "step": 975, "valid_targets_mean": 5166.6, "valid_targets_min": 2214 }, { "epoch": 1.4893617021276595, "grad_norm": 0.42930269291397805, "learning_rate": 3.847831567915706e-05, "loss": 0.23, "loss_nan_ranks": 0, "loss_rank_avg": 0.22688277065753937, "step": 980, "valid_targets_mean": 5970.2, "valid_targets_min": 1687 }, { "epoch": 1.4969604863221884, "grad_norm": 0.44889401709296317, "learning_rate": 3.844918522318164e-05, "loss": 0.2144, "loss_nan_ranks": 0, "loss_rank_avg": 0.2054261565208435, "step": 985, "valid_targets_mean": 4887.9, "valid_targets_min": 1082 }, { "epoch": 1.5045592705167175, "grad_norm": 0.4849219730059719, "learning_rate": 3.84197898151126e-05, "loss": 0.22, "loss_nan_ranks": 0, "loss_rank_avg": 0.2193393111228943, "step": 990, "valid_targets_mean": 5518.3, "valid_targets_min": 348 }, { "epoch": 1.512158054711246, "grad_norm": 0.47364060795273005, "learning_rate": 3.839012987710275e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.2376159131526947, "step": 995, "valid_targets_mean": 4844.3, "valid_targets_min": 873 }, { "epoch": 1.5197568389057752, "grad_norm": 0.477005009585305, "learning_rate": 3.836020583510382e-05, "loss": 0.2223, "loss_nan_ranks": 0, "loss_rank_avg": 0.23394693434238434, "step": 1000, "valid_targets_mean": 4632.9, "valid_targets_min": 763 }, { "epoch": 1.5273556231003038, "grad_norm": 0.43901547735782315, "learning_rate": 3.833001811886041e-05, "loss": 0.2131, "loss_nan_ranks": 0, "loss_rank_avg": 0.2290436327457428, "step": 1005, "valid_targets_mean": 4733.1, "valid_targets_min": 729 }, { "epoch": 1.534954407294833, "grad_norm": 0.4128584010075957, "learning_rate": 3.8299567161903787e-05, "loss": 0.2134, "loss_nan_ranks": 0, "loss_rank_avg": 0.18785551190376282, "step": 1010, "valid_targets_mean": 5352.2, "valid_targets_min": 2335 }, { "epoch": 1.5425531914893615, "grad_norm": 0.5109402768329384, "learning_rate": 3.826885340154566e-05, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.25076034665107727, "step": 1015, "valid_targets_mean": 4775.5, "valid_targets_min": 891 }, { "epoch": 1.5501519756838906, "grad_norm": 0.4615963241009783, "learning_rate": 3.8237877278871916e-05, "loss": 0.2257, "loss_nan_ranks": 0, "loss_rank_avg": 0.22021520137786865, "step": 1020, "valid_targets_mean": 4804.6, "valid_targets_min": 1759 }, { "epoch": 1.5577507598784195, "grad_norm": 0.41168421067320043, "learning_rate": 3.820663923873626e-05, "loss": 0.2219, "loss_nan_ranks": 0, "loss_rank_avg": 0.22017160058021545, "step": 1025, "valid_targets_mean": 5034.6, "valid_targets_min": 689 }, { "epoch": 1.5653495440729484, "grad_norm": 0.5570301288304671, "learning_rate": 3.817513972975385e-05, "loss": 0.2154, "loss_nan_ranks": 0, "loss_rank_avg": 0.21190384030342102, "step": 1030, "valid_targets_mean": 3886.7, "valid_targets_min": 816 }, { "epoch": 1.5729483282674772, "grad_norm": 0.48710822220429656, "learning_rate": 3.814337920429485e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.21960590779781342, "step": 1035, "valid_targets_mean": 4042.9, "valid_targets_min": 546 }, { "epoch": 1.580547112462006, "grad_norm": 0.4956003916710543, "learning_rate": 3.811135811847792e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.2413313090801239, "step": 1040, "valid_targets_mean": 4299.2, "valid_targets_min": 605 }, { "epoch": 1.588145896656535, "grad_norm": 0.5142660653107718, "learning_rate": 3.807907693216368e-05, "loss": 0.2109, "loss_nan_ranks": 0, "loss_rank_avg": 0.23288393020629883, "step": 1045, "valid_targets_mean": 4768.5, "valid_targets_min": 811 }, { "epoch": 1.5957446808510638, "grad_norm": 0.5129928776520155, "learning_rate": 3.804653610894811e-05, "loss": 0.2157, "loss_nan_ranks": 0, "loss_rank_avg": 0.20630177855491638, "step": 1050, "valid_targets_mean": 3965.7, "valid_targets_min": 1768 }, { "epoch": 1.6033434650455927, "grad_norm": 0.4428766734377924, "learning_rate": 3.801373611615585e-05, "loss": 0.218, "loss_nan_ranks": 0, "loss_rank_avg": 0.2139415144920349, "step": 1055, "valid_targets_mean": 4501.2, "valid_targets_min": 528 }, { "epoch": 1.6109422492401215, "grad_norm": 0.3976871596351703, "learning_rate": 3.798067742483355e-05, "loss": 0.2055, "loss_nan_ranks": 0, "loss_rank_avg": 0.1983199268579483, "step": 1060, "valid_targets_mean": 4932.3, "valid_targets_min": 593 }, { "epoch": 1.6185410334346506, "grad_norm": 0.43538181451443764, "learning_rate": 3.794736050974308e-05, "loss": 0.2291, "loss_nan_ranks": 0, "loss_rank_avg": 0.21794393658638, "step": 1065, "valid_targets_mean": 5077.6, "valid_targets_min": 828 }, { "epoch": 1.6261398176291793, "grad_norm": 0.41261656921486206, "learning_rate": 3.7913785849354693e-05, "loss": 0.2125, "loss_nan_ranks": 0, "loss_rank_avg": 0.18821759521961212, "step": 1070, "valid_targets_mean": 4659.0, "valid_targets_min": 776 }, { "epoch": 1.6337386018237083, "grad_norm": 0.4607656496157841, "learning_rate": 3.787995392584017e-05, "loss": 0.2155, "loss_nan_ranks": 0, "loss_rank_avg": 0.23070788383483887, "step": 1075, "valid_targets_mean": 5037.2, "valid_targets_min": 767 }, { "epoch": 1.641337386018237, "grad_norm": 0.521744416704874, "learning_rate": 3.784586522506589e-05, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.23326215147972107, "step": 1080, "valid_targets_mean": 4300.6, "valid_targets_min": 752 }, { "epoch": 1.648936170212766, "grad_norm": 0.5411151907665869, "learning_rate": 3.781152023658588e-05, "loss": 0.2076, "loss_nan_ranks": 0, "loss_rank_avg": 0.19801482558250427, "step": 1085, "valid_targets_mean": 4037.4, "valid_targets_min": 565 }, { "epoch": 1.6565349544072947, "grad_norm": 0.4881180236795167, "learning_rate": 3.7776919453634735e-05, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.20285995304584503, "step": 1090, "valid_targets_mean": 4716.8, "valid_targets_min": 1812 }, { "epoch": 1.6641337386018238, "grad_norm": 0.3892565204932596, "learning_rate": 3.774206337312058e-05, "loss": 0.2146, "loss_nan_ranks": 0, "loss_rank_avg": 0.19384154677391052, "step": 1095, "valid_targets_mean": 5548.1, "valid_targets_min": 1723 }, { "epoch": 1.6717325227963524, "grad_norm": 0.6079201585046432, "learning_rate": 3.7706952495617895e-05, "loss": 0.2228, "loss_nan_ranks": 0, "loss_rank_avg": 0.2272331863641739, "step": 1100, "valid_targets_mean": 4440.2, "valid_targets_min": 754 }, { "epoch": 1.6793313069908815, "grad_norm": 0.4392880697961998, "learning_rate": 3.767158732536037e-05, "loss": 0.2057, "loss_nan_ranks": 0, "loss_rank_avg": 0.20622758567333221, "step": 1105, "valid_targets_mean": 5115.8, "valid_targets_min": 2178 }, { "epoch": 1.6869300911854104, "grad_norm": 0.4760913157214835, "learning_rate": 3.7635968370233625e-05, "loss": 0.1947, "loss_nan_ranks": 0, "loss_rank_avg": 0.22895006835460663, "step": 1110, "valid_targets_mean": 4197.4, "valid_targets_min": 664 }, { "epoch": 1.6945288753799392, "grad_norm": 0.42921725245111436, "learning_rate": 3.760009614176792e-05, "loss": 0.2092, "loss_nan_ranks": 0, "loss_rank_avg": 0.20630860328674316, "step": 1115, "valid_targets_mean": 5539.1, "valid_targets_min": 1629 }, { "epoch": 1.702127659574468, "grad_norm": 0.47421657315391796, "learning_rate": 3.7563971155130834e-05, "loss": 0.2088, "loss_nan_ranks": 0, "loss_rank_avg": 0.19295352697372437, "step": 1120, "valid_targets_mean": 4742.3, "valid_targets_min": 900 }, { "epoch": 1.709726443768997, "grad_norm": 0.44277966038489874, "learning_rate": 3.752759392911986e-05, "loss": 0.2121, "loss_nan_ranks": 0, "loss_rank_avg": 0.21693378686904907, "step": 1125, "valid_targets_mean": 5488.9, "valid_targets_min": 2673 }, { "epoch": 1.7173252279635258, "grad_norm": 0.35764926472016434, "learning_rate": 3.7490964986154936e-05, "loss": 0.2056, "loss_nan_ranks": 0, "loss_rank_avg": 0.1632017195224762, "step": 1130, "valid_targets_mean": 5798.2, "valid_targets_min": 2382 }, { "epoch": 1.7249240121580547, "grad_norm": 0.46310293456133733, "learning_rate": 3.745408485227094e-05, "loss": 0.2166, "loss_nan_ranks": 0, "loss_rank_avg": 0.2125653326511383, "step": 1135, "valid_targets_mean": 4493.4, "valid_targets_min": 703 }, { "epoch": 1.7325227963525835, "grad_norm": 0.48402636671915206, "learning_rate": 3.7416954057110165e-05, "loss": 0.2155, "loss_nan_ranks": 0, "loss_rank_avg": 0.2212226539850235, "step": 1140, "valid_targets_mean": 4891.2, "valid_targets_min": 422 }, { "epoch": 1.7401215805471124, "grad_norm": 0.48544415851378125, "learning_rate": 3.7379573133914686e-05, "loss": 0.2204, "loss_nan_ranks": 0, "loss_rank_avg": 0.24577516317367554, "step": 1145, "valid_targets_mean": 4704.4, "valid_targets_min": 683 }, { "epoch": 1.7477203647416415, "grad_norm": 0.4686217061157862, "learning_rate": 3.7341942619518736e-05, "loss": 0.2134, "loss_nan_ranks": 0, "loss_rank_avg": 0.20010778307914734, "step": 1150, "valid_targets_mean": 4060.2, "valid_targets_min": 740 }, { "epoch": 1.7553191489361701, "grad_norm": 0.456474362675113, "learning_rate": 3.730406305434093e-05, "loss": 0.2183, "loss_nan_ranks": 0, "loss_rank_avg": 0.21529576182365417, "step": 1155, "valid_targets_mean": 4461.8, "valid_targets_min": 407 }, { "epoch": 1.7629179331306992, "grad_norm": 0.39386216864446827, "learning_rate": 3.726593498237659e-05, "loss": 0.2173, "loss_nan_ranks": 0, "loss_rank_avg": 0.20742088556289673, "step": 1160, "valid_targets_mean": 5696.4, "valid_targets_min": 832 }, { "epoch": 1.7705167173252279, "grad_norm": 0.4954398039746765, "learning_rate": 3.7227558951189866e-05, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.2127082198858261, "step": 1165, "valid_targets_mean": 4003.1, "valid_targets_min": 1097 }, { "epoch": 1.778115501519757, "grad_norm": 0.47012021916770536, "learning_rate": 3.7188935511905895e-05, "loss": 0.2208, "loss_nan_ranks": 0, "loss_rank_avg": 0.2261389195919037, "step": 1170, "valid_targets_mean": 5014.4, "valid_targets_min": 1036 }, { "epoch": 1.7857142857142856, "grad_norm": 0.4746767287862107, "learning_rate": 3.715006521920289e-05, "loss": 0.2202, "loss_nan_ranks": 0, "loss_rank_avg": 0.19433888792991638, "step": 1175, "valid_targets_mean": 4523.8, "valid_targets_min": 625 }, { "epoch": 1.7933130699088147, "grad_norm": 0.4791758218613005, "learning_rate": 3.711094863130417e-05, "loss": 0.2161, "loss_nan_ranks": 0, "loss_rank_avg": 0.22052708268165588, "step": 1180, "valid_targets_mean": 5126.8, "valid_targets_min": 1164 }, { "epoch": 1.8009118541033433, "grad_norm": 0.43857817303439106, "learning_rate": 3.707158630997015e-05, "loss": 0.2186, "loss_nan_ranks": 0, "loss_rank_avg": 0.21629557013511658, "step": 1185, "valid_targets_mean": 5371.6, "valid_targets_min": 728 }, { "epoch": 1.8085106382978724, "grad_norm": 0.5348041335538533, "learning_rate": 3.703197882049026e-05, "loss": 0.21, "loss_nan_ranks": 0, "loss_rank_avg": 0.2324264943599701, "step": 1190, "valid_targets_mean": 3775.2, "valid_targets_min": 637 }, { "epoch": 1.8161094224924013, "grad_norm": 0.3889586019552747, "learning_rate": 3.699212673167484e-05, "loss": 0.2116, "loss_nan_ranks": 0, "loss_rank_avg": 0.2274361550807953, "step": 1195, "valid_targets_mean": 6306.4, "valid_targets_min": 622 }, { "epoch": 1.8237082066869301, "grad_norm": 0.46857624747519244, "learning_rate": 3.695203061584695e-05, "loss": 0.2068, "loss_nan_ranks": 0, "loss_rank_avg": 0.23175036907196045, "step": 1200, "valid_targets_mean": 4628.2, "valid_targets_min": 429 }, { "epoch": 1.831306990881459, "grad_norm": 0.4885718145421046, "learning_rate": 3.69116910488342e-05, "loss": 0.2214, "loss_nan_ranks": 0, "loss_rank_avg": 0.22779184579849243, "step": 1205, "valid_targets_mean": 4191.6, "valid_targets_min": 156 }, { "epoch": 1.8389057750759878, "grad_norm": 0.4639904198544056, "learning_rate": 3.687110860996041e-05, "loss": 0.2239, "loss_nan_ranks": 0, "loss_rank_avg": 0.2027101218700409, "step": 1210, "valid_targets_mean": 4831.6, "valid_targets_min": 699 }, { "epoch": 1.8465045592705167, "grad_norm": 0.46833719588845396, "learning_rate": 3.6830283882037335e-05, "loss": 0.2165, "loss_nan_ranks": 0, "loss_rank_avg": 0.20325730741024017, "step": 1215, "valid_targets_mean": 5097.8, "valid_targets_min": 465 }, { "epoch": 1.8541033434650456, "grad_norm": 0.41463391792421084, "learning_rate": 3.678921745135631e-05, "loss": 0.2038, "loss_nan_ranks": 0, "loss_rank_avg": 0.20085079967975616, "step": 1220, "valid_targets_mean": 5023.6, "valid_targets_min": 633 }, { "epoch": 1.8617021276595744, "grad_norm": 0.44749514129370893, "learning_rate": 3.674790990767979e-05, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.20688676834106445, "step": 1225, "valid_targets_mean": 4845.9, "valid_targets_min": 667 }, { "epoch": 1.8693009118541033, "grad_norm": 0.4502221753599573, "learning_rate": 3.670636184423288e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.19071269035339355, "step": 1230, "valid_targets_mean": 4245.0, "valid_targets_min": 500 }, { "epoch": 1.8768996960486324, "grad_norm": 0.5334681412726286, "learning_rate": 3.666457385769487e-05, "loss": 0.2042, "loss_nan_ranks": 0, "loss_rank_avg": 0.2248763144016266, "step": 1235, "valid_targets_mean": 4481.5, "valid_targets_min": 770 }, { "epoch": 1.884498480243161, "grad_norm": 0.4644916347166466, "learning_rate": 3.66225465481906e-05, "loss": 0.2091, "loss_nan_ranks": 0, "loss_rank_avg": 0.2305462807416916, "step": 1240, "valid_targets_mean": 4303.9, "valid_targets_min": 630 }, { "epoch": 1.89209726443769, "grad_norm": 0.4267832479199372, "learning_rate": 3.658028051928189e-05, "loss": 0.2092, "loss_nan_ranks": 0, "loss_rank_avg": 0.18598158657550812, "step": 1245, "valid_targets_mean": 4759.4, "valid_targets_min": 965 }, { "epoch": 1.8996960486322187, "grad_norm": 0.46975601834979414, "learning_rate": 3.6537776377958836e-05, "loss": 0.2302, "loss_nan_ranks": 0, "loss_rank_avg": 0.2438843995332718, "step": 1250, "valid_targets_mean": 4358.6, "valid_targets_min": 545 }, { "epoch": 1.9072948328267478, "grad_norm": 0.41467959071923455, "learning_rate": 3.649503473463112e-05, "loss": 0.1974, "loss_nan_ranks": 0, "loss_rank_avg": 0.18656185269355774, "step": 1255, "valid_targets_mean": 4789.7, "valid_targets_min": 622 }, { "epoch": 1.9148936170212765, "grad_norm": 0.48720410950048604, "learning_rate": 3.645205620311923e-05, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.2179066389799118, "step": 1260, "valid_targets_mean": 4316.3, "valid_targets_min": 718 }, { "epoch": 1.9224924012158056, "grad_norm": 0.47737074347118913, "learning_rate": 3.6408841400645644e-05, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.20159170031547546, "step": 1265, "valid_targets_mean": 4676.4, "valid_targets_min": 920 }, { "epoch": 1.9300911854103342, "grad_norm": 0.38561599683027503, "learning_rate": 3.636539094782598e-05, "loss": 0.2151, "loss_nan_ranks": 0, "loss_rank_avg": 0.18330830335617065, "step": 1270, "valid_targets_mean": 4813.8, "valid_targets_min": 811 }, { "epoch": 1.9376899696048633, "grad_norm": 0.4850605122437156, "learning_rate": 3.632170546866007e-05, "loss": 0.2168, "loss_nan_ranks": 0, "loss_rank_avg": 0.22532254457473755, "step": 1275, "valid_targets_mean": 3973.6, "valid_targets_min": 335 }, { "epoch": 1.9452887537993921, "grad_norm": 0.43992666790664475, "learning_rate": 3.6277785590523e-05, "loss": 0.2201, "loss_nan_ranks": 0, "loss_rank_avg": 0.24039697647094727, "step": 1280, "valid_targets_mean": 5707.9, "valid_targets_min": 511 }, { "epoch": 1.952887537993921, "grad_norm": 3.9664174496666083, "learning_rate": 3.623363194415609e-05, "loss": 0.214, "loss_nan_ranks": 0, "loss_rank_avg": 0.21847763657569885, "step": 1285, "valid_targets_mean": 4531.5, "valid_targets_min": 991 }, { "epoch": 1.9604863221884499, "grad_norm": 0.4595577415716105, "learning_rate": 3.618924516365788e-05, "loss": 0.2042, "loss_nan_ranks": 0, "loss_rank_avg": 0.20071235299110413, "step": 1290, "valid_targets_mean": 4902.6, "valid_targets_min": 777 }, { "epoch": 1.9680851063829787, "grad_norm": 0.44567806699122325, "learning_rate": 3.614462588647495e-05, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.24957430362701416, "step": 1295, "valid_targets_mean": 4669.9, "valid_targets_min": 1479 }, { "epoch": 1.9756838905775076, "grad_norm": 0.42210130028239157, "learning_rate": 3.609977475339284e-05, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.2057563215494156, "step": 1300, "valid_targets_mean": 5229.6, "valid_targets_min": 969 }, { "epoch": 1.9832826747720365, "grad_norm": 0.48785866462041777, "learning_rate": 3.6054692408526806e-05, "loss": 0.1967, "loss_nan_ranks": 0, "loss_rank_avg": 0.2031518667936325, "step": 1305, "valid_targets_mean": 3585.4, "valid_targets_min": 843 }, { "epoch": 1.9908814589665653, "grad_norm": 0.4191280920943274, "learning_rate": 3.6009379499312563e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.21392418444156647, "step": 1310, "valid_targets_mean": 5448.1, "valid_targets_min": 2162 }, { "epoch": 1.9984802431610942, "grad_norm": 0.571865229628622, "learning_rate": 3.5963836676497034e-05, "loss": 0.2043, "loss_nan_ranks": 0, "loss_rank_avg": 0.21553698182106018, "step": 1315, "valid_targets_mean": 3434.1, "valid_targets_min": 460 }, { "epoch": 2.0060790273556233, "grad_norm": 0.4580819817800281, "learning_rate": 3.5918064594128946e-05, "loss": 0.1941, "loss_nan_ranks": 0, "loss_rank_avg": 0.18602877855300903, "step": 1320, "valid_targets_mean": 4337.8, "valid_targets_min": 527 }, { "epoch": 2.013677811550152, "grad_norm": 0.4308848554547568, "learning_rate": 3.5872063909549465e-05, "loss": 0.2003, "loss_nan_ranks": 0, "loss_rank_avg": 0.1809544563293457, "step": 1325, "valid_targets_mean": 4842.1, "valid_targets_min": 305 }, { "epoch": 2.021276595744681, "grad_norm": 0.4304570423447681, "learning_rate": 3.5825835283382754e-05, "loss": 0.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.17694029211997986, "step": 1330, "valid_targets_mean": 5139.7, "valid_targets_min": 1709 }, { "epoch": 2.0288753799392096, "grad_norm": 0.4201481077802898, "learning_rate": 3.5779379379526516e-05, "loss": 0.1944, "loss_nan_ranks": 0, "loss_rank_avg": 0.17606091499328613, "step": 1335, "valid_targets_mean": 5894.2, "valid_targets_min": 348 }, { "epoch": 2.0364741641337387, "grad_norm": 0.43796821938518954, "learning_rate": 3.57326968651424e-05, "loss": 0.1873, "loss_nan_ranks": 0, "loss_rank_avg": 0.19579800963401794, "step": 1340, "valid_targets_mean": 4780.1, "valid_targets_min": 1077 }, { "epoch": 2.0440729483282674, "grad_norm": 0.431578307043594, "learning_rate": 3.5685788410646455e-05, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.17831829190254211, "step": 1345, "valid_targets_mean": 4907.6, "valid_targets_min": 590 }, { "epoch": 2.0516717325227964, "grad_norm": 0.4188648321222995, "learning_rate": 3.5638654689699493e-05, "loss": 0.1895, "loss_nan_ranks": 0, "loss_rank_avg": 0.15893448889255524, "step": 1350, "valid_targets_mean": 5083.1, "valid_targets_min": 1164 }, { "epoch": 2.059270516717325, "grad_norm": 0.4452501919855169, "learning_rate": 3.559129637919744e-05, "loss": 0.194, "loss_nan_ranks": 0, "loss_rank_avg": 0.19416233897209167, "step": 1355, "valid_targets_mean": 4871.6, "valid_targets_min": 1124 }, { "epoch": 2.066869300911854, "grad_norm": 0.5486933381235863, "learning_rate": 3.5543714159261576e-05, "loss": 0.1991, "loss_nan_ranks": 0, "loss_rank_avg": 0.21765755116939545, "step": 1360, "valid_targets_mean": 4549.6, "valid_targets_min": 756 }, { "epoch": 2.074468085106383, "grad_norm": 0.46291383560602983, "learning_rate": 3.5495908713228774e-05, "loss": 0.1955, "loss_nan_ranks": 0, "loss_rank_avg": 0.22245173156261444, "step": 1365, "valid_targets_mean": 4870.3, "valid_targets_min": 829 }, { "epoch": 2.082066869300912, "grad_norm": 0.43346588262932606, "learning_rate": 3.544788072764173e-05, "loss": 0.1822, "loss_nan_ranks": 0, "loss_rank_avg": 0.16855968534946442, "step": 1370, "valid_targets_mean": 5086.5, "valid_targets_min": 1568 }, { "epoch": 2.0896656534954405, "grad_norm": 0.46753186284834775, "learning_rate": 3.5399630892239036e-05, "loss": 0.1951, "loss_nan_ranks": 0, "loss_rank_avg": 0.17375516891479492, "step": 1375, "valid_targets_mean": 4855.5, "valid_targets_min": 1441 }, { "epoch": 2.0972644376899696, "grad_norm": 0.5417497219166529, "learning_rate": 3.535115989994533e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.22097179293632507, "step": 1380, "valid_targets_mean": 4113.6, "valid_targets_min": 608 }, { "epoch": 2.1048632218844983, "grad_norm": 0.5031450181476247, "learning_rate": 3.530246844686133e-05, "loss": 0.1948, "loss_nan_ranks": 0, "loss_rank_avg": 0.20294921100139618, "step": 1385, "valid_targets_mean": 4546.1, "valid_targets_min": 610 }, { "epoch": 2.1124620060790273, "grad_norm": 0.4352408641314383, "learning_rate": 3.5253557232253805e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.18328158557415009, "step": 1390, "valid_targets_mean": 4523.4, "valid_targets_min": 317 }, { "epoch": 2.1200607902735564, "grad_norm": 0.4965079663934899, "learning_rate": 3.520442695854558e-05, "loss": 0.1903, "loss_nan_ranks": 0, "loss_rank_avg": 0.19759127497673035, "step": 1395, "valid_targets_mean": 4122.6, "valid_targets_min": 651 }, { "epoch": 2.127659574468085, "grad_norm": 0.4372048480171316, "learning_rate": 3.515507833130543e-05, "loss": 0.2099, "loss_nan_ranks": 0, "loss_rank_avg": 0.260989785194397, "step": 1400, "valid_targets_mean": 5767.1, "valid_targets_min": 647 }, { "epoch": 2.135258358662614, "grad_norm": 0.4432824108788825, "learning_rate": 3.510551205923793e-05, "loss": 0.2024, "loss_nan_ranks": 0, "loss_rank_avg": 0.1798432469367981, "step": 1405, "valid_targets_mean": 4649.9, "valid_targets_min": 887 }, { "epoch": 2.142857142857143, "grad_norm": 0.47056895174749847, "learning_rate": 3.50557288541733e-05, "loss": 0.2022, "loss_nan_ranks": 0, "loss_rank_avg": 0.28239643573760986, "step": 1410, "valid_targets_mean": 5144.9, "valid_targets_min": 668 }, { "epoch": 2.150455927051672, "grad_norm": 0.48033852287738354, "learning_rate": 3.5005729431057176e-05, "loss": 0.1882, "loss_nan_ranks": 0, "loss_rank_avg": 0.18898963928222656, "step": 1415, "valid_targets_mean": 4188.7, "valid_targets_min": 642 }, { "epoch": 2.1580547112462005, "grad_norm": 0.44907430023415723, "learning_rate": 3.4955514507940335e-05, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.21947622299194336, "step": 1420, "valid_targets_mean": 4689.1, "valid_targets_min": 811 }, { "epoch": 2.1656534954407296, "grad_norm": 0.48987352731998796, "learning_rate": 3.490508480596839e-05, "loss": 0.2001, "loss_nan_ranks": 0, "loss_rank_avg": 0.23712974786758423, "step": 1425, "valid_targets_mean": 4526.9, "valid_targets_min": 1906 }, { "epoch": 2.1732522796352582, "grad_norm": 0.4635255839622089, "learning_rate": 3.485444104937144e-05, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.19113010168075562, "step": 1430, "valid_targets_mean": 5611.0, "valid_targets_min": 506 }, { "epoch": 2.1808510638297873, "grad_norm": 0.5259676202088338, "learning_rate": 3.4803583965453635e-05, "loss": 0.1946, "loss_nan_ranks": 0, "loss_rank_avg": 0.1842001974582672, "step": 1435, "valid_targets_mean": 5102.6, "valid_targets_min": 2495 }, { "epoch": 2.188449848024316, "grad_norm": 0.44606267698952673, "learning_rate": 3.475251428458281e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.16230902075767517, "step": 1440, "valid_targets_mean": 4659.9, "valid_targets_min": 559 }, { "epoch": 2.196048632218845, "grad_norm": 0.4688428145128331, "learning_rate": 3.4701232740179876e-05, "loss": 0.19, "loss_nan_ranks": 0, "loss_rank_avg": 0.20408767461776733, "step": 1445, "valid_targets_mean": 4121.8, "valid_targets_min": 589 }, { "epoch": 2.2036474164133737, "grad_norm": 0.5991278401653526, "learning_rate": 3.464974006870841e-05, "loss": 0.1828, "loss_nan_ranks": 0, "loss_rank_avg": 0.1730174869298935, "step": 1450, "valid_targets_mean": 4380.2, "valid_targets_min": 872 }, { "epoch": 2.211246200607903, "grad_norm": 0.5317059372292597, "learning_rate": 3.4598037009664e-05, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.21209636330604553, "step": 1455, "valid_targets_mean": 4217.3, "valid_targets_min": 576 }, { "epoch": 2.2188449848024314, "grad_norm": 0.430168348759962, "learning_rate": 3.454612430556365e-05, "loss": 0.1926, "loss_nan_ranks": 0, "loss_rank_avg": 0.1825931817293167, "step": 1460, "valid_targets_mean": 5261.9, "valid_targets_min": 605 }, { "epoch": 2.2264437689969605, "grad_norm": 0.3749747542503873, "learning_rate": 3.44940027019351e-05, "loss": 0.1878, "loss_nan_ranks": 0, "loss_rank_avg": 0.17250074446201324, "step": 1465, "valid_targets_mean": 5484.4, "valid_targets_min": 702 }, { "epoch": 2.2340425531914896, "grad_norm": 0.4590123136778495, "learning_rate": 3.444167294730617e-05, "loss": 0.205, "loss_nan_ranks": 0, "loss_rank_avg": 0.21813246607780457, "step": 1470, "valid_targets_mean": 5121.4, "valid_targets_min": 306 }, { "epoch": 2.2416413373860182, "grad_norm": 0.49931169623759, "learning_rate": 3.4389135793193935e-05, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.218278706073761, "step": 1475, "valid_targets_mean": 3389.2, "valid_targets_min": 545 }, { "epoch": 2.2492401215805473, "grad_norm": 0.44543315364919134, "learning_rate": 3.4336391994094e-05, "loss": 0.1931, "loss_nan_ranks": 0, "loss_rank_avg": 0.18760555982589722, "step": 1480, "valid_targets_mean": 4307.0, "valid_targets_min": 666 }, { "epoch": 2.256838905775076, "grad_norm": 0.4886663621134491, "learning_rate": 3.4283442307469625e-05, "loss": 0.1915, "loss_nan_ranks": 0, "loss_rank_avg": 0.2062349021434784, "step": 1485, "valid_targets_mean": 4356.3, "valid_targets_min": 766 }, { "epoch": 2.264437689969605, "grad_norm": 0.4376731027831436, "learning_rate": 3.423028749374086e-05, "loss": 0.1772, "loss_nan_ranks": 0, "loss_rank_avg": 0.1697554588317871, "step": 1490, "valid_targets_mean": 4621.5, "valid_targets_min": 626 }, { "epoch": 2.2720364741641337, "grad_norm": 0.44145953072536115, "learning_rate": 3.417692831627361e-05, "loss": 0.1953, "loss_nan_ranks": 0, "loss_rank_avg": 0.17671933770179749, "step": 1495, "valid_targets_mean": 4243.6, "valid_targets_min": 490 }, { "epoch": 2.2796352583586628, "grad_norm": 0.46231753746429277, "learning_rate": 3.412336554136871e-05, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.217167928814888, "step": 1500, "valid_targets_mean": 4889.9, "valid_targets_min": 940 }, { "epoch": 2.2872340425531914, "grad_norm": 0.41849411158618643, "learning_rate": 3.406959993825088e-05, "loss": 0.1879, "loss_nan_ranks": 0, "loss_rank_avg": 0.1857946813106537, "step": 1505, "valid_targets_mean": 4538.6, "valid_targets_min": 1136 }, { "epoch": 2.2948328267477205, "grad_norm": 0.42440454933579597, "learning_rate": 3.4015632279057675e-05, "loss": 0.1913, "loss_nan_ranks": 0, "loss_rank_avg": 0.19058769941329956, "step": 1510, "valid_targets_mean": 5174.3, "valid_targets_min": 2350 }, { "epoch": 2.302431610942249, "grad_norm": 0.4531043322688376, "learning_rate": 3.396146333882846e-05, "loss": 0.2017, "loss_nan_ranks": 0, "loss_rank_avg": 0.207040473818779, "step": 1515, "valid_targets_mean": 5085.9, "valid_targets_min": 1122 }, { "epoch": 2.310030395136778, "grad_norm": 0.43663796857915893, "learning_rate": 3.3907093895493186e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.19464045763015747, "step": 1520, "valid_targets_mean": 4950.9, "valid_targets_min": 709 }, { "epoch": 2.317629179331307, "grad_norm": 0.42579767171142163, "learning_rate": 3.385252472986129e-05, "loss": 0.1882, "loss_nan_ranks": 0, "loss_rank_avg": 0.17376163601875305, "step": 1525, "valid_targets_mean": 5796.6, "valid_targets_min": 829 }, { "epoch": 2.325227963525836, "grad_norm": 0.4254323477143335, "learning_rate": 3.379775662561045e-05, "loss": 0.2029, "loss_nan_ranks": 0, "loss_rank_avg": 0.20658773183822632, "step": 1530, "valid_targets_mean": 4603.7, "valid_targets_min": 937 }, { "epoch": 2.3328267477203646, "grad_norm": 0.40841513731217177, "learning_rate": 3.374279036927535e-05, "loss": 0.1922, "loss_nan_ranks": 0, "loss_rank_avg": 0.18336258828639984, "step": 1535, "valid_targets_mean": 4597.2, "valid_targets_min": 376 }, { "epoch": 2.3404255319148937, "grad_norm": 0.40660499202393396, "learning_rate": 3.368762675023635e-05, "loss": 0.1931, "loss_nan_ranks": 0, "loss_rank_avg": 0.17899194359779358, "step": 1540, "valid_targets_mean": 5368.1, "valid_targets_min": 748 }, { "epoch": 2.3480243161094223, "grad_norm": 0.4869497094603196, "learning_rate": 3.363226656070819e-05, "loss": 0.1872, "loss_nan_ranks": 0, "loss_rank_avg": 0.20963457226753235, "step": 1545, "valid_targets_mean": 4233.9, "valid_targets_min": 799 }, { "epoch": 2.3556231003039514, "grad_norm": 0.42891641992075347, "learning_rate": 3.3576710595728586e-05, "loss": 0.2024, "loss_nan_ranks": 0, "loss_rank_avg": 0.18602633476257324, "step": 1550, "valid_targets_mean": 4363.8, "valid_targets_min": 156 }, { "epoch": 2.36322188449848, "grad_norm": 0.4784395146562949, "learning_rate": 3.352095965314682e-05, "loss": 0.1974, "loss_nan_ranks": 0, "loss_rank_avg": 0.20554772019386292, "step": 1555, "valid_targets_mean": 4412.3, "valid_targets_min": 732 }, { "epoch": 2.370820668693009, "grad_norm": 0.3940116430034305, "learning_rate": 3.3465014533612295e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.16700813174247742, "step": 1560, "valid_targets_mean": 4859.4, "valid_targets_min": 2115 }, { "epoch": 2.378419452887538, "grad_norm": 0.4053824724130465, "learning_rate": 3.340887604056301e-05, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.19125846028327942, "step": 1565, "valid_targets_mean": 5586.5, "valid_targets_min": 855 }, { "epoch": 2.386018237082067, "grad_norm": 0.467001631524023, "learning_rate": 3.335254498021404e-05, "loss": 0.1987, "loss_nan_ranks": 0, "loss_rank_avg": 0.21299326419830322, "step": 1570, "valid_targets_mean": 4965.8, "valid_targets_min": 333 }, { "epoch": 2.393617021276596, "grad_norm": 0.46807262963090795, "learning_rate": 3.329602216154594e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.21306315064430237, "step": 1575, "valid_targets_mean": 4142.6, "valid_targets_min": 618 }, { "epoch": 2.4012158054711246, "grad_norm": 0.4351369955863477, "learning_rate": 3.323930839629318e-05, "loss": 0.1885, "loss_nan_ranks": 0, "loss_rank_avg": 0.192465141415596, "step": 1580, "valid_targets_mean": 4713.5, "valid_targets_min": 805 }, { "epoch": 2.4088145896656536, "grad_norm": 0.4664276306785285, "learning_rate": 3.318240449893242e-05, "loss": 0.1994, "loss_nan_ranks": 0, "loss_rank_avg": 0.20806226134300232, "step": 1585, "valid_targets_mean": 4086.8, "valid_targets_min": 616 }, { "epoch": 2.4164133738601823, "grad_norm": 0.4691257656452498, "learning_rate": 3.3125311286670836e-05, "loss": 0.1982, "loss_nan_ranks": 0, "loss_rank_avg": 0.23262707889080048, "step": 1590, "valid_targets_mean": 4931.9, "valid_targets_min": 633 }, { "epoch": 2.4240121580547114, "grad_norm": 0.42906847559664973, "learning_rate": 3.3068029579434404e-05, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.19915705919265747, "step": 1595, "valid_targets_mean": 4431.0, "valid_targets_min": 397 }, { "epoch": 2.43161094224924, "grad_norm": 0.4018736513467274, "learning_rate": 3.3010560199856105e-05, "loss": 0.1935, "loss_nan_ranks": 0, "loss_rank_avg": 0.16372954845428467, "step": 1600, "valid_targets_mean": 5064.1, "valid_targets_min": 1229 }, { "epoch": 2.439209726443769, "grad_norm": 0.4520461458479404, "learning_rate": 3.2952903973264115e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.19510574638843536, "step": 1605, "valid_targets_mean": 4399.9, "valid_targets_min": 646 }, { "epoch": 2.4468085106382977, "grad_norm": 0.3918033831100767, "learning_rate": 3.289506172766997e-05, "loss": 0.1992, "loss_nan_ranks": 0, "loss_rank_avg": 0.1935116946697235, "step": 1610, "valid_targets_mean": 5341.8, "valid_targets_min": 801 }, { "epoch": 2.454407294832827, "grad_norm": 0.43294616241650447, "learning_rate": 3.283703429375663e-05, "loss": 0.1906, "loss_nan_ranks": 0, "loss_rank_avg": 0.16868659853935242, "step": 1615, "valid_targets_mean": 4395.4, "valid_targets_min": 518 }, { "epoch": 2.4620060790273555, "grad_norm": 0.5245421221092823, "learning_rate": 3.2778822504866594e-05, "loss": 0.1863, "loss_nan_ranks": 0, "loss_rank_avg": 0.2138800024986267, "step": 1620, "valid_targets_mean": 3523.9, "valid_targets_min": 736 }, { "epoch": 2.4696048632218845, "grad_norm": 0.44947552448463496, "learning_rate": 3.272042719698992e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.2089487910270691, "step": 1625, "valid_targets_mean": 4868.6, "valid_targets_min": 708 }, { "epoch": 2.477203647416413, "grad_norm": 0.5745948604608038, "learning_rate": 3.2661849208752205e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.15748457610607147, "step": 1630, "valid_targets_mean": 5253.4, "valid_targets_min": 1100 }, { "epoch": 2.4848024316109423, "grad_norm": 0.466310291931274, "learning_rate": 3.2603089381402574e-05, "loss": 0.2008, "loss_nan_ranks": 0, "loss_rank_avg": 0.18000131845474243, "step": 1635, "valid_targets_mean": 4540.9, "valid_targets_min": 594 }, { "epoch": 2.4924012158054714, "grad_norm": 0.4887847049484213, "learning_rate": 3.254414855880155e-05, "loss": 0.1979, "loss_nan_ranks": 0, "loss_rank_avg": 0.19799655675888062, "step": 1640, "valid_targets_mean": 3895.6, "valid_targets_min": 632 }, { "epoch": 2.5, "grad_norm": 0.44432072579472404, "learning_rate": 3.2485027587408965e-05, "loss": 0.1925, "loss_nan_ranks": 0, "loss_rank_avg": 0.18566831946372986, "step": 1645, "valid_targets_mean": 4716.8, "valid_targets_min": 785 }, { "epoch": 2.5075987841945286, "grad_norm": 0.7254579276839739, "learning_rate": 3.2425727316271814e-05, "loss": 0.2156, "loss_nan_ranks": 0, "loss_rank_avg": 0.2835049033164978, "step": 1650, "valid_targets_mean": 4848.5, "valid_targets_min": 1102 }, { "epoch": 2.5151975683890577, "grad_norm": 0.45281348742054633, "learning_rate": 3.2366248597012037e-05, "loss": 0.1921, "loss_nan_ranks": 0, "loss_rank_avg": 0.21764954924583435, "step": 1655, "valid_targets_mean": 4480.8, "valid_targets_min": 808 }, { "epoch": 2.522796352583587, "grad_norm": 0.45329008128640347, "learning_rate": 3.230659228381432e-05, "loss": 0.1872, "loss_nan_ranks": 0, "loss_rank_avg": 0.19859766960144043, "step": 1660, "valid_targets_mean": 4694.1, "valid_targets_min": 710 }, { "epoch": 2.5303951367781155, "grad_norm": 0.3991066726887112, "learning_rate": 3.2246759233413765e-05, "loss": 0.2077, "loss_nan_ranks": 0, "loss_rank_avg": 0.18775928020477295, "step": 1665, "valid_targets_mean": 5537.6, "valid_targets_min": 2270 }, { "epoch": 2.5379939209726445, "grad_norm": 0.45660075830572106, "learning_rate": 3.218675030508367e-05, "loss": 0.1992, "loss_nan_ranks": 0, "loss_rank_avg": 0.21159949898719788, "step": 1670, "valid_targets_mean": 4234.2, "valid_targets_min": 465 }, { "epoch": 2.545592705167173, "grad_norm": 0.47845524476355505, "learning_rate": 3.212656636062314e-05, "loss": 0.2034, "loss_nan_ranks": 0, "loss_rank_avg": 0.18367314338684082, "step": 1675, "valid_targets_mean": 3884.0, "valid_targets_min": 609 }, { "epoch": 2.5531914893617023, "grad_norm": 0.47337775511493685, "learning_rate": 3.2066208264344695e-05, "loss": 0.1954, "loss_nan_ranks": 0, "loss_rank_avg": 0.19395776093006134, "step": 1680, "valid_targets_mean": 4240.3, "valid_targets_min": 1731 }, { "epoch": 2.560790273556231, "grad_norm": 0.49086260546972615, "learning_rate": 3.200567688306192e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.2288236916065216, "step": 1685, "valid_targets_mean": 3920.8, "valid_targets_min": 658 }, { "epoch": 2.56838905775076, "grad_norm": 0.48820274570312466, "learning_rate": 3.194497308607694e-05, "loss": 0.2084, "loss_nan_ranks": 0, "loss_rank_avg": 0.2082967460155487, "step": 1690, "valid_targets_mean": 4256.8, "valid_targets_min": 440 }, { "epoch": 2.5759878419452886, "grad_norm": 0.43205681075466934, "learning_rate": 3.1884097745167986e-05, "loss": 0.1852, "loss_nan_ranks": 0, "loss_rank_avg": 0.1597200632095337, "step": 1695, "valid_targets_mean": 4130.8, "valid_targets_min": 878 }, { "epoch": 2.5835866261398177, "grad_norm": 0.5054254906668799, "learning_rate": 3.182305173457688e-05, "loss": 0.2034, "loss_nan_ranks": 0, "loss_rank_avg": 0.2262079417705536, "step": 1700, "valid_targets_mean": 4460.6, "valid_targets_min": 401 }, { "epoch": 2.5911854103343464, "grad_norm": 0.504689704310772, "learning_rate": 3.1761835930996424e-05, "loss": 0.1949, "loss_nan_ranks": 0, "loss_rank_avg": 0.1995968520641327, "step": 1705, "valid_targets_mean": 3648.3, "valid_targets_min": 558 }, { "epoch": 2.5987841945288754, "grad_norm": 0.4392316385094666, "learning_rate": 3.1700451213557896e-05, "loss": 0.2026, "loss_nan_ranks": 0, "loss_rank_avg": 0.20353609323501587, "step": 1710, "valid_targets_mean": 4641.1, "valid_targets_min": 845 }, { "epoch": 2.6063829787234045, "grad_norm": 0.44339996982872454, "learning_rate": 3.1638898463818336e-05, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.15977585315704346, "step": 1715, "valid_targets_mean": 4352.1, "valid_targets_min": 827 }, { "epoch": 2.613981762917933, "grad_norm": 0.5398477413573792, "learning_rate": 3.157717856574794e-05, "loss": 0.1842, "loss_nan_ranks": 0, "loss_rank_avg": 0.18378981947898865, "step": 1720, "valid_targets_mean": 4131.6, "valid_targets_min": 331 }, { "epoch": 2.621580547112462, "grad_norm": 0.39672349034501203, "learning_rate": 3.151529240571737e-05, "loss": 0.2048, "loss_nan_ranks": 0, "loss_rank_avg": 0.19032993912696838, "step": 1725, "valid_targets_mean": 5932.7, "valid_targets_min": 2148 }, { "epoch": 2.629179331306991, "grad_norm": 0.4826721393487148, "learning_rate": 3.1453240872484974e-05, "loss": 0.2209, "loss_nan_ranks": 0, "loss_rank_avg": 0.21052716672420502, "step": 1730, "valid_targets_mean": 4064.6, "valid_targets_min": 713 }, { "epoch": 2.63677811550152, "grad_norm": 0.40797959815259904, "learning_rate": 3.139102485718407e-05, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.18385851383209229, "step": 1735, "valid_targets_mean": 5094.5, "valid_targets_min": 774 }, { "epoch": 2.6443768996960486, "grad_norm": 0.49388764627269777, "learning_rate": 3.1328645253310136e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.20751240849494934, "step": 1740, "valid_targets_mean": 4489.2, "valid_targets_min": 668 }, { "epoch": 2.6519756838905773, "grad_norm": 0.41221441649011, "learning_rate": 3.126610295670798e-05, "loss": 0.1966, "loss_nan_ranks": 0, "loss_rank_avg": 0.18350102007389069, "step": 1745, "valid_targets_mean": 5068.5, "valid_targets_min": 1047 }, { "epoch": 2.6595744680851063, "grad_norm": 0.43487564674132706, "learning_rate": 3.120339886555885e-05, "loss": 0.2039, "loss_nan_ranks": 0, "loss_rank_avg": 0.1929788887500763, "step": 1750, "valid_targets_mean": 4648.7, "valid_targets_min": 1712 }, { "epoch": 2.6671732522796354, "grad_norm": 0.3931845374369816, "learning_rate": 3.114053388036757e-05, "loss": 0.1831, "loss_nan_ranks": 0, "loss_rank_avg": 0.17840635776519775, "step": 1755, "valid_targets_mean": 5762.4, "valid_targets_min": 537 }, { "epoch": 2.674772036474164, "grad_norm": 0.46325220533318656, "learning_rate": 3.1077508903949594e-05, "loss": 0.1857, "loss_nan_ranks": 0, "loss_rank_avg": 0.15973162651062012, "step": 1760, "valid_targets_mean": 4577.9, "valid_targets_min": 1190 }, { "epoch": 2.682370820668693, "grad_norm": 0.448314100365069, "learning_rate": 3.1014324841418025e-05, "loss": 0.1863, "loss_nan_ranks": 0, "loss_rank_avg": 0.21308580040931702, "step": 1765, "valid_targets_mean": 4523.5, "valid_targets_min": 689 }, { "epoch": 2.689969604863222, "grad_norm": 0.4126949676808008, "learning_rate": 3.095098260017065e-05, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.17054617404937744, "step": 1770, "valid_targets_mean": 4661.3, "valid_targets_min": 940 }, { "epoch": 2.697568389057751, "grad_norm": 0.520594987471646, "learning_rate": 3.088748308987687e-05, "loss": 0.1926, "loss_nan_ranks": 0, "loss_rank_avg": 0.18412724137306213, "step": 1775, "valid_targets_mean": 4541.3, "valid_targets_min": 425 }, { "epoch": 2.7051671732522795, "grad_norm": 0.4292929031518839, "learning_rate": 3.082382722246467e-05, "loss": 0.2083, "loss_nan_ranks": 0, "loss_rank_avg": 0.18564680218696594, "step": 1780, "valid_targets_mean": 4726.2, "valid_targets_min": 849 }, { "epoch": 2.7127659574468086, "grad_norm": 0.4143100769110258, "learning_rate": 3.07600159121075e-05, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.19952227175235748, "step": 1785, "valid_targets_mean": 6396.9, "valid_targets_min": 2406 }, { "epoch": 2.7203647416413372, "grad_norm": 0.5138412636257836, "learning_rate": 3.069605007521115e-05, "loss": 0.198, "loss_nan_ranks": 0, "loss_rank_avg": 0.21767953038215637, "step": 1790, "valid_targets_mean": 4080.7, "valid_targets_min": 855 }, { "epoch": 2.7279635258358663, "grad_norm": 0.9274624474305112, "learning_rate": 3.063193063040061e-05, "loss": 0.1951, "loss_nan_ranks": 0, "loss_rank_avg": 0.2023240178823471, "step": 1795, "valid_targets_mean": 4271.2, "valid_targets_min": 299 }, { "epoch": 2.735562310030395, "grad_norm": 0.4505218736377883, "learning_rate": 3.0567658498506835e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.19997933506965637, "step": 1800, "valid_targets_mean": 6215.2, "valid_targets_min": 834 }, { "epoch": 2.743161094224924, "grad_norm": 0.45112279832870705, "learning_rate": 3.050323460255359e-05, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.20109710097312927, "step": 1805, "valid_targets_mean": 4547.4, "valid_targets_min": 594 }, { "epoch": 2.750759878419453, "grad_norm": 0.45439465696192066, "learning_rate": 3.0438659867744104e-05, "loss": 0.2029, "loss_nan_ranks": 0, "loss_rank_avg": 0.22971929609775543, "step": 1810, "valid_targets_mean": 4679.8, "valid_targets_min": 630 }, { "epoch": 2.7583586626139818, "grad_norm": 0.4239951858010868, "learning_rate": 3.0373935221447846e-05, "loss": 0.1861, "loss_nan_ranks": 0, "loss_rank_avg": 0.18463487923145294, "step": 1815, "valid_targets_mean": 4548.8, "valid_targets_min": 832 }, { "epoch": 2.7659574468085104, "grad_norm": 0.46571130038179387, "learning_rate": 3.030906159318721e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.2257537692785263, "step": 1820, "valid_targets_mean": 4535.1, "valid_targets_min": 822 }, { "epoch": 2.7735562310030395, "grad_norm": 0.5251100785646777, "learning_rate": 3.0244039914624127e-05, "loss": 0.1944, "loss_nan_ranks": 0, "loss_rank_avg": 0.16839849948883057, "step": 1825, "valid_targets_mean": 4547.6, "valid_targets_min": 551 }, { "epoch": 2.7811550151975686, "grad_norm": 0.46551771612143145, "learning_rate": 3.017887111954671e-05, "loss": 0.2063, "loss_nan_ranks": 0, "loss_rank_avg": 0.21392841637134552, "step": 1830, "valid_targets_mean": 4989.8, "valid_targets_min": 1092 }, { "epoch": 2.788753799392097, "grad_norm": 0.45282545824018966, "learning_rate": 3.0113556143855836e-05, "loss": 0.1769, "loss_nan_ranks": 0, "loss_rank_avg": 0.17507150769233704, "step": 1835, "valid_targets_mean": 3937.5, "valid_targets_min": 433 }, { "epoch": 2.7963525835866263, "grad_norm": 0.8573211013484289, "learning_rate": 3.004809592555172e-05, "loss": 0.1924, "loss_nan_ranks": 0, "loss_rank_avg": 0.1929873377084732, "step": 1840, "valid_targets_mean": 4398.6, "valid_targets_min": 447 }, { "epoch": 2.803951367781155, "grad_norm": 0.4511946895966249, "learning_rate": 2.9982491404720408e-05, "loss": 0.2171, "loss_nan_ranks": 0, "loss_rank_avg": 0.25569894909858704, "step": 1845, "valid_targets_mean": 5263.1, "valid_targets_min": 704 }, { "epoch": 2.811550151975684, "grad_norm": 0.4075365034632511, "learning_rate": 2.9916743523520336e-05, "loss": 0.1807, "loss_nan_ranks": 0, "loss_rank_avg": 0.18254083395004272, "step": 1850, "valid_targets_mean": 5106.1, "valid_targets_min": 1353 }, { "epoch": 2.8191489361702127, "grad_norm": 0.39703735203471957, "learning_rate": 2.9850853226168738e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.1689942181110382, "step": 1855, "valid_targets_mean": 5267.1, "valid_targets_min": 1235 }, { "epoch": 2.8267477203647418, "grad_norm": 0.4300034911707786, "learning_rate": 2.9784821458928116e-05, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.19870391488075256, "step": 1860, "valid_targets_mean": 4619.8, "valid_targets_min": 672 }, { "epoch": 2.8343465045592704, "grad_norm": 0.4731017750575238, "learning_rate": 2.9718649170092653e-05, "loss": 0.2051, "loss_nan_ranks": 0, "loss_rank_avg": 0.2331341654062271, "step": 1865, "valid_targets_mean": 4517.1, "valid_targets_min": 673 }, { "epoch": 2.8419452887537995, "grad_norm": 0.47588128492307696, "learning_rate": 2.9652337309974582e-05, "loss": 0.1766, "loss_nan_ranks": 0, "loss_rank_avg": 0.17996634542942047, "step": 1870, "valid_targets_mean": 3985.2, "valid_targets_min": 962 }, { "epoch": 2.849544072948328, "grad_norm": 0.5647869677542844, "learning_rate": 2.958588683089056e-05, "loss": 0.194, "loss_nan_ranks": 0, "loss_rank_avg": 0.21768032014369965, "step": 1875, "valid_targets_mean": 3708.1, "valid_targets_min": 342 }, { "epoch": 2.857142857142857, "grad_norm": 0.4169198649338515, "learning_rate": 2.9519298687147945e-05, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.17996545135974884, "step": 1880, "valid_targets_mean": 4830.1, "valid_targets_min": 834 }, { "epoch": 2.8647416413373863, "grad_norm": 0.46342593085414296, "learning_rate": 2.9452573835031154e-05, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.17930959165096283, "step": 1885, "valid_targets_mean": 5006.9, "valid_targets_min": 1043 }, { "epoch": 2.872340425531915, "grad_norm": 0.5952920705102613, "learning_rate": 2.9385713232787877e-05, "loss": 0.1878, "loss_nan_ranks": 0, "loss_rank_avg": 0.17503748834133148, "step": 1890, "valid_targets_mean": 4345.5, "valid_targets_min": 702 }, { "epoch": 2.8799392097264436, "grad_norm": 1.5179001765998326, "learning_rate": 2.9318717840615352e-05, "loss": 0.1895, "loss_nan_ranks": 0, "loss_rank_avg": 0.17403315007686615, "step": 1895, "valid_targets_mean": 5409.5, "valid_targets_min": 2159 }, { "epoch": 2.8875379939209727, "grad_norm": 0.45039073631427357, "learning_rate": 2.9251588620646543e-05, "loss": 0.2208, "loss_nan_ranks": 0, "loss_rank_avg": 0.19473648071289062, "step": 1900, "valid_targets_mean": 4456.6, "valid_targets_min": 561 }, { "epoch": 2.8951367781155017, "grad_norm": 0.5386037897816643, "learning_rate": 2.9184326536936356e-05, "loss": 0.1999, "loss_nan_ranks": 0, "loss_rank_avg": 0.20459288358688354, "step": 1905, "valid_targets_mean": 5313.1, "valid_targets_min": 1889 }, { "epoch": 2.9027355623100304, "grad_norm": 0.5171036731287691, "learning_rate": 2.9116932555447764e-05, "loss": 0.1924, "loss_nan_ranks": 0, "loss_rank_avg": 0.19427910447120667, "step": 1910, "valid_targets_mean": 4551.8, "valid_targets_min": 640 }, { "epoch": 2.910334346504559, "grad_norm": 0.3956323253175454, "learning_rate": 2.904940764403795e-05, "loss": 0.1921, "loss_nan_ranks": 0, "loss_rank_avg": 0.16807705163955688, "step": 1915, "valid_targets_mean": 5148.9, "valid_targets_min": 1114 }, { "epoch": 2.917933130699088, "grad_norm": 0.4609179179948364, "learning_rate": 2.898175277244441e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.18651928007602692, "step": 1920, "valid_targets_mean": 4270.8, "valid_targets_min": 829 }, { "epoch": 2.925531914893617, "grad_norm": 0.3746013132633794, "learning_rate": 2.891396891227103e-05, "loss": 0.1966, "loss_nan_ranks": 0, "loss_rank_avg": 0.18432965874671936, "step": 1925, "valid_targets_mean": 5464.6, "valid_targets_min": 869 }, { "epoch": 2.933130699088146, "grad_norm": 0.44757073319717156, "learning_rate": 2.88460570369741e-05, "loss": 0.1966, "loss_nan_ranks": 0, "loss_rank_avg": 0.2037007212638855, "step": 1930, "valid_targets_mean": 5044.7, "valid_targets_min": 650 }, { "epoch": 2.940729483282675, "grad_norm": 0.5165497089688482, "learning_rate": 2.877801812184838e-05, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.19577309489250183, "step": 1935, "valid_targets_mean": 3723.6, "valid_targets_min": 263 }, { "epoch": 2.9483282674772036, "grad_norm": 0.5248044839976569, "learning_rate": 2.8709853144013063e-05, "loss": 0.2038, "loss_nan_ranks": 0, "loss_rank_avg": 0.17888793349266052, "step": 1940, "valid_targets_mean": 5473.5, "valid_targets_min": 2971 }, { "epoch": 2.9559270516717326, "grad_norm": 0.46290978562548923, "learning_rate": 2.8641563082397755e-05, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.19724613428115845, "step": 1945, "valid_targets_mean": 4504.6, "valid_targets_min": 683 }, { "epoch": 2.9635258358662613, "grad_norm": 0.47247130378721536, "learning_rate": 2.857314891772841e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.1742001324892044, "step": 1950, "valid_targets_mean": 4378.8, "valid_targets_min": 900 }, { "epoch": 2.9711246200607904, "grad_norm": 0.38540265276997787, "learning_rate": 2.850461163251325e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.1545667052268982, "step": 1955, "valid_targets_mean": 4485.9, "valid_targets_min": 825 }, { "epoch": 2.978723404255319, "grad_norm": 0.4375842807396514, "learning_rate": 2.8435952211028652e-05, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.20349517464637756, "step": 1960, "valid_targets_mean": 4611.9, "valid_targets_min": 1259 }, { "epoch": 2.986322188449848, "grad_norm": 0.393339700104493, "learning_rate": 2.8367171639305014e-05, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.1762651801109314, "step": 1965, "valid_targets_mean": 4854.0, "valid_targets_min": 1188 }, { "epoch": 2.9939209726443767, "grad_norm": 0.4408583709677064, "learning_rate": 2.8298270905112598e-05, "loss": 0.2093, "loss_nan_ranks": 0, "loss_rank_avg": 0.17071180045604706, "step": 1970, "valid_targets_mean": 4334.9, "valid_targets_min": 1033 }, { "epoch": 3.001519756838906, "grad_norm": 0.4509769720521314, "learning_rate": 2.8229250997947338e-05, "loss": 0.1899, "loss_nan_ranks": 0, "loss_rank_avg": 0.19761110842227936, "step": 1975, "valid_targets_mean": 5020.1, "valid_targets_min": 464 }, { "epoch": 3.0091185410334345, "grad_norm": 0.44397107618825393, "learning_rate": 2.8160112909016627e-05, "loss": 0.1964, "loss_nan_ranks": 0, "loss_rank_avg": 0.15861201286315918, "step": 1980, "valid_targets_mean": 4464.9, "valid_targets_min": 434 }, { "epoch": 3.0167173252279635, "grad_norm": 0.4590917607720272, "learning_rate": 2.8090857631225105e-05, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.17721785604953766, "step": 1985, "valid_targets_mean": 4993.2, "valid_targets_min": 443 }, { "epoch": 3.024316109422492, "grad_norm": 1.6476449501443067, "learning_rate": 2.8021486159160365e-05, "loss": 0.1809, "loss_nan_ranks": 0, "loss_rank_avg": 0.21059048175811768, "step": 1990, "valid_targets_mean": 3777.8, "valid_targets_min": 567 }, { "epoch": 3.0319148936170213, "grad_norm": 0.3955766292317692, "learning_rate": 2.7951999489078697e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.15698814392089844, "step": 1995, "valid_targets_mean": 5706.5, "valid_targets_min": 1789 }, { "epoch": 3.0395136778115504, "grad_norm": 0.6060112559647506, "learning_rate": 2.7882398618890763e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.17217731475830078, "step": 2000, "valid_targets_mean": 4799.2, "valid_targets_min": 675 }, { "epoch": 3.047112462006079, "grad_norm": 0.48214170254530214, "learning_rate": 2.781268454814728e-05, "loss": 0.1743, "loss_nan_ranks": 0, "loss_rank_avg": 0.18182724714279175, "step": 2005, "valid_targets_mean": 4482.8, "valid_targets_min": 268 }, { "epoch": 3.054711246200608, "grad_norm": 0.4254186774774426, "learning_rate": 2.7742858278024657e-05, "loss": 0.1831, "loss_nan_ranks": 0, "loss_rank_avg": 0.17712415754795074, "step": 2010, "valid_targets_mean": 5016.2, "valid_targets_min": 933 }, { "epoch": 3.0623100303951367, "grad_norm": 0.4561837122624953, "learning_rate": 2.7672920811310615e-05, "loss": 0.1813, "loss_nan_ranks": 0, "loss_rank_avg": 0.1763693392276764, "step": 2015, "valid_targets_mean": 5105.2, "valid_targets_min": 1198 }, { "epoch": 3.069908814589666, "grad_norm": 0.6538535804895353, "learning_rate": 2.7602873152389795e-05, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.15733420848846436, "step": 2020, "valid_targets_mean": 4136.8, "valid_targets_min": 1002 }, { "epoch": 3.0775075987841944, "grad_norm": 0.4383597724717559, "learning_rate": 2.7532716307229325e-05, "loss": 0.1855, "loss_nan_ranks": 0, "loss_rank_avg": 0.18817880749702454, "step": 2025, "valid_targets_mean": 4361.4, "valid_targets_min": 566 }, { "epoch": 3.0851063829787235, "grad_norm": 0.4468187218329756, "learning_rate": 2.7462451283364372e-05, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.18754516541957855, "step": 2030, "valid_targets_mean": 5809.6, "valid_targets_min": 2367 }, { "epoch": 3.092705167173252, "grad_norm": 0.4923380379793573, "learning_rate": 2.739207908988369e-05, "loss": 0.1697, "loss_nan_ranks": 0, "loss_rank_avg": 0.1901119500398636, "step": 2035, "valid_targets_mean": 4648.6, "valid_targets_min": 651 }, { "epoch": 3.1003039513677813, "grad_norm": 0.43950335258891504, "learning_rate": 2.7321600737415103e-05, "loss": 0.1882, "loss_nan_ranks": 0, "loss_rank_avg": 0.1579056680202484, "step": 2040, "valid_targets_mean": 4848.3, "valid_targets_min": 513 }, { "epoch": 3.10790273556231, "grad_norm": 0.43941575889354745, "learning_rate": 2.7251017238111014e-05, "loss": 0.1818, "loss_nan_ranks": 0, "loss_rank_avg": 0.17752686142921448, "step": 2045, "valid_targets_mean": 4887.9, "valid_targets_min": 552 }, { "epoch": 3.115501519756839, "grad_norm": 0.43006557381731564, "learning_rate": 2.718032960563384e-05, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.1756466031074524, "step": 2050, "valid_targets_mean": 5296.2, "valid_targets_min": 1395 }, { "epoch": 3.1231003039513676, "grad_norm": 0.3962603202091622, "learning_rate": 2.710953885514149e-05, "loss": 0.1642, "loss_nan_ranks": 0, "loss_rank_avg": 0.13223829865455627, "step": 2055, "valid_targets_mean": 4657.5, "valid_targets_min": 1941 }, { "epoch": 3.1306990881458967, "grad_norm": 0.47787066171111203, "learning_rate": 2.7038646003272778e-05, "loss": 0.178, "loss_nan_ranks": 0, "loss_rank_avg": 0.1752995252609253, "step": 2060, "valid_targets_mean": 4332.5, "valid_targets_min": 523 }, { "epoch": 3.1382978723404253, "grad_norm": 0.49333053682614264, "learning_rate": 2.6967652068132787e-05, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.1864144653081894, "step": 2065, "valid_targets_mean": 3611.1, "valid_targets_min": 567 }, { "epoch": 3.1458966565349544, "grad_norm": 0.4781276995658994, "learning_rate": 2.6896558069278294e-05, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.14743542671203613, "step": 2070, "valid_targets_mean": 4010.8, "valid_targets_min": 543 }, { "epoch": 3.1534954407294835, "grad_norm": 0.4481532756441824, "learning_rate": 2.6825365027703104e-05, "loss": 0.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.1980597823858261, "step": 2075, "valid_targets_mean": 5291.1, "valid_targets_min": 446 }, { "epoch": 3.161094224924012, "grad_norm": 0.44883490224285716, "learning_rate": 2.6754073965823394e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.19897349178791046, "step": 2080, "valid_targets_mean": 5601.1, "valid_targets_min": 460 }, { "epoch": 3.1686930091185412, "grad_norm": 0.47818122842888633, "learning_rate": 2.668268590746303e-05, "loss": 0.17, "loss_nan_ranks": 0, "loss_rank_avg": 0.16886334121227264, "step": 2085, "valid_targets_mean": 3956.9, "valid_targets_min": 672 }, { "epoch": 3.17629179331307, "grad_norm": 0.44699975246028895, "learning_rate": 2.6611201877838858e-05, "loss": 0.173, "loss_nan_ranks": 0, "loss_rank_avg": 0.1886739879846573, "step": 2090, "valid_targets_mean": 5496.0, "valid_targets_min": 1891 }, { "epoch": 3.183890577507599, "grad_norm": 0.46241733640368204, "learning_rate": 2.6539622903545992e-05, "loss": 0.1736, "loss_nan_ranks": 0, "loss_rank_avg": 0.16013459861278534, "step": 2095, "valid_targets_mean": 5061.5, "valid_targets_min": 842 }, { "epoch": 3.1914893617021276, "grad_norm": 0.419537783672445, "learning_rate": 2.6467950012543055e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.15453095734119415, "step": 2100, "valid_targets_mean": 5147.8, "valid_targets_min": 1776 }, { "epoch": 3.1990881458966567, "grad_norm": 0.4430059744559326, "learning_rate": 2.639618423413742e-05, "loss": 0.1786, "loss_nan_ranks": 0, "loss_rank_avg": 0.15962053835391998, "step": 2105, "valid_targets_mean": 4258.2, "valid_targets_min": 719 }, { "epoch": 3.2066869300911853, "grad_norm": 0.4601551349059534, "learning_rate": 2.6324326598970447e-05, "loss": 0.1801, "loss_nan_ranks": 0, "loss_rank_avg": 0.19752000272274017, "step": 2110, "valid_targets_mean": 5594.7, "valid_targets_min": 2157 }, { "epoch": 3.2142857142857144, "grad_norm": 0.4432941671854632, "learning_rate": 2.6252378139002666e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.16792172193527222, "step": 2115, "valid_targets_mean": 4681.6, "valid_targets_min": 831 }, { "epoch": 3.221884498480243, "grad_norm": 1.0521842556961734, "learning_rate": 2.618033988749895e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.18343770503997803, "step": 2120, "valid_targets_mean": 4442.8, "valid_targets_min": 593 }, { "epoch": 3.229483282674772, "grad_norm": 0.4703582807896684, "learning_rate": 2.6108212879013694e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.182417631149292, "step": 2125, "valid_targets_mean": 5050.2, "valid_targets_min": 882 }, { "epoch": 3.237082066869301, "grad_norm": 0.5066204484636513, "learning_rate": 2.6035998149375928e-05, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.23296314477920532, "step": 2130, "valid_targets_mean": 4509.6, "valid_targets_min": 585 }, { "epoch": 3.24468085106383, "grad_norm": 0.47427217437454394, "learning_rate": 2.5963696735674487e-05, "loss": 0.1738, "loss_nan_ranks": 0, "loss_rank_avg": 0.1860450804233551, "step": 2135, "valid_targets_mean": 4647.2, "valid_targets_min": 697 }, { "epoch": 3.2522796352583585, "grad_norm": 0.4250698588091916, "learning_rate": 2.5891309676243084e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.16689786314964294, "step": 2140, "valid_targets_mean": 4561.6, "valid_targets_min": 756 }, { "epoch": 3.2598784194528876, "grad_norm": 0.47029762963920585, "learning_rate": 2.5818838010645393e-05, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.15192772448062897, "step": 2145, "valid_targets_mean": 4186.0, "valid_targets_min": 434 }, { "epoch": 3.2674772036474162, "grad_norm": 0.4554599632142264, "learning_rate": 2.5746282779660145e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.17261144518852234, "step": 2150, "valid_targets_mean": 4568.7, "valid_targets_min": 1854 }, { "epoch": 3.2750759878419453, "grad_norm": 0.4502827257632833, "learning_rate": 2.5673645025266174e-05, "loss": 0.178, "loss_nan_ranks": 0, "loss_rank_avg": 0.1779678761959076, "step": 2155, "valid_targets_mean": 4289.7, "valid_targets_min": 781 }, { "epoch": 3.282674772036474, "grad_norm": 0.4787827101748988, "learning_rate": 2.5600925790627423e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.1940232217311859, "step": 2160, "valid_targets_mean": 4486.1, "valid_targets_min": 171 }, { "epoch": 3.290273556231003, "grad_norm": 0.45438086048067683, "learning_rate": 2.5528126120078018e-05, "loss": 0.1949, "loss_nan_ranks": 0, "loss_rank_avg": 0.19441285729408264, "step": 2165, "valid_targets_mean": 5050.3, "valid_targets_min": 1728 }, { "epoch": 3.297872340425532, "grad_norm": 0.40566641587346486, "learning_rate": 2.545524705910722e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.17091290652751923, "step": 2170, "valid_targets_mean": 5804.4, "valid_targets_min": 1156 }, { "epoch": 3.3054711246200608, "grad_norm": 0.42598008462425585, "learning_rate": 2.5382289654344433e-05, "loss": 0.1803, "loss_nan_ranks": 0, "loss_rank_avg": 0.16645470261573792, "step": 2175, "valid_targets_mean": 4971.6, "valid_targets_min": 673 }, { "epoch": 3.31306990881459, "grad_norm": 0.440353868517696, "learning_rate": 2.530925495354418e-05, "loss": 0.1739, "loss_nan_ranks": 0, "loss_rank_avg": 0.17304345965385437, "step": 2180, "valid_targets_mean": 4552.6, "valid_targets_min": 1465 }, { "epoch": 3.3206686930091185, "grad_norm": 0.45749279193739023, "learning_rate": 2.523614400557103e-05, "loss": 0.167, "loss_nan_ranks": 0, "loss_rank_avg": 0.16047537326812744, "step": 2185, "valid_targets_mean": 4131.4, "valid_targets_min": 641 }, { "epoch": 3.3282674772036476, "grad_norm": 0.42763280388882297, "learning_rate": 2.516295786038457e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.19560299813747406, "step": 2190, "valid_targets_mean": 5307.1, "valid_targets_min": 686 }, { "epoch": 3.335866261398176, "grad_norm": 0.45229487644284055, "learning_rate": 2.5089697569024293e-05, "loss": 0.1744, "loss_nan_ranks": 0, "loss_rank_avg": 0.17956998944282532, "step": 2195, "valid_targets_mean": 4415.1, "valid_targets_min": 479 }, { "epoch": 3.3434650455927053, "grad_norm": 0.49947402828635423, "learning_rate": 2.501636418359453e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.19726476073265076, "step": 2200, "valid_targets_mean": 4160.0, "valid_targets_min": 702 }, { "epoch": 3.351063829787234, "grad_norm": 0.5624015949940533, "learning_rate": 2.4942958757249322e-05, "loss": 0.1751, "loss_nan_ranks": 0, "loss_rank_avg": 0.17548981308937073, "step": 2205, "valid_targets_mean": 4641.6, "valid_targets_min": 741 }, { "epoch": 3.358662613981763, "grad_norm": 0.47188014259395983, "learning_rate": 2.4869482344177297e-05, "loss": 0.1912, "loss_nan_ranks": 0, "loss_rank_avg": 0.191510871052742, "step": 2210, "valid_targets_mean": 5098.9, "valid_targets_min": 732 }, { "epoch": 3.3662613981762917, "grad_norm": 0.4044372525372168, "learning_rate": 2.479593599958655e-05, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.1595427691936493, "step": 2215, "valid_targets_mean": 4987.1, "valid_targets_min": 2150 }, { "epoch": 3.3738601823708207, "grad_norm": 0.4610514723176418, "learning_rate": 2.472232077968947e-05, "loss": 0.1863, "loss_nan_ranks": 0, "loss_rank_avg": 0.18796592950820923, "step": 2220, "valid_targets_mean": 4755.8, "valid_targets_min": 804 }, { "epoch": 3.3814589665653494, "grad_norm": 0.4762033973991841, "learning_rate": 2.4648637741687572e-05, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.17647765576839447, "step": 2225, "valid_targets_mean": 4052.8, "valid_targets_min": 1097 }, { "epoch": 3.3890577507598785, "grad_norm": 0.5674700704733731, "learning_rate": 2.4574887943756322e-05, "loss": 0.1841, "loss_nan_ranks": 0, "loss_rank_avg": 0.21014189720153809, "step": 2230, "valid_targets_mean": 5642.9, "valid_targets_min": 887 }, { "epoch": 3.396656534954407, "grad_norm": 0.45407587371796526, "learning_rate": 2.450107244502994e-05, "loss": 0.1911, "loss_nan_ranks": 0, "loss_rank_avg": 0.18419310450553894, "step": 2235, "valid_targets_mean": 4964.2, "valid_targets_min": 631 }, { "epoch": 3.404255319148936, "grad_norm": 0.6036076286770431, "learning_rate": 2.442719230558619e-05, "loss": 0.1935, "loss_nan_ranks": 0, "loss_rank_avg": 0.19704486429691315, "step": 2240, "valid_targets_mean": 3990.9, "valid_targets_min": 879 }, { "epoch": 3.4118541033434653, "grad_norm": 0.5044426709371705, "learning_rate": 2.435324858643114e-05, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.17976920306682587, "step": 2245, "valid_targets_mean": 4607.1, "valid_targets_min": 276 }, { "epoch": 3.419452887537994, "grad_norm": 0.47427419752248345, "learning_rate": 2.4279242349483945e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.18903280794620514, "step": 2250, "valid_targets_mean": 4716.1, "valid_targets_min": 1806 }, { "epoch": 3.4270516717325226, "grad_norm": 0.5315098096977057, "learning_rate": 2.42051746575616e-05, "loss": 0.1807, "loss_nan_ranks": 0, "loss_rank_avg": 0.22392138838768005, "step": 2255, "valid_targets_mean": 3496.4, "valid_targets_min": 263 }, { "epoch": 3.4346504559270516, "grad_norm": 0.39060444130604355, "learning_rate": 2.413104657436365e-05, "loss": 0.1621, "loss_nan_ranks": 0, "loss_rank_avg": 0.14147084951400757, "step": 2260, "valid_targets_mean": 4482.1, "valid_targets_min": 527 }, { "epoch": 3.4422492401215807, "grad_norm": 0.44338388859066824, "learning_rate": 2.4056859164456933e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.20094552636146545, "step": 2265, "valid_targets_mean": 5268.6, "valid_targets_min": 601 }, { "epoch": 3.4498480243161094, "grad_norm": 0.4361432780966179, "learning_rate": 2.3982613493260298e-05, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.1768036186695099, "step": 2270, "valid_targets_mean": 5291.0, "valid_targets_min": 506 }, { "epoch": 3.4574468085106385, "grad_norm": 0.5069263015357972, "learning_rate": 2.390831062702929e-05, "loss": 0.1829, "loss_nan_ranks": 0, "loss_rank_avg": 0.19090662896633148, "step": 2275, "valid_targets_mean": 4792.0, "valid_targets_min": 361 }, { "epoch": 3.465045592705167, "grad_norm": 0.40616123029264917, "learning_rate": 2.383395163284083e-05, "loss": 0.1709, "loss_nan_ranks": 0, "loss_rank_avg": 0.15730628371238708, "step": 2280, "valid_targets_mean": 5398.0, "valid_targets_min": 1965 }, { "epoch": 3.472644376899696, "grad_norm": 0.4339438381996928, "learning_rate": 2.3759537578577926e-05, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.16227596998214722, "step": 2285, "valid_targets_mean": 5389.4, "valid_targets_min": 682 }, { "epoch": 3.480243161094225, "grad_norm": 0.44867888022495267, "learning_rate": 2.3685069532914292e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.1895052194595337, "step": 2290, "valid_targets_mean": 5373.5, "valid_targets_min": 1378 }, { "epoch": 3.487841945288754, "grad_norm": 0.45859302831224075, "learning_rate": 2.3610548565299044e-05, "loss": 0.1759, "loss_nan_ranks": 0, "loss_rank_avg": 0.161161869764328, "step": 2295, "valid_targets_mean": 4974.8, "valid_targets_min": 963 }, { "epoch": 3.4954407294832825, "grad_norm": 0.47990973790811997, "learning_rate": 2.35359757459413e-05, "loss": 0.1861, "loss_nan_ranks": 0, "loss_rank_avg": 0.1807297170162201, "step": 2300, "valid_targets_mean": 3966.6, "valid_targets_min": 594 }, { "epoch": 3.5030395136778116, "grad_norm": 0.4458814501241054, "learning_rate": 2.3461352145794835e-05, "loss": 0.1871, "loss_nan_ranks": 0, "loss_rank_avg": 0.1584734320640564, "step": 2305, "valid_targets_mean": 4710.0, "valid_targets_min": 1068 }, { "epoch": 3.5106382978723403, "grad_norm": 0.5204277337187776, "learning_rate": 2.338667883654271e-05, "loss": 0.1726, "loss_nan_ranks": 0, "loss_rank_avg": 0.19432294368743896, "step": 2310, "valid_targets_mean": 3841.7, "valid_targets_min": 403 }, { "epoch": 3.5182370820668694, "grad_norm": 0.5002703947790278, "learning_rate": 2.3311956890581845e-05, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.1830371916294098, "step": 2315, "valid_targets_mean": 4266.8, "valid_targets_min": 588 }, { "epoch": 3.5258358662613984, "grad_norm": 0.45671055489988216, "learning_rate": 2.3237187381007654e-05, "loss": 0.1758, "loss_nan_ranks": 0, "loss_rank_avg": 0.17926675081253052, "step": 2320, "valid_targets_mean": 4515.0, "valid_targets_min": 654 }, { "epoch": 3.533434650455927, "grad_norm": 0.44706162372061575, "learning_rate": 2.3162371381598627e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.17958760261535645, "step": 2325, "valid_targets_mean": 4538.9, "valid_targets_min": 646 }, { "epoch": 3.5410334346504557, "grad_norm": 0.48526337740475023, "learning_rate": 2.308750996680089e-05, "loss": 0.1857, "loss_nan_ranks": 0, "loss_rank_avg": 0.1857941448688507, "step": 2330, "valid_targets_mean": 4541.9, "valid_targets_min": 718 }, { "epoch": 3.548632218844985, "grad_norm": 0.6863209953782875, "learning_rate": 2.3012604211712787e-05, "loss": 0.1801, "loss_nan_ranks": 0, "loss_rank_avg": 0.15989352762699127, "step": 2335, "valid_targets_mean": 4711.3, "valid_targets_min": 905 }, { "epoch": 3.556231003039514, "grad_norm": 0.43601817882878313, "learning_rate": 2.2937655192069453e-05, "loss": 0.1727, "loss_nan_ranks": 0, "loss_rank_avg": 0.15695396065711975, "step": 2340, "valid_targets_mean": 4525.1, "valid_targets_min": 554 }, { "epoch": 3.5638297872340425, "grad_norm": 0.4384690019868411, "learning_rate": 2.286266398422734e-05, "loss": 0.1885, "loss_nan_ranks": 0, "loss_rank_avg": 0.17277196049690247, "step": 2345, "valid_targets_mean": 5536.7, "valid_targets_min": 966 }, { "epoch": 3.571428571428571, "grad_norm": 0.50720927906344, "learning_rate": 2.278763166514879e-05, "loss": 0.1735, "loss_nan_ranks": 0, "loss_rank_avg": 0.1746547669172287, "step": 2350, "valid_targets_mean": 4262.4, "valid_targets_min": 688 }, { "epoch": 3.5790273556231003, "grad_norm": 0.5082859794711881, "learning_rate": 2.2712559312386525e-05, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.16094228625297546, "step": 2355, "valid_targets_mean": 4750.5, "valid_targets_min": 354 }, { "epoch": 3.5866261398176293, "grad_norm": 0.5324693739038185, "learning_rate": 2.2637448004068227e-05, "loss": 0.186, "loss_nan_ranks": 0, "loss_rank_avg": 0.1898549497127533, "step": 2360, "valid_targets_mean": 4889.1, "valid_targets_min": 868 }, { "epoch": 3.594224924012158, "grad_norm": 0.40332096235924436, "learning_rate": 2.2562298818881005e-05, "loss": 0.1729, "loss_nan_ranks": 0, "loss_rank_avg": 0.1677415668964386, "step": 2365, "valid_targets_mean": 4815.6, "valid_targets_min": 449 }, { "epoch": 3.601823708206687, "grad_norm": 0.4975962462446565, "learning_rate": 2.2487112836055932e-05, "loss": 0.1714, "loss_nan_ranks": 0, "loss_rank_avg": 0.1909307986497879, "step": 2370, "valid_targets_mean": 4240.7, "valid_targets_min": 873 }, { "epoch": 3.6094224924012157, "grad_norm": 0.4333440171846238, "learning_rate": 2.241189113535253e-05, "loss": 0.1729, "loss_nan_ranks": 0, "loss_rank_avg": 0.17210185527801514, "step": 2375, "valid_targets_mean": 4546.3, "valid_targets_min": 814 }, { "epoch": 3.617021276595745, "grad_norm": 0.4286229722867218, "learning_rate": 2.2336634797043294e-05, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.17077794671058655, "step": 2380, "valid_targets_mean": 4828.9, "valid_targets_min": 2075 }, { "epoch": 3.6246200607902734, "grad_norm": 0.5351152453484341, "learning_rate": 2.226134490189813e-05, "loss": 0.1864, "loss_nan_ranks": 0, "loss_rank_avg": 0.20225580036640167, "step": 2385, "valid_targets_mean": 4493.8, "valid_targets_min": 816 }, { "epoch": 3.6322188449848025, "grad_norm": 0.4595793337143316, "learning_rate": 2.2186022531168877e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.18067389726638794, "step": 2390, "valid_targets_mean": 4226.4, "valid_targets_min": 876 }, { "epoch": 3.639817629179331, "grad_norm": 0.4376288036773449, "learning_rate": 2.2110668766573756e-05, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.17458736896514893, "step": 2395, "valid_targets_mean": 4607.4, "valid_targets_min": 378 }, { "epoch": 3.6474164133738602, "grad_norm": 0.4235273238288212, "learning_rate": 2.2035284690281835e-05, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.16206535696983337, "step": 2400, "valid_targets_mean": 4671.6, "valid_targets_min": 427 }, { "epoch": 3.655015197568389, "grad_norm": 0.4645835996278293, "learning_rate": 2.1959871384897508e-05, "loss": 0.168, "loss_nan_ranks": 0, "loss_rank_avg": 0.1612105816602707, "step": 2405, "valid_targets_mean": 4012.2, "valid_targets_min": 736 }, { "epoch": 3.662613981762918, "grad_norm": 0.4339263612443116, "learning_rate": 2.188442993344492e-05, "loss": 0.1828, "loss_nan_ranks": 0, "loss_rank_avg": 0.18110080063343048, "step": 2410, "valid_targets_mean": 5371.9, "valid_targets_min": 1880 }, { "epoch": 3.670212765957447, "grad_norm": 0.5156390412963044, "learning_rate": 2.1808961419352433e-05, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.19328826665878296, "step": 2415, "valid_targets_mean": 5049.5, "valid_targets_min": 1733 }, { "epoch": 3.6778115501519757, "grad_norm": 0.4257958182746545, "learning_rate": 2.173346692643706e-05, "loss": 0.165, "loss_nan_ranks": 0, "loss_rank_avg": 0.15053753554821014, "step": 2420, "valid_targets_mean": 4545.5, "valid_targets_min": 845 }, { "epoch": 3.6854103343465043, "grad_norm": 0.41421446171755727, "learning_rate": 2.1657947538888907e-05, "loss": 0.1751, "loss_nan_ranks": 0, "loss_rank_avg": 0.15670928359031677, "step": 2425, "valid_targets_mean": 4735.4, "valid_targets_min": 2303 }, { "epoch": 3.6930091185410334, "grad_norm": 0.46488209722389967, "learning_rate": 2.158240434125557e-05, "loss": 0.1809, "loss_nan_ranks": 0, "loss_rank_avg": 0.17502865195274353, "step": 2430, "valid_targets_mean": 4069.9, "valid_targets_min": 843 }, { "epoch": 3.7006079027355625, "grad_norm": 0.44273639823588856, "learning_rate": 2.150683841842662e-05, "loss": 0.1701, "loss_nan_ranks": 0, "loss_rank_avg": 0.17152325809001923, "step": 2435, "valid_targets_mean": 4846.6, "valid_targets_min": 1167 }, { "epoch": 3.708206686930091, "grad_norm": 0.41156415643010313, "learning_rate": 2.1431250855617978e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.15151536464691162, "step": 2440, "valid_targets_mean": 4472.1, "valid_targets_min": 280 }, { "epoch": 3.71580547112462, "grad_norm": 0.45636761630984557, "learning_rate": 2.1355642738356327e-05, "loss": 0.1666, "loss_nan_ranks": 0, "loss_rank_avg": 0.16730879247188568, "step": 2445, "valid_targets_mean": 3877.2, "valid_targets_min": 406 }, { "epoch": 3.723404255319149, "grad_norm": 0.41821546008836596, "learning_rate": 2.128001515246355e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.1652117371559143, "step": 2450, "valid_targets_mean": 5117.6, "valid_targets_min": 1054 }, { "epoch": 3.731003039513678, "grad_norm": 0.5195131380448494, "learning_rate": 2.1204369184041115e-05, "loss": 0.1768, "loss_nan_ranks": 0, "loss_rank_avg": 0.21220675110816956, "step": 2455, "valid_targets_mean": 3935.9, "valid_targets_min": 608 }, { "epoch": 3.7386018237082066, "grad_norm": 0.4759365332843418, "learning_rate": 2.1128705919454488e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.21190626919269562, "step": 2460, "valid_targets_mean": 5204.1, "valid_targets_min": 776 }, { "epoch": 3.7462006079027357, "grad_norm": 0.44340296838544296, "learning_rate": 2.1053026445317534e-05, "loss": 0.1841, "loss_nan_ranks": 0, "loss_rank_avg": 0.16357441246509552, "step": 2465, "valid_targets_mean": 5137.4, "valid_targets_min": 531 }, { "epoch": 3.7537993920972643, "grad_norm": 0.602232408360396, "learning_rate": 2.09773318484769e-05, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.14004534482955933, "step": 2470, "valid_targets_mean": 4292.4, "valid_targets_min": 861 }, { "epoch": 3.7613981762917934, "grad_norm": 0.4860093104756001, "learning_rate": 2.0901623215996406e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.17179439961910248, "step": 2475, "valid_targets_mean": 4222.4, "valid_targets_min": 2111 }, { "epoch": 3.768996960486322, "grad_norm": 0.5345377630387919, "learning_rate": 2.082590163514146e-05, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.19142243266105652, "step": 2480, "valid_targets_mean": 3549.6, "valid_targets_min": 650 }, { "epoch": 3.776595744680851, "grad_norm": 0.5131611773395347, "learning_rate": 2.07501681933634e-05, "loss": 0.1842, "loss_nan_ranks": 0, "loss_rank_avg": 0.23167961835861206, "step": 2485, "valid_targets_mean": 4783.1, "valid_targets_min": 422 }, { "epoch": 3.78419452887538, "grad_norm": 0.43772278574910306, "learning_rate": 2.0674423978283924e-05, "loss": 0.1702, "loss_nan_ranks": 0, "loss_rank_avg": 0.159462109208107, "step": 2490, "valid_targets_mean": 4151.8, "valid_targets_min": 1045 }, { "epoch": 3.791793313069909, "grad_norm": 0.48634040579611115, "learning_rate": 2.059867007767943e-05, "loss": 0.1729, "loss_nan_ranks": 0, "loss_rank_avg": 0.1738453060388565, "step": 2495, "valid_targets_mean": 4146.1, "valid_targets_min": 314 }, { "epoch": 3.7993920972644375, "grad_norm": 0.45093092640477583, "learning_rate": 2.0522907579465413e-05, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.1663065254688263, "step": 2500, "valid_targets_mean": 3941.2, "valid_targets_min": 1010 }, { "epoch": 3.8069908814589666, "grad_norm": 0.50654438664862, "learning_rate": 2.0447137571680856e-05, "loss": 0.1978, "loss_nan_ranks": 0, "loss_rank_avg": 0.20836275815963745, "step": 2505, "valid_targets_mean": 4301.9, "valid_targets_min": 870 }, { "epoch": 3.8145896656534957, "grad_norm": 0.47213930537918863, "learning_rate": 2.037136114247257e-05, "loss": 0.1906, "loss_nan_ranks": 0, "loss_rank_avg": 0.19136860966682434, "step": 2510, "valid_targets_mean": 4427.4, "valid_targets_min": 571 }, { "epoch": 3.8221884498480243, "grad_norm": 0.6652881182583804, "learning_rate": 2.0295579380079596e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.16894681751728058, "step": 2515, "valid_targets_mean": 4250.4, "valid_targets_min": 473 }, { "epoch": 3.829787234042553, "grad_norm": 0.4220064998153064, "learning_rate": 2.0219793372817557e-05, "loss": 0.1764, "loss_nan_ranks": 0, "loss_rank_avg": 0.1527949720621109, "step": 2520, "valid_targets_mean": 4826.4, "valid_targets_min": 827 }, { "epoch": 3.837386018237082, "grad_norm": 0.43668863176276407, "learning_rate": 2.0144004209063042e-05, "loss": 0.176, "loss_nan_ranks": 0, "loss_rank_avg": 0.1740725338459015, "step": 2525, "valid_targets_mean": 4150.2, "valid_targets_min": 772 }, { "epoch": 3.844984802431611, "grad_norm": 0.3823174418425911, "learning_rate": 2.0068212977237983e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.14751499891281128, "step": 2530, "valid_targets_mean": 5399.6, "valid_targets_min": 2779 }, { "epoch": 3.8525835866261398, "grad_norm": 0.4587095534889756, "learning_rate": 1.999242076579398e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.19451266527175903, "step": 2535, "valid_targets_mean": 4256.1, "valid_targets_min": 743 }, { "epoch": 3.860182370820669, "grad_norm": 0.45169233975095224, "learning_rate": 1.9916628663196743e-05, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.17704080045223236, "step": 2540, "valid_targets_mean": 4775.8, "valid_targets_min": 2350 }, { "epoch": 3.8677811550151975, "grad_norm": 1.675127625058686, "learning_rate": 1.9840837757910383e-05, "loss": 0.1858, "loss_nan_ranks": 0, "loss_rank_avg": 0.1759578138589859, "step": 2545, "valid_targets_mean": 4113.9, "valid_targets_min": 720 }, { "epoch": 3.8753799392097266, "grad_norm": 0.43203621299681155, "learning_rate": 1.976504913838184e-05, "loss": 0.1811, "loss_nan_ranks": 0, "loss_rank_avg": 0.1715025007724762, "step": 2550, "valid_targets_mean": 5221.4, "valid_targets_min": 1839 }, { "epoch": 3.882978723404255, "grad_norm": 0.4384904057940854, "learning_rate": 1.968926389302521e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.16733646392822266, "step": 2555, "valid_targets_mean": 4565.3, "valid_targets_min": 609 }, { "epoch": 3.8905775075987843, "grad_norm": 0.4481617113710614, "learning_rate": 1.9613483110206154e-05, "loss": 0.1701, "loss_nan_ranks": 0, "loss_rank_avg": 0.17321643233299255, "step": 2560, "valid_targets_mean": 4512.8, "valid_targets_min": 895 }, { "epoch": 3.898176291793313, "grad_norm": 0.45819511671682567, "learning_rate": 1.9537707878226216e-05, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.17141106724739075, "step": 2565, "valid_targets_mean": 4315.5, "valid_targets_min": 440 }, { "epoch": 3.905775075987842, "grad_norm": 0.4764235545857351, "learning_rate": 1.9461939285307247e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.1686917096376419, "step": 2570, "valid_targets_mean": 3827.4, "valid_targets_min": 622 }, { "epoch": 3.9133738601823707, "grad_norm": 0.4437209902659711, "learning_rate": 1.9386178419575745e-05, "loss": 0.1714, "loss_nan_ranks": 0, "loss_rank_avg": 0.16246762871742249, "step": 2575, "valid_targets_mean": 4545.2, "valid_targets_min": 746 }, { "epoch": 3.9209726443768997, "grad_norm": 0.3844261379651969, "learning_rate": 1.931042636904724e-05, "loss": 0.1759, "loss_nan_ranks": 0, "loss_rank_avg": 0.17688338458538055, "step": 2580, "valid_targets_mean": 5911.6, "valid_targets_min": 3130 }, { "epoch": 3.928571428571429, "grad_norm": 0.4052859116056726, "learning_rate": 1.923468422161066e-05, "loss": 0.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.16950541734695435, "step": 2585, "valid_targets_mean": 5731.0, "valid_targets_min": 509 }, { "epoch": 3.9361702127659575, "grad_norm": 0.4236870787112286, "learning_rate": 1.9158953065012715e-05, "loss": 0.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.15792736411094666, "step": 2590, "valid_targets_mean": 5720.6, "valid_targets_min": 2293 }, { "epoch": 3.943768996960486, "grad_norm": 0.46365326810020263, "learning_rate": 1.9083233986842275e-05, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.17180944979190826, "step": 2595, "valid_targets_mean": 5083.0, "valid_targets_min": 711 }, { "epoch": 3.951367781155015, "grad_norm": 0.44863750873052993, "learning_rate": 1.900752807451475e-05, "loss": 0.1793, "loss_nan_ranks": 0, "loss_rank_avg": 0.16900160908699036, "step": 2600, "valid_targets_mean": 4392.1, "valid_targets_min": 810 }, { "epoch": 3.9589665653495443, "grad_norm": 0.462622398920299, "learning_rate": 1.8931836415256468e-05, "loss": 0.1788, "loss_nan_ranks": 0, "loss_rank_avg": 0.16800816357135773, "step": 2605, "valid_targets_mean": 4713.2, "valid_targets_min": 740 }, { "epoch": 3.966565349544073, "grad_norm": 0.46050975543187894, "learning_rate": 1.885616009608907e-05, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.14823880791664124, "step": 2610, "valid_targets_mean": 4082.6, "valid_targets_min": 401 }, { "epoch": 3.9741641337386016, "grad_norm": 0.46421973514436904, "learning_rate": 1.8780500203813902e-05, "loss": 0.1726, "loss_nan_ranks": 0, "loss_rank_avg": 0.18864090740680695, "step": 2615, "valid_targets_mean": 4411.6, "valid_targets_min": 655 }, { "epoch": 3.9817629179331306, "grad_norm": 0.4291031448782404, "learning_rate": 1.870485782499638e-05, "loss": 0.1723, "loss_nan_ranks": 0, "loss_rank_avg": 0.17856952548027039, "step": 2620, "valid_targets_mean": 4765.4, "valid_targets_min": 348 }, { "epoch": 3.9893617021276597, "grad_norm": 0.44985063891512206, "learning_rate": 1.8629234045950434e-05, "loss": 0.1904, "loss_nan_ranks": 0, "loss_rank_avg": 0.16248270869255066, "step": 2625, "valid_targets_mean": 4526.0, "valid_targets_min": 1027 }, { "epoch": 3.9969604863221884, "grad_norm": 0.4752973434947488, "learning_rate": 1.8553629952722853e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.17370517551898956, "step": 2630, "valid_targets_mean": 4128.8, "valid_targets_min": 843 }, { "epoch": 4.004559270516717, "grad_norm": 0.4277885641586408, "learning_rate": 1.8478046631077734e-05, "loss": 0.167, "loss_nan_ranks": 0, "loss_rank_avg": 0.1758805513381958, "step": 2635, "valid_targets_mean": 4960.5, "valid_targets_min": 647 }, { "epoch": 4.0121580547112465, "grad_norm": 0.4340489860844752, "learning_rate": 1.8402485166480854e-05, "loss": 0.1694, "loss_nan_ranks": 0, "loss_rank_avg": 0.1884659081697464, "step": 2640, "valid_targets_mean": 5273.1, "valid_targets_min": 787 }, { "epoch": 4.019756838905775, "grad_norm": 0.4325490917240746, "learning_rate": 1.8326946644084112e-05, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.1543048769235611, "step": 2645, "valid_targets_mean": 4604.4, "valid_targets_min": 547 }, { "epoch": 4.027355623100304, "grad_norm": 0.5514612078158647, "learning_rate": 1.8251432148709912e-05, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.1609114408493042, "step": 2650, "valid_targets_mean": 3597.3, "valid_targets_min": 695 }, { "epoch": 4.0349544072948325, "grad_norm": 0.43126338580266377, "learning_rate": 1.817594276483563e-05, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.18365256488323212, "step": 2655, "valid_targets_mean": 5326.8, "valid_targets_min": 666 }, { "epoch": 4.042553191489362, "grad_norm": 0.4737332570423805, "learning_rate": 1.8100479576577973e-05, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.17224054038524628, "step": 2660, "valid_targets_mean": 4818.4, "valid_targets_min": 918 }, { "epoch": 4.050151975683891, "grad_norm": 0.4438849641405412, "learning_rate": 1.8025043667677484e-05, "loss": 0.166, "loss_nan_ranks": 0, "loss_rank_avg": 0.1628122627735138, "step": 2665, "valid_targets_mean": 4852.9, "valid_targets_min": 1421 }, { "epoch": 4.057750759878419, "grad_norm": 0.5200587086302579, "learning_rate": 1.794963612148291e-05, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.1755530685186386, "step": 2670, "valid_targets_mean": 3932.9, "valid_targets_min": 844 }, { "epoch": 4.065349544072948, "grad_norm": 0.5142004311196928, "learning_rate": 1.7874258020935708e-05, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.16136983036994934, "step": 2675, "valid_targets_mean": 3818.9, "valid_targets_min": 758 }, { "epoch": 4.072948328267477, "grad_norm": 0.47669155432301397, "learning_rate": 1.7798910448554433e-05, "loss": 0.1749, "loss_nan_ranks": 0, "loss_rank_avg": 0.17607629299163818, "step": 2680, "valid_targets_mean": 4376.6, "valid_targets_min": 1368 }, { "epoch": 4.080547112462006, "grad_norm": 0.4655137661586852, "learning_rate": 1.7723594486419245e-05, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.15961049497127533, "step": 2685, "valid_targets_mean": 4512.1, "valid_targets_min": 1601 }, { "epoch": 4.088145896656535, "grad_norm": 0.7525257215139017, "learning_rate": 1.764831121615631e-05, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.21296311914920807, "step": 2690, "valid_targets_mean": 4298.8, "valid_targets_min": 756 }, { "epoch": 4.095744680851064, "grad_norm": 0.4433451433036404, "learning_rate": 1.7573061718922347e-05, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.16739048063755035, "step": 2695, "valid_targets_mean": 5009.2, "valid_targets_min": 853 }, { "epoch": 4.103343465045593, "grad_norm": 0.4830355618281073, "learning_rate": 1.7497847075389004e-05, "loss": 0.1621, "loss_nan_ranks": 0, "loss_rank_avg": 0.16623979806900024, "step": 2700, "valid_targets_mean": 4105.4, "valid_targets_min": 714 }, { "epoch": 4.1109422492401215, "grad_norm": 0.4179613714457159, "learning_rate": 1.7422668365727428e-05, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.16168740391731262, "step": 2705, "valid_targets_mean": 5317.4, "valid_targets_min": 1811 }, { "epoch": 4.11854103343465, "grad_norm": 0.5056361715181314, "learning_rate": 1.734752666959268e-05, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.16789555549621582, "step": 2710, "valid_targets_mean": 4172.6, "valid_targets_min": 666 }, { "epoch": 4.12613981762918, "grad_norm": 0.48722281404971973, "learning_rate": 1.7272423066108306e-05, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.17382162809371948, "step": 2715, "valid_targets_mean": 4376.5, "valid_targets_min": 263 }, { "epoch": 4.133738601823708, "grad_norm": 0.4790825604864442, "learning_rate": 1.7197358633850744e-05, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.16230902075767517, "step": 2720, "valid_targets_mean": 4323.8, "valid_targets_min": 370 }, { "epoch": 4.141337386018237, "grad_norm": 0.41425680904063444, "learning_rate": 1.7122334450833933e-05, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.18430155515670776, "step": 2725, "valid_targets_mean": 6086.1, "valid_targets_min": 567 }, { "epoch": 4.148936170212766, "grad_norm": 0.4752171364109056, "learning_rate": 1.7047351594493755e-05, "loss": 0.1739, "loss_nan_ranks": 0, "loss_rank_avg": 0.1950949728488922, "step": 2730, "valid_targets_mean": 5050.2, "valid_targets_min": 804 }, { "epoch": 4.156534954407295, "grad_norm": 0.4757519244575605, "learning_rate": 1.6972411141672614e-05, "loss": 0.1621, "loss_nan_ranks": 0, "loss_rank_avg": 0.1867167055606842, "step": 2735, "valid_targets_mean": 4470.1, "valid_targets_min": 828 }, { "epoch": 4.164133738601824, "grad_norm": 0.4513608069410081, "learning_rate": 1.6897514168603924e-05, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.1613789200782776, "step": 2740, "valid_targets_mean": 4477.4, "valid_targets_min": 742 }, { "epoch": 4.171732522796352, "grad_norm": 0.5141640145999388, "learning_rate": 1.6822661750896707e-05, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.19608411192893982, "step": 2745, "valid_targets_mean": 4257.2, "valid_targets_min": 892 }, { "epoch": 4.179331306990881, "grad_norm": 0.4724318719284284, "learning_rate": 1.67478549635201e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.1456223726272583, "step": 2750, "valid_targets_mean": 4336.9, "valid_targets_min": 541 }, { "epoch": 4.186930091185411, "grad_norm": 0.4970941462233452, "learning_rate": 1.6673094880787933e-05, "loss": 0.1661, "loss_nan_ranks": 0, "loss_rank_avg": 0.1658686399459839, "step": 2755, "valid_targets_mean": 4121.6, "valid_targets_min": 601 }, { "epoch": 4.194528875379939, "grad_norm": 0.5000186608612818, "learning_rate": 1.6598382576343312e-05, "loss": 0.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.16827929019927979, "step": 2760, "valid_targets_mean": 5388.8, "valid_targets_min": 1463 }, { "epoch": 4.202127659574468, "grad_norm": 0.4684433964610707, "learning_rate": 1.6523719123143186e-05, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.15693283081054688, "step": 2765, "valid_targets_mean": 4821.7, "valid_targets_min": 746 }, { "epoch": 4.2097264437689965, "grad_norm": 0.45967354792383214, "learning_rate": 1.6449105593442936e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.19241458177566528, "step": 2770, "valid_targets_mean": 4597.6, "valid_targets_min": 855 }, { "epoch": 4.217325227963526, "grad_norm": 0.4733160030781719, "learning_rate": 1.6374543058780998e-05, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.16462013125419617, "step": 2775, "valid_targets_mean": 4405.4, "valid_targets_min": 850 }, { "epoch": 4.224924012158055, "grad_norm": 0.4815352707164652, "learning_rate": 1.6300032589963436e-05, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.15910238027572632, "step": 2780, "valid_targets_mean": 4541.5, "valid_targets_min": 909 }, { "epoch": 4.232522796352583, "grad_norm": 0.47250106872988024, "learning_rate": 1.6225575257048622e-05, "loss": 0.1587, "loss_nan_ranks": 0, "loss_rank_avg": 0.1517636775970459, "step": 2785, "valid_targets_mean": 4741.7, "valid_targets_min": 1120 }, { "epoch": 4.240121580547113, "grad_norm": 1.1194758985013034, "learning_rate": 1.6151172129331786e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.16665083169937134, "step": 2790, "valid_targets_mean": 4795.9, "valid_targets_min": 567 }, { "epoch": 4.2477203647416415, "grad_norm": 0.5081276624925015, "learning_rate": 1.6076824275329758e-05, "loss": 0.1719, "loss_nan_ranks": 0, "loss_rank_avg": 0.16445952653884888, "step": 2795, "valid_targets_mean": 4864.7, "valid_targets_min": 1608 }, { "epoch": 4.25531914893617, "grad_norm": 0.48328270331504203, "learning_rate": 1.6002532762765524e-05, "loss": 0.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.17975090444087982, "step": 2800, "valid_targets_mean": 4240.7, "valid_targets_min": 616 }, { "epoch": 4.262917933130699, "grad_norm": 0.46912231409179, "learning_rate": 1.5928298658552988e-05, "loss": 0.169, "loss_nan_ranks": 0, "loss_rank_avg": 0.1919006109237671, "step": 2805, "valid_targets_mean": 5055.8, "valid_targets_min": 588 }, { "epoch": 4.270516717325228, "grad_norm": 0.6210976552983519, "learning_rate": 1.5854123028781557e-05, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.1582549810409546, "step": 2810, "valid_targets_mean": 3868.8, "valid_targets_min": 365 }, { "epoch": 4.278115501519757, "grad_norm": 0.4072288493810071, "learning_rate": 1.5780006938700917e-05, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.16181963682174683, "step": 2815, "valid_targets_mean": 5906.6, "valid_targets_min": 1016 }, { "epoch": 4.285714285714286, "grad_norm": 0.45582906884120683, "learning_rate": 1.5705951452705654e-05, "loss": 0.1661, "loss_nan_ranks": 0, "loss_rank_avg": 0.14693260192871094, "step": 2820, "valid_targets_mean": 4234.7, "valid_targets_min": 811 }, { "epoch": 4.293313069908814, "grad_norm": 0.5429695412336001, "learning_rate": 1.5631957634320048e-05, "loss": 0.1697, "loss_nan_ranks": 0, "loss_rank_avg": 0.1935248076915741, "step": 2825, "valid_targets_mean": 4832.9, "valid_targets_min": 774 }, { "epoch": 4.300911854103344, "grad_norm": 0.46340922363130344, "learning_rate": 1.555802654618272e-05, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.17274600267410278, "step": 2830, "valid_targets_mean": 5227.2, "valid_targets_min": 933 }, { "epoch": 4.308510638297872, "grad_norm": 0.8213856644150885, "learning_rate": 1.5484159250031445e-05, "loss": 0.1661, "loss_nan_ranks": 0, "loss_rank_avg": 0.17811016738414764, "step": 2835, "valid_targets_mean": 3817.1, "valid_targets_min": 692 }, { "epoch": 4.316109422492401, "grad_norm": 0.4391910613617335, "learning_rate": 1.541035680668785e-05, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.17826610803604126, "step": 2840, "valid_targets_mean": 5220.5, "valid_targets_min": 571 }, { "epoch": 4.32370820668693, "grad_norm": 0.5400136046572052, "learning_rate": 1.5336620276042193e-05, "loss": 0.1738, "loss_nan_ranks": 0, "loss_rank_avg": 0.17823699116706848, "step": 2845, "valid_targets_mean": 4212.0, "valid_targets_min": 156 }, { "epoch": 4.331306990881459, "grad_norm": 0.4689908498540122, "learning_rate": 1.526295071703817e-05, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.14596086740493774, "step": 2850, "valid_targets_mean": 4071.1, "valid_targets_min": 842 }, { "epoch": 4.338905775075988, "grad_norm": 0.43293471403933603, "learning_rate": 1.5189349187657665e-05, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.1921626329421997, "step": 2855, "valid_targets_mean": 5745.9, "valid_targets_min": 899 }, { "epoch": 4.3465045592705165, "grad_norm": 0.4470655930449328, "learning_rate": 1.5115816744905596e-05, "loss": 0.1616, "loss_nan_ranks": 0, "loss_rank_avg": 0.135872483253479, "step": 2860, "valid_targets_mean": 4759.4, "valid_targets_min": 872 }, { "epoch": 4.354103343465045, "grad_norm": 0.5712823358033652, "learning_rate": 1.504235444479469e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.20416559278964996, "step": 2865, "valid_targets_mean": 4337.3, "valid_targets_min": 361 }, { "epoch": 4.361702127659575, "grad_norm": 0.4182532739028534, "learning_rate": 1.4968963342330369e-05, "loss": 0.1715, "loss_nan_ranks": 0, "loss_rank_avg": 0.17232292890548706, "step": 2870, "valid_targets_mean": 5397.1, "valid_targets_min": 1864 }, { "epoch": 4.369300911854103, "grad_norm": 0.4274336280548651, "learning_rate": 1.4895644491495547e-05, "loss": 0.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.17278841137886047, "step": 2875, "valid_targets_mean": 5085.6, "valid_targets_min": 758 }, { "epoch": 4.376899696048632, "grad_norm": 0.4542314839910377, "learning_rate": 1.4822398945235545e-05, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.15121108293533325, "step": 2880, "valid_targets_mean": 4447.8, "valid_targets_min": 422 }, { "epoch": 4.3844984802431615, "grad_norm": 0.4154772615137915, "learning_rate": 1.4749227755442927e-05, "loss": 0.1761, "loss_nan_ranks": 0, "loss_rank_avg": 0.1821514070034027, "step": 2885, "valid_targets_mean": 5593.2, "valid_targets_min": 2877 }, { "epoch": 4.39209726443769, "grad_norm": 0.4559773456464244, "learning_rate": 1.4676131972942416e-05, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.16653896868228912, "step": 2890, "valid_targets_mean": 4738.8, "valid_targets_min": 920 }, { "epoch": 4.399696048632219, "grad_norm": 0.41739506385968844, "learning_rate": 1.4603112647475795e-05, "loss": 0.1681, "loss_nan_ranks": 0, "loss_rank_avg": 0.15362367033958435, "step": 2895, "valid_targets_mean": 5320.4, "valid_targets_min": 552 }, { "epoch": 4.407294832826747, "grad_norm": 0.3845071167642644, "learning_rate": 1.4530170827686831e-05, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.13495799899101257, "step": 2900, "valid_targets_mean": 5222.8, "valid_targets_min": 583 }, { "epoch": 4.414893617021277, "grad_norm": 0.44390729359629055, "learning_rate": 1.4457307561106226e-05, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.15813395380973816, "step": 2905, "valid_targets_mean": 4969.7, "valid_targets_min": 776 }, { "epoch": 4.422492401215806, "grad_norm": 0.5018673994147254, "learning_rate": 1.438452389413656e-05, "loss": 0.174, "loss_nan_ranks": 0, "loss_rank_avg": 0.15857061743736267, "step": 2910, "valid_targets_mean": 3932.9, "valid_targets_min": 633 }, { "epoch": 4.430091185410334, "grad_norm": 0.4806146977648294, "learning_rate": 1.4311820872037264e-05, "loss": 0.1684, "loss_nan_ranks": 0, "loss_rank_avg": 0.1731853187084198, "step": 2915, "valid_targets_mean": 4577.8, "valid_targets_min": 328 }, { "epoch": 4.437689969604863, "grad_norm": 0.4617241179372537, "learning_rate": 1.423919953890963e-05, "loss": 0.1666, "loss_nan_ranks": 0, "loss_rank_avg": 0.18794915080070496, "step": 2920, "valid_targets_mean": 5022.4, "valid_targets_min": 629 }, { "epoch": 4.445288753799392, "grad_norm": 0.48939540976668194, "learning_rate": 1.4166660937681771e-05, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.17850425839424133, "step": 2925, "valid_targets_mean": 4809.8, "valid_targets_min": 409 }, { "epoch": 4.452887537993921, "grad_norm": 0.4842928277510236, "learning_rate": 1.4094206110093712e-05, "loss": 0.1736, "loss_nan_ranks": 0, "loss_rank_avg": 0.1715683937072754, "step": 2930, "valid_targets_mean": 4601.0, "valid_targets_min": 1634 }, { "epoch": 4.46048632218845, "grad_norm": 0.4074913023031158, "learning_rate": 1.4021836096682343e-05, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.1516132950782776, "step": 2935, "valid_targets_mean": 5510.4, "valid_targets_min": 778 }, { "epoch": 4.468085106382979, "grad_norm": 0.42946649016106, "learning_rate": 1.394955193676657e-05, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.16095909476280212, "step": 2940, "valid_targets_mean": 5310.4, "valid_targets_min": 1020 }, { "epoch": 4.475683890577508, "grad_norm": 0.4385638298379317, "learning_rate": 1.3877354668432297e-05, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.15726953744888306, "step": 2945, "valid_targets_mean": 4561.4, "valid_targets_min": 590 }, { "epoch": 4.4832826747720365, "grad_norm": 0.5193379752723524, "learning_rate": 1.38052453285176e-05, "loss": 0.1845, "loss_nan_ranks": 0, "loss_rank_avg": 0.16541394591331482, "step": 2950, "valid_targets_mean": 3761.6, "valid_targets_min": 561 }, { "epoch": 4.490881458966565, "grad_norm": 0.4490166063535176, "learning_rate": 1.3733224952597764e-05, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.1475997269153595, "step": 2955, "valid_targets_mean": 4226.3, "valid_targets_min": 666 }, { "epoch": 4.498480243161095, "grad_norm": 0.5152090350550662, "learning_rate": 1.3661294574970485e-05, "loss": 0.1717, "loss_nan_ranks": 0, "loss_rank_avg": 0.18321773409843445, "step": 2960, "valid_targets_mean": 4961.2, "valid_targets_min": 602 }, { "epoch": 4.506079027355623, "grad_norm": 0.43396945945061266, "learning_rate": 1.3589455228640938e-05, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.17606866359710693, "step": 2965, "valid_targets_mean": 5181.6, "valid_targets_min": 1460 }, { "epoch": 4.513677811550152, "grad_norm": 0.4690277765034569, "learning_rate": 1.3517707945307013e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.18834683299064636, "step": 2970, "valid_targets_mean": 4646.1, "valid_targets_min": 953 }, { "epoch": 4.5212765957446805, "grad_norm": 0.5066167184858231, "learning_rate": 1.3446053755344439e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.15756574273109436, "step": 2975, "valid_targets_mean": 4516.5, "valid_targets_min": 844 }, { "epoch": 4.52887537993921, "grad_norm": 0.5134300889609936, "learning_rate": 1.3374493687792045e-05, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.19803106784820557, "step": 2980, "valid_targets_mean": 4092.7, "valid_targets_min": 719 }, { "epoch": 4.536474164133739, "grad_norm": 0.4463665768466012, "learning_rate": 1.3303028770336914e-05, "loss": 0.1685, "loss_nan_ranks": 0, "loss_rank_avg": 0.1606081873178482, "step": 2985, "valid_targets_mean": 4620.2, "valid_targets_min": 714 }, { "epoch": 4.544072948328267, "grad_norm": 0.4159202471735973, "learning_rate": 1.3231660029299703e-05, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.16770178079605103, "step": 2990, "valid_targets_mean": 5974.0, "valid_targets_min": 1221 }, { "epoch": 4.551671732522796, "grad_norm": 0.4174566017417907, "learning_rate": 1.316038848961982e-05, "loss": 0.1715, "loss_nan_ranks": 0, "loss_rank_avg": 0.16645801067352295, "step": 2995, "valid_targets_mean": 5945.2, "valid_targets_min": 1900 }, { "epoch": 4.5592705167173255, "grad_norm": 0.41700946512428255, "learning_rate": 1.3089215174840783e-05, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.15380007028579712, "step": 3000, "valid_targets_mean": 5489.1, "valid_targets_min": 894 }, { "epoch": 4.566869300911854, "grad_norm": 0.5304865164006446, "learning_rate": 1.3018141107095455e-05, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.16447263956069946, "step": 3005, "valid_targets_mean": 3494.4, "valid_targets_min": 491 }, { "epoch": 4.574468085106383, "grad_norm": 0.48520946915581575, "learning_rate": 1.2947167307091424e-05, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.15445218980312347, "step": 3010, "valid_targets_mean": 4516.8, "valid_targets_min": 664 }, { "epoch": 4.5820668693009114, "grad_norm": 0.47660891700948743, "learning_rate": 1.287629479409628e-05, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.15592724084854126, "step": 3015, "valid_targets_mean": 4057.2, "valid_targets_min": 905 }, { "epoch": 4.589665653495441, "grad_norm": 0.41867433836985307, "learning_rate": 1.2805524585923048e-05, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.1499272882938385, "step": 3020, "valid_targets_mean": 4869.1, "valid_targets_min": 501 }, { "epoch": 4.59726443768997, "grad_norm": 0.40048802671676303, "learning_rate": 1.2734857698915502e-05, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.13745658099651337, "step": 3025, "valid_targets_mean": 5079.4, "valid_targets_min": 1254 }, { "epoch": 4.604863221884498, "grad_norm": 0.4149531859078102, "learning_rate": 1.266429514793363e-05, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.15537427365779877, "step": 3030, "valid_targets_mean": 5211.1, "valid_targets_min": 861 }, { "epoch": 4.612462006079028, "grad_norm": 0.6490039513363777, "learning_rate": 1.2593837946339008e-05, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.18460866808891296, "step": 3035, "valid_targets_mean": 4625.2, "valid_targets_min": 918 }, { "epoch": 4.620060790273556, "grad_norm": 0.4992835453594247, "learning_rate": 1.252348710598029e-05, "loss": 0.1736, "loss_nan_ranks": 0, "loss_rank_avg": 0.167076975107193, "step": 3040, "valid_targets_mean": 4100.6, "valid_targets_min": 432 }, { "epoch": 4.627659574468085, "grad_norm": 0.4615786144106656, "learning_rate": 1.245324363717864e-05, "loss": 0.169, "loss_nan_ranks": 0, "loss_rank_avg": 0.16426023840904236, "step": 3045, "valid_targets_mean": 4565.8, "valid_targets_min": 828 }, { "epoch": 4.635258358662614, "grad_norm": 0.41965629757500533, "learning_rate": 1.2383108548713254e-05, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.1467415690422058, "step": 3050, "valid_targets_mean": 5088.9, "valid_targets_min": 1159 }, { "epoch": 4.642857142857143, "grad_norm": 0.4441828730212559, "learning_rate": 1.2313082847806852e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.1823854148387909, "step": 3055, "valid_targets_mean": 4715.0, "valid_targets_min": 741 }, { "epoch": 4.650455927051672, "grad_norm": 0.459237281832204, "learning_rate": 1.2243167540111216e-05, "loss": 0.1831, "loss_nan_ranks": 0, "loss_rank_avg": 0.14467957615852356, "step": 3060, "valid_targets_mean": 3859.3, "valid_targets_min": 673 }, { "epoch": 4.6580547112462005, "grad_norm": 0.4946697227727552, "learning_rate": 1.2173363629692756e-05, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.19268517196178436, "step": 3065, "valid_targets_mean": 3953.9, "valid_targets_min": 931 }, { "epoch": 4.665653495440729, "grad_norm": 0.43385480300907053, "learning_rate": 1.2103672119018086e-05, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.15391963720321655, "step": 3070, "valid_targets_mean": 4950.1, "valid_targets_min": 1644 }, { "epoch": 4.673252279635259, "grad_norm": 0.47954284812840575, "learning_rate": 1.2034094008939624e-05, "loss": 0.1781, "loss_nan_ranks": 0, "loss_rank_avg": 0.19548840820789337, "step": 3075, "valid_targets_mean": 5021.8, "valid_targets_min": 774 }, { "epoch": 4.680851063829787, "grad_norm": 0.4636621474235311, "learning_rate": 1.1964630298681221e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.14948098361492157, "step": 3080, "valid_targets_mean": 3846.4, "valid_targets_min": 940 }, { "epoch": 4.688449848024316, "grad_norm": 1.0079316283200346, "learning_rate": 1.1895281985823815e-05, "loss": 0.1756, "loss_nan_ranks": 0, "loss_rank_avg": 0.1952032595872879, "step": 3085, "valid_targets_mean": 3557.1, "valid_targets_min": 570 }, { "epoch": 4.696048632218845, "grad_norm": 0.4689910480215768, "learning_rate": 1.1826050066291097e-05, "loss": 0.1685, "loss_nan_ranks": 0, "loss_rank_avg": 0.16652071475982666, "step": 3090, "valid_targets_mean": 4480.4, "valid_targets_min": 728 }, { "epoch": 4.703647416413374, "grad_norm": 0.451296162182404, "learning_rate": 1.1756935534335212e-05, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.13410750031471252, "step": 3095, "valid_targets_mean": 4405.3, "valid_targets_min": 1325 }, { "epoch": 4.711246200607903, "grad_norm": 0.42448672661829445, "learning_rate": 1.1687939382522493e-05, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.1605660319328308, "step": 3100, "valid_targets_mean": 4885.4, "valid_targets_min": 1135 }, { "epoch": 4.718844984802431, "grad_norm": 0.4707749031713044, "learning_rate": 1.1619062601719171e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.1604931652545929, "step": 3105, "valid_targets_mean": 4170.2, "valid_targets_min": 857 }, { "epoch": 4.72644376899696, "grad_norm": 0.4670653605297488, "learning_rate": 1.15503061810772e-05, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.16604188084602356, "step": 3110, "valid_targets_mean": 5626.7, "valid_targets_min": 414 }, { "epoch": 4.73404255319149, "grad_norm": 0.4609235488117921, "learning_rate": 1.1481671108019984e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.23836404085159302, "step": 3115, "valid_targets_mean": 5899.8, "valid_targets_min": 543 }, { "epoch": 4.741641337386018, "grad_norm": 0.46042215360634425, "learning_rate": 1.1413158368228249e-05, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.163685142993927, "step": 3120, "valid_targets_mean": 4402.4, "valid_targets_min": 512 }, { "epoch": 4.749240121580547, "grad_norm": 0.5338506865095787, "learning_rate": 1.1344768945625884e-05, "loss": 0.1723, "loss_nan_ranks": 0, "loss_rank_avg": 0.1888251006603241, "step": 3125, "valid_targets_mean": 4155.4, "valid_targets_min": 537 }, { "epoch": 4.756838905775076, "grad_norm": 0.40137648604950027, "learning_rate": 1.127650382236578e-05, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.14810852706432343, "step": 3130, "valid_targets_mean": 5314.3, "valid_targets_min": 354 }, { "epoch": 4.764437689969605, "grad_norm": 0.5240009462617735, "learning_rate": 1.1208363978815746e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.18549123406410217, "step": 3135, "valid_targets_mean": 4340.2, "valid_targets_min": 593 }, { "epoch": 4.772036474164134, "grad_norm": 0.43622202592017323, "learning_rate": 1.1140350393544422e-05, "loss": 0.1593, "loss_nan_ranks": 0, "loss_rank_avg": 0.15057966113090515, "step": 3140, "valid_targets_mean": 4826.1, "valid_targets_min": 794 }, { "epoch": 4.779635258358662, "grad_norm": 0.46748847050986225, "learning_rate": 1.1072464043307259e-05, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.20890364050865173, "step": 3145, "valid_targets_mean": 4810.9, "valid_targets_min": 434 }, { "epoch": 4.787234042553192, "grad_norm": 0.4709284580160048, "learning_rate": 1.1004705903032406e-05, "loss": 0.1661, "loss_nan_ranks": 0, "loss_rank_avg": 0.17572824656963348, "step": 3150, "valid_targets_mean": 4275.6, "valid_targets_min": 787 }, { "epoch": 4.7948328267477205, "grad_norm": 0.4947193520586711, "learning_rate": 1.0937076945806837e-05, "loss": 0.1567, "loss_nan_ranks": 0, "loss_rank_avg": 0.1653721183538437, "step": 3155, "valid_targets_mean": 3996.0, "valid_targets_min": 608 }, { "epoch": 4.802431610942249, "grad_norm": 0.95424384071522, "learning_rate": 1.0869578142862228e-05, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.15056976675987244, "step": 3160, "valid_targets_mean": 5264.1, "valid_targets_min": 911 }, { "epoch": 4.810030395136778, "grad_norm": 0.436658942790459, "learning_rate": 1.0802210463561166e-05, "loss": 0.1709, "loss_nan_ranks": 0, "loss_rank_avg": 0.15242451429367065, "step": 3165, "valid_targets_mean": 4430.6, "valid_targets_min": 1307 }, { "epoch": 4.817629179331307, "grad_norm": 0.4940935042193495, "learning_rate": 1.0734974875383066e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.15941178798675537, "step": 3170, "valid_targets_mean": 3658.3, "valid_targets_min": 640 }, { "epoch": 4.825227963525836, "grad_norm": 0.5857976461421992, "learning_rate": 1.0667872343910432e-05, "loss": 0.1681, "loss_nan_ranks": 0, "loss_rank_avg": 0.16998814046382904, "step": 3175, "valid_targets_mean": 4214.1, "valid_targets_min": 619 }, { "epoch": 4.832826747720365, "grad_norm": 0.447470023536544, "learning_rate": 1.0600903832814856e-05, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.16528019309043884, "step": 3180, "valid_targets_mean": 4406.2, "valid_targets_min": 774 }, { "epoch": 4.840425531914894, "grad_norm": 0.45582176893752013, "learning_rate": 1.0534070303843294e-05, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.16366976499557495, "step": 3185, "valid_targets_mean": 4874.4, "valid_targets_min": 531 }, { "epoch": 4.848024316109423, "grad_norm": 0.491211928315914, "learning_rate": 1.0467372716804141e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.18734398484230042, "step": 3190, "valid_targets_mean": 4573.7, "valid_targets_min": 655 }, { "epoch": 4.855623100303951, "grad_norm": 0.5889214979063572, "learning_rate": 1.0400812029553569e-05, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.18033604323863983, "step": 3195, "valid_targets_mean": 3925.6, "valid_targets_min": 545 }, { "epoch": 4.86322188449848, "grad_norm": 0.4334778399672226, "learning_rate": 1.0334389197981638e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.14970465004444122, "step": 3200, "valid_targets_mean": 4557.2, "valid_targets_min": 736 }, { "epoch": 4.870820668693009, "grad_norm": 0.5178203832731765, "learning_rate": 1.0268105175998713e-05, "loss": 0.1667, "loss_nan_ranks": 0, "loss_rank_avg": 0.16531500220298767, "step": 3205, "valid_targets_mean": 3934.7, "valid_targets_min": 616 }, { "epoch": 4.878419452887538, "grad_norm": 0.4677336984690735, "learning_rate": 1.0201960915521614e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.15597450733184814, "step": 3210, "valid_targets_mean": 4830.2, "valid_targets_min": 631 }, { "epoch": 4.886018237082067, "grad_norm": 0.4582200792232965, "learning_rate": 1.0135957366460087e-05, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.14683008193969727, "step": 3215, "valid_targets_mean": 4210.8, "valid_targets_min": 1151 }, { "epoch": 4.8936170212765955, "grad_norm": 2.6017818537468114, "learning_rate": 1.0070095476703036e-05, "loss": 0.1694, "loss_nan_ranks": 0, "loss_rank_avg": 0.17961879074573517, "step": 3220, "valid_targets_mean": 4255.6, "valid_targets_min": 544 }, { "epoch": 4.901215805471125, "grad_norm": 0.48429935318886524, "learning_rate": 1.0004376192105032e-05, "loss": 0.1751, "loss_nan_ranks": 0, "loss_rank_avg": 0.1917518824338913, "step": 3225, "valid_targets_mean": 4164.9, "valid_targets_min": 683 }, { "epoch": 4.908814589665654, "grad_norm": 0.408755975822661, "learning_rate": 9.938800456472603e-06, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.15598323941230774, "step": 3230, "valid_targets_mean": 5235.6, "valid_targets_min": 673 }, { "epoch": 4.916413373860182, "grad_norm": 0.5687286004991109, "learning_rate": 9.87336921155081e-06, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.1737002432346344, "step": 3235, "valid_targets_mean": 4874.2, "valid_targets_min": 648 }, { "epoch": 4.924012158054711, "grad_norm": 0.4449749826597429, "learning_rate": 9.80808339700959e-06, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.18869557976722717, "step": 3240, "valid_targets_mean": 5077.7, "valid_targets_min": 778 }, { "epoch": 4.9316109422492405, "grad_norm": 0.43592967879817196, "learning_rate": 9.74294395043039e-06, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.16350185871124268, "step": 3245, "valid_targets_mean": 4365.2, "valid_targets_min": 579 }, { "epoch": 4.939209726443769, "grad_norm": 0.44671726836927617, "learning_rate": 9.677951807292584e-06, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.1710178405046463, "step": 3250, "valid_targets_mean": 4973.2, "valid_targets_min": 456 }, { "epoch": 4.946808510638298, "grad_norm": 0.4273982901555888, "learning_rate": 9.61310790096015e-06, "loss": 0.1588, "loss_nan_ranks": 0, "loss_rank_avg": 0.13666585087776184, "step": 3255, "valid_targets_mean": 4339.3, "valid_targets_min": 970 }, { "epoch": 4.954407294832826, "grad_norm": 0.4111092281316594, "learning_rate": 9.548413162668155e-06, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.13993242383003235, "step": 3260, "valid_targets_mean": 5151.4, "valid_targets_min": 1606 }, { "epoch": 4.962006079027356, "grad_norm": 0.4678973949276577, "learning_rate": 9.483868521509492e-06, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.17497044801712036, "step": 3265, "valid_targets_mean": 4569.8, "valid_targets_min": 507 }, { "epoch": 4.9696048632218845, "grad_norm": 0.48923608505182986, "learning_rate": 9.419474904421422e-06, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.17405647039413452, "step": 3270, "valid_targets_mean": 4378.5, "valid_targets_min": 646 }, { "epoch": 4.977203647416413, "grad_norm": 0.42080134203036884, "learning_rate": 9.355233236172381e-06, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.14896854758262634, "step": 3275, "valid_targets_mean": 4978.7, "valid_targets_min": 1936 }, { "epoch": 4.984802431610943, "grad_norm": 0.45247817713087146, "learning_rate": 9.2911444393486e-06, "loss": 0.1697, "loss_nan_ranks": 0, "loss_rank_avg": 0.14354351162910461, "step": 3280, "valid_targets_mean": 5089.9, "valid_targets_min": 754 }, { "epoch": 4.992401215805471, "grad_norm": 0.4892191547497894, "learning_rate": 9.227209434340914e-06, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.1533418595790863, "step": 3285, "valid_targets_mean": 4154.1, "valid_targets_min": 434 }, { "epoch": 5.0, "grad_norm": 0.4367103289579237, "learning_rate": 9.163429139331516e-06, "loss": 0.1656, "loss_nan_ranks": 0, "loss_rank_avg": 0.1589938849210739, "step": 3290, "valid_targets_mean": 4928.7, "valid_targets_min": 567 }, { "epoch": 5.007598784194529, "grad_norm": 0.5506166462705645, "learning_rate": 9.099804470280791e-06, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.1861366331577301, "step": 3295, "valid_targets_mean": 3553.4, "valid_targets_min": 519 }, { "epoch": 5.015197568389058, "grad_norm": 0.44365514163643444, "learning_rate": 9.036336340914138e-06, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.18212465941905975, "step": 3300, "valid_targets_mean": 4840.4, "valid_targets_min": 465 }, { "epoch": 5.022796352583587, "grad_norm": 0.5002686598117616, "learning_rate": 8.973025662708875e-06, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.16633297502994537, "step": 3305, "valid_targets_mean": 5309.5, "valid_targets_min": 834 }, { "epoch": 5.0303951367781155, "grad_norm": 0.5141187748402867, "learning_rate": 8.909873344881125e-06, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.1726076900959015, "step": 3310, "valid_targets_mean": 4149.5, "valid_targets_min": 1217 }, { "epoch": 5.037993920972644, "grad_norm": 0.42838999609845296, "learning_rate": 8.846880294372777e-06, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.1435108482837677, "step": 3315, "valid_targets_mean": 5703.1, "valid_targets_min": 781 }, { "epoch": 5.045592705167174, "grad_norm": 0.4990807265797361, "learning_rate": 8.784047415838446e-06, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.15767478942871094, "step": 3320, "valid_targets_mean": 4732.1, "valid_targets_min": 998 }, { "epoch": 5.053191489361702, "grad_norm": 0.4244905713932716, "learning_rate": 8.721375611632494e-06, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.15482358634471893, "step": 3325, "valid_targets_mean": 5283.4, "valid_targets_min": 977 }, { "epoch": 5.060790273556231, "grad_norm": 0.5268949634896493, "learning_rate": 8.658865781796059e-06, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.16202573478221893, "step": 3330, "valid_targets_mean": 4009.4, "valid_targets_min": 736 }, { "epoch": 5.0683890577507595, "grad_norm": 0.5222959380611226, "learning_rate": 8.596518824044145e-06, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.1700512319803238, "step": 3335, "valid_targets_mean": 4815.2, "valid_targets_min": 1896 }, { "epoch": 5.075987841945289, "grad_norm": 0.48817810574292153, "learning_rate": 8.53433563375271e-06, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.15692004561424255, "step": 3340, "valid_targets_mean": 5081.4, "valid_targets_min": 604 }, { "epoch": 5.083586626139818, "grad_norm": 0.5145519787891805, "learning_rate": 8.472317103945827e-06, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.15433713793754578, "step": 3345, "valid_targets_mean": 4923.5, "valid_targets_min": 664 }, { "epoch": 5.091185410334346, "grad_norm": 0.49860669438741656, "learning_rate": 8.410464125282842e-06, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.18030579388141632, "step": 3350, "valid_targets_mean": 4054.4, "valid_targets_min": 849 }, { "epoch": 5.098784194528875, "grad_norm": 0.4977104637629043, "learning_rate": 8.348777586045599e-06, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.16232091188430786, "step": 3355, "valid_targets_mean": 4112.1, "valid_targets_min": 342 }, { "epoch": 5.1063829787234045, "grad_norm": 0.40792452628529047, "learning_rate": 8.287258372125666e-06, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.14980870485305786, "step": 3360, "valid_targets_mean": 5441.6, "valid_targets_min": 828 }, { "epoch": 5.113981762917933, "grad_norm": 0.48624828153735117, "learning_rate": 8.22590736701163e-06, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.15524911880493164, "step": 3365, "valid_targets_mean": 4029.7, "valid_targets_min": 527 }, { "epoch": 5.121580547112462, "grad_norm": 0.41260477481757823, "learning_rate": 8.164725451776396e-06, "loss": 0.139, "loss_nan_ranks": 0, "loss_rank_avg": 0.11952009797096252, "step": 3370, "valid_targets_mean": 5127.4, "valid_targets_min": 1259 }, { "epoch": 5.129179331306991, "grad_norm": 0.5121037283737604, "learning_rate": 8.103713505064542e-06, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.13970546424388885, "step": 3375, "valid_targets_mean": 5086.4, "valid_targets_min": 447 }, { "epoch": 5.13677811550152, "grad_norm": 0.554785879889902, "learning_rate": 8.042872403079695e-06, "loss": 0.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.17848604917526245, "step": 3380, "valid_targets_mean": 4835.1, "valid_targets_min": 229 }, { "epoch": 5.144376899696049, "grad_norm": 0.4543169082658653, "learning_rate": 7.982203019571951e-06, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.15885761380195618, "step": 3385, "valid_targets_mean": 4715.2, "valid_targets_min": 614 }, { "epoch": 5.151975683890577, "grad_norm": 0.49519076224489234, "learning_rate": 7.921706225825323e-06, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.14728990197181702, "step": 3390, "valid_targets_mean": 4132.9, "valid_targets_min": 705 }, { "epoch": 5.159574468085107, "grad_norm": 0.4692483655123735, "learning_rate": 7.861382890645235e-06, "loss": 0.1666, "loss_nan_ranks": 0, "loss_rank_avg": 0.1677330732345581, "step": 3395, "valid_targets_mean": 4542.6, "valid_targets_min": 571 }, { "epoch": 5.167173252279635, "grad_norm": 0.4981198573213941, "learning_rate": 7.801233880346044e-06, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.152068629860878, "step": 3400, "valid_targets_mean": 4878.0, "valid_targets_min": 1568 }, { "epoch": 5.174772036474164, "grad_norm": 0.496973792548942, "learning_rate": 7.741260058738576e-06, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.1845749020576477, "step": 3405, "valid_targets_mean": 4564.4, "valid_targets_min": 333 }, { "epoch": 5.182370820668693, "grad_norm": 0.4801400629594902, "learning_rate": 7.681462287117769e-06, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.15920531749725342, "step": 3410, "valid_targets_mean": 4416.2, "valid_targets_min": 618 }, { "epoch": 5.189969604863222, "grad_norm": 0.44717438624237565, "learning_rate": 7.62184142425026e-06, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.14159642159938812, "step": 3415, "valid_targets_mean": 5296.9, "valid_targets_min": 1679 }, { "epoch": 5.197568389057751, "grad_norm": 0.5694531326181947, "learning_rate": 7.562398326362068e-06, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.1987701654434204, "step": 3420, "valid_targets_mean": 4228.2, "valid_targets_min": 500 }, { "epoch": 5.2051671732522795, "grad_norm": 0.4837511107077152, "learning_rate": 7.503133847126298e-06, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.14547014236450195, "step": 3425, "valid_targets_mean": 4541.6, "valid_targets_min": 537 }, { "epoch": 5.212765957446808, "grad_norm": 0.46751291957082003, "learning_rate": 7.444048837650879e-06, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.1482163369655609, "step": 3430, "valid_targets_mean": 4358.3, "valid_targets_min": 464 }, { "epoch": 5.220364741641338, "grad_norm": 0.48046465195883326, "learning_rate": 7.3851441464663455e-06, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.15912845730781555, "step": 3435, "valid_targets_mean": 4258.4, "valid_targets_min": 1734 }, { "epoch": 5.227963525835866, "grad_norm": 0.5201595463216373, "learning_rate": 7.326420619513645e-06, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.14452405273914337, "step": 3440, "valid_targets_mean": 4945.8, "valid_targets_min": 2273 }, { "epoch": 5.235562310030395, "grad_norm": 0.4662188330800987, "learning_rate": 7.267879100131996e-06, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.16573692858219147, "step": 3445, "valid_targets_mean": 5350.9, "valid_targets_min": 1272 }, { "epoch": 5.243161094224924, "grad_norm": 0.5445679437490333, "learning_rate": 7.209520429046768e-06, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.14232224225997925, "step": 3450, "valid_targets_mean": 3531.5, "valid_targets_min": 756 }, { "epoch": 5.250759878419453, "grad_norm": 0.48341944333718034, "learning_rate": 7.151345444357418e-06, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.15717411041259766, "step": 3455, "valid_targets_mean": 4357.9, "valid_targets_min": 410 }, { "epoch": 5.258358662613982, "grad_norm": 0.46774893892784875, "learning_rate": 7.0933549815254465e-06, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.16652044653892517, "step": 3460, "valid_targets_mean": 5190.8, "valid_targets_min": 433 }, { "epoch": 5.26595744680851, "grad_norm": 0.47602862093431514, "learning_rate": 7.035549873362406e-06, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.14074617624282837, "step": 3465, "valid_targets_mean": 4641.2, "valid_targets_min": 1537 }, { "epoch": 5.27355623100304, "grad_norm": 0.49943887077257887, "learning_rate": 6.97793095001793e-06, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.15125201642513275, "step": 3470, "valid_targets_mean": 4864.9, "valid_targets_min": 754 }, { "epoch": 5.281155015197569, "grad_norm": 0.56912423597624, "learning_rate": 6.920499038967825e-06, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.1387101113796234, "step": 3475, "valid_targets_mean": 4497.3, "valid_targets_min": 780 }, { "epoch": 5.288753799392097, "grad_norm": 0.6031298612179781, "learning_rate": 6.863254965002178e-06, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.17738491296768188, "step": 3480, "valid_targets_mean": 2821.3, "valid_targets_min": 271 }, { "epoch": 5.296352583586626, "grad_norm": 0.42528213654923797, "learning_rate": 6.80619955021351e-06, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.13962329924106598, "step": 3485, "valid_targets_mean": 5226.1, "valid_targets_min": 1805 }, { "epoch": 5.303951367781155, "grad_norm": 0.4641682316415047, "learning_rate": 6.749333613984979e-06, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.17883500456809998, "step": 3490, "valid_targets_mean": 5505.0, "valid_targets_min": 2227 }, { "epoch": 5.311550151975684, "grad_norm": 0.41287597531580333, "learning_rate": 6.6926579729786025e-06, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.13076046109199524, "step": 3495, "valid_targets_mean": 5253.1, "valid_targets_min": 624 }, { "epoch": 5.319148936170213, "grad_norm": 0.47804228992277803, "learning_rate": 6.636173441123537e-06, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.13578727841377258, "step": 3500, "valid_targets_mean": 4141.2, "valid_targets_min": 974 }, { "epoch": 5.326747720364741, "grad_norm": 0.6043580771376642, "learning_rate": 6.5798808296043835e-06, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.1580887734889984, "step": 3505, "valid_targets_mean": 3810.6, "valid_targets_min": 769 }, { "epoch": 5.334346504559271, "grad_norm": 0.5078101575478104, "learning_rate": 6.52378094684954e-06, "loss": 0.1674, "loss_nan_ranks": 0, "loss_rank_avg": 0.17107361555099487, "step": 3510, "valid_targets_mean": 3934.2, "valid_targets_min": 280 }, { "epoch": 5.3419452887537995, "grad_norm": 0.4141414829732433, "learning_rate": 6.467874598519597e-06, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.14241334795951843, "step": 3515, "valid_targets_mean": 5362.5, "valid_targets_min": 2329 }, { "epoch": 5.349544072948328, "grad_norm": 0.4458140032344141, "learning_rate": 6.412162587495754e-06, "loss": 0.1719, "loss_nan_ranks": 0, "loss_rank_avg": 0.13986560702323914, "step": 3520, "valid_targets_mean": 4640.0, "valid_targets_min": 593 }, { "epoch": 5.357142857142857, "grad_norm": 0.49980298962190683, "learning_rate": 6.3566457138683015e-06, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.1622404009103775, "step": 3525, "valid_targets_mean": 4144.8, "valid_targets_min": 523 }, { "epoch": 5.364741641337386, "grad_norm": 0.5309190846014655, "learning_rate": 6.301324774925128e-06, "loss": 0.1449, "loss_nan_ranks": 0, "loss_rank_avg": 0.1419864147901535, "step": 3530, "valid_targets_mean": 4773.5, "valid_targets_min": 601 }, { "epoch": 5.372340425531915, "grad_norm": 0.4394509557877868, "learning_rate": 6.246200565140266e-06, "loss": 0.1382, "loss_nan_ranks": 0, "loss_rank_avg": 0.1346133053302765, "step": 3535, "valid_targets_mean": 5314.5, "valid_targets_min": 1831 }, { "epoch": 5.379939209726444, "grad_norm": 0.6157551616826415, "learning_rate": 6.191273876162487e-06, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.16742759943008423, "step": 3540, "valid_targets_mean": 4461.9, "valid_targets_min": 632 }, { "epoch": 5.387537993920972, "grad_norm": 0.5207893779334158, "learning_rate": 6.136545496803925e-06, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.173904150724411, "step": 3545, "valid_targets_mean": 4806.9, "valid_targets_min": 816 }, { "epoch": 5.395136778115502, "grad_norm": 0.41444365615563894, "learning_rate": 6.082016213028761e-06, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.14027008414268494, "step": 3550, "valid_targets_mean": 5664.4, "valid_targets_min": 840 }, { "epoch": 5.40273556231003, "grad_norm": 0.4453222293778615, "learning_rate": 6.0276868079419235e-06, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.1503615528345108, "step": 3555, "valid_targets_mean": 5143.4, "valid_targets_min": 979 }, { "epoch": 5.410334346504559, "grad_norm": 0.4781236892192554, "learning_rate": 5.973558061777849e-06, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.15819337964057922, "step": 3560, "valid_targets_mean": 5053.2, "valid_targets_min": 664 }, { "epoch": 5.4179331306990886, "grad_norm": 0.41198950921824895, "learning_rate": 5.919630751889274e-06, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.13387863337993622, "step": 3565, "valid_targets_mean": 5390.4, "valid_targets_min": 1116 }, { "epoch": 5.425531914893617, "grad_norm": 0.516010838368697, "learning_rate": 5.865905652736072e-06, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.17436817288398743, "step": 3570, "valid_targets_mean": 4064.7, "valid_targets_min": 894 }, { "epoch": 5.433130699088146, "grad_norm": 0.5141562761832758, "learning_rate": 5.812383535874131e-06, "loss": 0.1428, "loss_nan_ranks": 0, "loss_rank_avg": 0.13484925031661987, "step": 3575, "valid_targets_mean": 3949.4, "valid_targets_min": 1312 }, { "epoch": 5.4407294832826745, "grad_norm": 0.45662210514471807, "learning_rate": 5.759065169944274e-06, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.1350744068622589, "step": 3580, "valid_targets_mean": 4565.4, "valid_targets_min": 381 }, { "epoch": 5.448328267477204, "grad_norm": 0.49698187827992, "learning_rate": 5.705951320661222e-06, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.14174014329910278, "step": 3585, "valid_targets_mean": 4722.2, "valid_targets_min": 2183 }, { "epoch": 5.455927051671733, "grad_norm": 0.45234338868163015, "learning_rate": 5.653042750802591e-06, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.14616911113262177, "step": 3590, "valid_targets_mean": 4943.4, "valid_targets_min": 1261 }, { "epoch": 5.463525835866261, "grad_norm": 0.4806481881918089, "learning_rate": 5.600340220197946e-06, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.17162683606147766, "step": 3595, "valid_targets_mean": 4331.8, "valid_targets_min": 414 }, { "epoch": 5.47112462006079, "grad_norm": 0.46035606110531224, "learning_rate": 5.547844485717884e-06, "loss": 0.1479, "loss_nan_ranks": 0, "loss_rank_avg": 0.14485681056976318, "step": 3600, "valid_targets_mean": 4167.1, "valid_targets_min": 1119 }, { "epoch": 5.4787234042553195, "grad_norm": 0.4684818904402137, "learning_rate": 5.4955563012631606e-06, "loss": 0.1449, "loss_nan_ranks": 0, "loss_rank_avg": 0.14429020881652832, "step": 3605, "valid_targets_mean": 5013.6, "valid_targets_min": 1788 }, { "epoch": 5.486322188449848, "grad_norm": 0.6076128140539062, "learning_rate": 5.443476417753877e-06, "loss": 0.1681, "loss_nan_ranks": 0, "loss_rank_avg": 0.17048346996307373, "step": 3610, "valid_targets_mean": 2878.3, "valid_targets_min": 491 }, { "epoch": 5.493920972644377, "grad_norm": 0.46825002881973943, "learning_rate": 5.39160558311868e-06, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.17676037549972534, "step": 3615, "valid_targets_mean": 4354.2, "valid_targets_min": 646 }, { "epoch": 5.501519756838906, "grad_norm": 0.49007855328228217, "learning_rate": 5.33994454228403e-06, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.17580349743366241, "step": 3620, "valid_targets_mean": 5169.6, "valid_targets_min": 953 }, { "epoch": 5.509118541033435, "grad_norm": 0.44768382223068853, "learning_rate": 5.2884940371634915e-06, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.14162276685237885, "step": 3625, "valid_targets_mean": 5179.9, "valid_targets_min": 1051 }, { "epoch": 5.5167173252279635, "grad_norm": 0.4352121315996926, "learning_rate": 5.237254806647117e-06, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.1292266994714737, "step": 3630, "valid_targets_mean": 4936.1, "valid_targets_min": 912 }, { "epoch": 5.524316109422492, "grad_norm": 0.5433474427694438, "learning_rate": 5.1862275865907575e-06, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.1526874601840973, "step": 3635, "valid_targets_mean": 3939.9, "valid_targets_min": 1082 }, { "epoch": 5.531914893617021, "grad_norm": 0.4664875248042157, "learning_rate": 5.135413109805596e-06, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.14586284756660461, "step": 3640, "valid_targets_mean": 4819.6, "valid_targets_min": 1708 }, { "epoch": 5.53951367781155, "grad_norm": 0.4479408250207293, "learning_rate": 5.084812106047525e-06, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.13202941417694092, "step": 3645, "valid_targets_mean": 5479.3, "valid_targets_min": 1475 }, { "epoch": 5.547112462006079, "grad_norm": 0.46875681135292097, "learning_rate": 5.034425302006751e-06, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.15239191055297852, "step": 3650, "valid_targets_mean": 4168.7, "valid_targets_min": 534 }, { "epoch": 5.554711246200608, "grad_norm": 0.5099225903083285, "learning_rate": 4.984253421297285e-06, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.15130409598350525, "step": 3655, "valid_targets_mean": 3672.7, "valid_targets_min": 465 }, { "epoch": 5.562310030395137, "grad_norm": 0.44549612335892824, "learning_rate": 4.934297184446617e-06, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.15832307934761047, "step": 3660, "valid_targets_mean": 5213.5, "valid_targets_min": 1002 }, { "epoch": 5.569908814589666, "grad_norm": 0.5093597450581251, "learning_rate": 4.884557308885302e-06, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.16333602368831635, "step": 3665, "valid_targets_mean": 4690.4, "valid_targets_min": 876 }, { "epoch": 5.577507598784194, "grad_norm": 0.5062778786472242, "learning_rate": 4.835034508936736e-06, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.15072304010391235, "step": 3670, "valid_targets_mean": 4472.8, "valid_targets_min": 863 }, { "epoch": 5.585106382978723, "grad_norm": 0.4887232514300285, "learning_rate": 4.785729495806804e-06, "loss": 0.1489, "loss_nan_ranks": 0, "loss_rank_avg": 0.1506553441286087, "step": 3675, "valid_targets_mean": 4468.6, "valid_targets_min": 1870 }, { "epoch": 5.592705167173253, "grad_norm": 0.5178118286048965, "learning_rate": 4.736642977573745e-06, "loss": 0.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.14603829383850098, "step": 3680, "valid_targets_mean": 3900.1, "valid_targets_min": 314 }, { "epoch": 5.600303951367781, "grad_norm": 0.49021784557999176, "learning_rate": 4.6877756591779465e-06, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.1614750772714615, "step": 3685, "valid_targets_mean": 4549.1, "valid_targets_min": 1530 }, { "epoch": 5.60790273556231, "grad_norm": 0.46685253564728685, "learning_rate": 4.63912824241183e-06, "loss": 0.1479, "loss_nan_ranks": 0, "loss_rank_avg": 0.15664935111999512, "step": 3690, "valid_targets_mean": 4078.2, "valid_targets_min": 702 }, { "epoch": 5.6155015197568385, "grad_norm": 0.4476391544726595, "learning_rate": 4.590701425909763e-06, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.1614711433649063, "step": 3695, "valid_targets_mean": 5204.6, "valid_targets_min": 1871 }, { "epoch": 5.623100303951368, "grad_norm": 0.46752237532336416, "learning_rate": 4.5424959051380376e-06, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.14600232243537903, "step": 3700, "valid_targets_mean": 4345.4, "valid_targets_min": 1418 }, { "epoch": 5.630699088145897, "grad_norm": 0.498907377725208, "learning_rate": 4.4945123723848785e-06, "loss": 0.1668, "loss_nan_ranks": 0, "loss_rank_avg": 0.16958801448345184, "step": 3705, "valid_targets_mean": 4744.0, "valid_targets_min": 655 }, { "epoch": 5.638297872340425, "grad_norm": 0.47032248993505454, "learning_rate": 4.446751516750496e-06, "loss": 0.1441, "loss_nan_ranks": 0, "loss_rank_avg": 0.15484699606895447, "step": 3710, "valid_targets_mean": 4455.9, "valid_targets_min": 513 }, { "epoch": 5.645896656534955, "grad_norm": 0.49291725666506586, "learning_rate": 4.399214024137199e-06, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.1515854448080063, "step": 3715, "valid_targets_mean": 4026.5, "valid_targets_min": 401 }, { "epoch": 5.6534954407294835, "grad_norm": 0.42768293201723206, "learning_rate": 4.351900577239534e-06, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.1308768093585968, "step": 3720, "valid_targets_mean": 5203.2, "valid_targets_min": 511 }, { "epoch": 5.661094224924012, "grad_norm": 0.419913357256391, "learning_rate": 4.30481185553449e-06, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.15996746718883514, "step": 3725, "valid_targets_mean": 6209.4, "valid_targets_min": 3964 }, { "epoch": 5.668693009118541, "grad_norm": 0.5024514745126758, "learning_rate": 4.2579485352717365e-06, "loss": 0.1429, "loss_nan_ranks": 0, "loss_rank_avg": 0.14928898215293884, "step": 3730, "valid_targets_mean": 5061.5, "valid_targets_min": 854 }, { "epoch": 5.676291793313069, "grad_norm": 0.6107697257765264, "learning_rate": 4.211311289463913e-06, "loss": 0.1791, "loss_nan_ranks": 0, "loss_rank_avg": 0.212265282869339, "step": 3735, "valid_targets_mean": 2980.9, "valid_targets_min": 613 }, { "epoch": 5.683890577507599, "grad_norm": 0.40762228356266644, "learning_rate": 4.164900787876958e-06, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.15725256502628326, "step": 3740, "valid_targets_mean": 5801.9, "valid_targets_min": 1647 }, { "epoch": 5.691489361702128, "grad_norm": 0.42068151608687643, "learning_rate": 4.118717697020503e-06, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.15178656578063965, "step": 3745, "valid_targets_mean": 5270.4, "valid_targets_min": 714 }, { "epoch": 5.699088145896656, "grad_norm": 0.510742750219421, "learning_rate": 4.072762680138283e-06, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.16748473048210144, "step": 3750, "valid_targets_mean": 4111.5, "valid_targets_min": 690 }, { "epoch": 5.706686930091186, "grad_norm": 0.4725979697075687, "learning_rate": 4.02703639719863e-06, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.16421647369861603, "step": 3755, "valid_targets_mean": 5007.1, "valid_targets_min": 1593 }, { "epoch": 5.714285714285714, "grad_norm": 0.4858255836304888, "learning_rate": 3.981539504884975e-06, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.1452382504940033, "step": 3760, "valid_targets_mean": 4335.0, "valid_targets_min": 268 }, { "epoch": 5.721884498480243, "grad_norm": 0.496365033025088, "learning_rate": 3.936272656586455e-06, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.1607646495103836, "step": 3765, "valid_targets_mean": 4691.0, "valid_targets_min": 801 }, { "epoch": 5.729483282674772, "grad_norm": 0.49339220005728074, "learning_rate": 3.891236502388463e-06, "loss": 0.1399, "loss_nan_ranks": 0, "loss_rank_avg": 0.12876826524734497, "step": 3770, "valid_targets_mean": 3568.1, "valid_targets_min": 629 }, { "epoch": 5.737082066869301, "grad_norm": 0.42864321603538963, "learning_rate": 3.846431689063395e-06, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.14634914696216583, "step": 3775, "valid_targets_mean": 5067.4, "valid_targets_min": 1740 }, { "epoch": 5.74468085106383, "grad_norm": 0.4858809112101771, "learning_rate": 3.801858860061276e-06, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.15183153748512268, "step": 3780, "valid_targets_mean": 4308.7, "valid_targets_min": 2342 }, { "epoch": 5.7522796352583585, "grad_norm": 0.430010773677836, "learning_rate": 3.757518655500607e-06, "loss": 0.1413, "loss_nan_ranks": 0, "loss_rank_avg": 0.11490476876497269, "step": 3785, "valid_targets_mean": 4636.7, "valid_targets_min": 1770 }, { "epoch": 5.759878419452887, "grad_norm": 0.44137928337029025, "learning_rate": 3.7134117121590783e-06, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.1602618247270584, "step": 3790, "valid_targets_mean": 5387.0, "valid_targets_min": 1520 }, { "epoch": 5.767477203647417, "grad_norm": 0.49716171756169814, "learning_rate": 3.6695386634645268e-06, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.17046484351158142, "step": 3795, "valid_targets_mean": 3979.0, "valid_targets_min": 637 }, { "epoch": 5.775075987841945, "grad_norm": 0.6225472640133536, "learning_rate": 3.625900139485732e-06, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.16933000087738037, "step": 3800, "valid_targets_mean": 3247.3, "valid_targets_min": 403 }, { "epoch": 5.782674772036474, "grad_norm": 0.4826561130766123, "learning_rate": 3.5824967669234712e-06, "loss": 0.1677, "loss_nan_ranks": 0, "loss_rank_avg": 0.14927777647972107, "step": 3805, "valid_targets_mean": 4297.8, "valid_targets_min": 479 }, { "epoch": 5.7902735562310035, "grad_norm": 0.4594251420598871, "learning_rate": 3.539329169101424e-06, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.15365689992904663, "step": 3810, "valid_targets_mean": 5167.4, "valid_targets_min": 892 }, { "epoch": 5.797872340425532, "grad_norm": 0.4557619581698914, "learning_rate": 3.49639796595731e-06, "loss": 0.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.1744815707206726, "step": 3815, "valid_targets_mean": 5195.3, "valid_targets_min": 634 }, { "epoch": 5.805471124620061, "grad_norm": 0.46537892238846895, "learning_rate": 3.453703774033901e-06, "loss": 0.1587, "loss_nan_ranks": 0, "loss_rank_avg": 0.14466017484664917, "step": 3820, "valid_targets_mean": 4648.0, "valid_targets_min": 736 }, { "epoch": 5.813069908814589, "grad_norm": 0.5247551115664364, "learning_rate": 3.4112472064702473e-06, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.16951002180576324, "step": 3825, "valid_targets_mean": 4100.8, "valid_targets_min": 529 }, { "epoch": 5.820668693009118, "grad_norm": 0.4408079538837663, "learning_rate": 3.369028872992792e-06, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.15143227577209473, "step": 3830, "valid_targets_mean": 5215.6, "valid_targets_min": 1009 }, { "epoch": 5.828267477203648, "grad_norm": 0.5248938288172915, "learning_rate": 3.327049379906695e-06, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.17994189262390137, "step": 3835, "valid_targets_mean": 4604.6, "valid_targets_min": 570 }, { "epoch": 5.835866261398176, "grad_norm": 0.5052356507109963, "learning_rate": 3.2853093300870452e-06, "loss": 0.1457, "loss_nan_ranks": 0, "loss_rank_avg": 0.1394600123167038, "step": 3840, "valid_targets_mean": 4017.8, "valid_targets_min": 736 }, { "epoch": 5.843465045592705, "grad_norm": 0.47463044811940924, "learning_rate": 3.2438093229702905e-06, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.15373006463050842, "step": 3845, "valid_targets_mean": 4134.0, "valid_targets_min": 410 }, { "epoch": 5.851063829787234, "grad_norm": 0.513814275937601, "learning_rate": 3.202549954545533e-06, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.23078633844852448, "step": 3850, "valid_targets_mean": 5543.1, "valid_targets_min": 655 }, { "epoch": 5.858662613981763, "grad_norm": 0.48073524570765763, "learning_rate": 3.161531817346062e-06, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.17668002843856812, "step": 3855, "valid_targets_mean": 4446.9, "valid_targets_min": 449 }, { "epoch": 5.866261398176292, "grad_norm": 0.4258287069585612, "learning_rate": 3.120755500440762e-06, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.14281289279460907, "step": 3860, "valid_targets_mean": 5058.1, "valid_targets_min": 1100 }, { "epoch": 5.87386018237082, "grad_norm": 0.4556314380528612, "learning_rate": 3.0802215894257336e-06, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.15817520022392273, "step": 3865, "valid_targets_mean": 4869.2, "valid_targets_min": 2426 }, { "epoch": 5.88145896656535, "grad_norm": 0.632880711013422, "learning_rate": 3.0399306664158e-06, "loss": 0.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.1440334916114807, "step": 3870, "valid_targets_mean": 4294.8, "valid_targets_min": 1072 }, { "epoch": 5.8890577507598785, "grad_norm": 0.40158185981708566, "learning_rate": 2.9998833100362336e-06, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.1560600996017456, "step": 3875, "valid_targets_mean": 5631.6, "valid_targets_min": 1728 }, { "epoch": 5.896656534954407, "grad_norm": 0.500623763450671, "learning_rate": 2.9600800954143572e-06, "loss": 0.138, "loss_nan_ranks": 0, "loss_rank_avg": 0.1587526947259903, "step": 3880, "valid_targets_mean": 4028.8, "valid_targets_min": 666 }, { "epoch": 5.904255319148936, "grad_norm": 0.4944868321896879, "learning_rate": 2.9205215941713704e-06, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.16634200513362885, "step": 3885, "valid_targets_mean": 4611.9, "valid_targets_min": 732 }, { "epoch": 5.911854103343465, "grad_norm": 0.5115742550534301, "learning_rate": 2.8812083744140616e-06, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.15021023154258728, "step": 3890, "valid_targets_mean": 4236.3, "valid_targets_min": 1104 }, { "epoch": 5.919452887537994, "grad_norm": 0.48224861462921226, "learning_rate": 2.842141000726726e-06, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.1501300185918808, "step": 3895, "valid_targets_mean": 4213.5, "valid_targets_min": 774 }, { "epoch": 5.927051671732523, "grad_norm": 0.4030631035629361, "learning_rate": 2.8033200341629886e-06, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.12463116645812988, "step": 3900, "valid_targets_mean": 5398.5, "valid_targets_min": 1514 }, { "epoch": 5.934650455927052, "grad_norm": 0.45096444866968627, "learning_rate": 2.7647460322377927e-06, "loss": 0.1766, "loss_nan_ranks": 0, "loss_rank_avg": 0.17850109934806824, "step": 3905, "valid_targets_mean": 5562.8, "valid_targets_min": 569 }, { "epoch": 5.942249240121581, "grad_norm": 0.41781952891112895, "learning_rate": 2.72641954891937e-06, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.145452082157135, "step": 3910, "valid_targets_mean": 5237.6, "valid_targets_min": 787 }, { "epoch": 5.949848024316109, "grad_norm": 0.462920182118315, "learning_rate": 2.688341134621295e-06, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.1589956283569336, "step": 3915, "valid_targets_mean": 5620.2, "valid_targets_min": 797 }, { "epoch": 5.957446808510638, "grad_norm": 0.48846090610407683, "learning_rate": 2.6505113361945833e-06, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.18880805373191833, "step": 3920, "valid_targets_mean": 4641.4, "valid_targets_min": 879 }, { "epoch": 5.9650455927051675, "grad_norm": 0.440227878411004, "learning_rate": 2.612930696919822e-06, "loss": 0.1488, "loss_nan_ranks": 0, "loss_rank_avg": 0.13358448445796967, "step": 3925, "valid_targets_mean": 4184.0, "valid_targets_min": 559 }, { "epoch": 5.972644376899696, "grad_norm": 0.4575207059455806, "learning_rate": 2.5755997564993894e-06, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.14469373226165771, "step": 3930, "valid_targets_mean": 4649.6, "valid_targets_min": 2261 }, { "epoch": 5.980243161094225, "grad_norm": 0.5005233906873359, "learning_rate": 2.5385190510496858e-06, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.17244486510753632, "step": 3935, "valid_targets_mean": 4924.8, "valid_targets_min": 171 }, { "epoch": 5.9878419452887535, "grad_norm": 0.4458252216107338, "learning_rate": 2.5016891130934463e-06, "loss": 0.1457, "loss_nan_ranks": 0, "loss_rank_avg": 0.13665539026260376, "step": 3940, "valid_targets_mean": 4990.1, "valid_targets_min": 500 }, { "epoch": 5.995440729483283, "grad_norm": 0.4846406288628859, "learning_rate": 2.465110471552086e-06, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.16603650152683258, "step": 3945, "valid_targets_mean": 4758.2, "valid_targets_min": 599 }, { "epoch": 6.003039513677812, "grad_norm": 0.44214905635705837, "learning_rate": 2.4287836517381113e-06, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.11986207216978073, "step": 3950, "valid_targets_mean": 4267.4, "valid_targets_min": 335 }, { "epoch": 6.01063829787234, "grad_norm": 0.4887571085350468, "learning_rate": 2.392709175347554e-06, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.14001381397247314, "step": 3955, "valid_targets_mean": 4841.9, "valid_targets_min": 797 }, { "epoch": 6.018237082066869, "grad_norm": 0.5312808060591666, "learning_rate": 2.356887560452528e-06, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.17127478122711182, "step": 3960, "valid_targets_mean": 3657.6, "valid_targets_min": 713 }, { "epoch": 6.025835866261398, "grad_norm": 0.49420144944896355, "learning_rate": 2.321319321493718e-06, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.15153075754642487, "step": 3965, "valid_targets_mean": 4141.9, "valid_targets_min": 792 }, { "epoch": 6.033434650455927, "grad_norm": 0.43348847119788875, "learning_rate": 2.2860049692730745e-06, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.15093687176704407, "step": 3970, "valid_targets_mean": 5298.1, "valid_targets_min": 491 }, { "epoch": 6.041033434650456, "grad_norm": 0.4852668062537144, "learning_rate": 2.2509450109463903e-06, "loss": 0.1462, "loss_nan_ranks": 0, "loss_rank_avg": 0.15192578732967377, "step": 3975, "valid_targets_mean": 4195.6, "valid_targets_min": 646 }, { "epoch": 6.048632218844984, "grad_norm": 0.4985600383895827, "learning_rate": 2.2161399500161005e-06, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.12650343775749207, "step": 3980, "valid_targets_mean": 4298.5, "valid_targets_min": 1887 }, { "epoch": 6.056231003039514, "grad_norm": 0.46036482703942144, "learning_rate": 2.1815902863239826e-06, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.12870556116104126, "step": 3985, "valid_targets_mean": 4722.8, "valid_targets_min": 1027 }, { "epoch": 6.0638297872340425, "grad_norm": 0.4724257952962997, "learning_rate": 2.1472965160440307e-06, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.15059977769851685, "step": 3990, "valid_targets_mean": 4350.8, "valid_targets_min": 1618 }, { "epoch": 6.071428571428571, "grad_norm": 0.4736941877158723, "learning_rate": 2.1132591316752824e-06, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.12970831990242004, "step": 3995, "valid_targets_mean": 4671.1, "valid_targets_min": 1136 }, { "epoch": 6.079027355623101, "grad_norm": 0.4790995642913263, "learning_rate": 2.079478622034803e-06, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.1599026918411255, "step": 4000, "valid_targets_mean": 5553.9, "valid_targets_min": 2157 }, { "epoch": 6.086626139817629, "grad_norm": 0.5750210601223926, "learning_rate": 2.045955472250598e-06, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.1329852193593979, "step": 4005, "valid_targets_mean": 4740.1, "valid_targets_min": 658 }, { "epoch": 6.094224924012158, "grad_norm": 0.5356962782262873, "learning_rate": 2.012690163754716e-06, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.1583370566368103, "step": 4010, "valid_targets_mean": 3881.9, "valid_targets_min": 833 }, { "epoch": 6.101823708206687, "grad_norm": 0.5430593717962985, "learning_rate": 1.9796831742762658e-06, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.17519140243530273, "step": 4015, "valid_targets_mean": 4008.7, "valid_targets_min": 513 }, { "epoch": 6.109422492401216, "grad_norm": 0.5395476454999809, "learning_rate": 1.9469349778346223e-06, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.1673513501882553, "step": 4020, "valid_targets_mean": 3863.8, "valid_targets_min": 862 }, { "epoch": 6.117021276595745, "grad_norm": 0.6041814504745721, "learning_rate": 1.9144460447325564e-06, "loss": 0.1433, "loss_nan_ranks": 0, "loss_rank_avg": 0.16433076560497284, "step": 4025, "valid_targets_mean": 4698.3, "valid_targets_min": 821 }, { "epoch": 6.124620060790273, "grad_norm": 0.6094776194613557, "learning_rate": 1.8822168415495422e-06, "loss": 0.1453, "loss_nan_ranks": 0, "loss_rank_avg": 0.13730981945991516, "step": 4030, "valid_targets_mean": 4077.6, "valid_targets_min": 901 }, { "epoch": 6.132218844984802, "grad_norm": 0.45063574077263974, "learning_rate": 1.8502478311349947e-06, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.16246050596237183, "step": 4035, "valid_targets_mean": 5466.6, "valid_targets_min": 2424 }, { "epoch": 6.139817629179332, "grad_norm": 0.4816199109533305, "learning_rate": 1.8185394726016791e-06, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.1370609700679779, "step": 4040, "valid_targets_mean": 4561.9, "valid_targets_min": 743 }, { "epoch": 6.14741641337386, "grad_norm": 0.6732958197054807, "learning_rate": 1.7870922213190755e-06, "loss": 0.1581, "loss_nan_ranks": 0, "loss_rank_avg": 0.16209891438484192, "step": 4045, "valid_targets_mean": 3887.8, "valid_targets_min": 550 }, { "epoch": 6.155015197568389, "grad_norm": 0.4601061012528339, "learning_rate": 1.7559065289068633e-06, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.13671234250068665, "step": 4050, "valid_targets_mean": 5133.4, "valid_targets_min": 479 }, { "epoch": 6.1626139817629175, "grad_norm": 0.43746420290219207, "learning_rate": 1.72498284322842e-06, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.1267484724521637, "step": 4055, "valid_targets_mean": 5035.9, "valid_targets_min": 1853 }, { "epoch": 6.170212765957447, "grad_norm": 0.4569139573946025, "learning_rate": 1.694321608384406e-06, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.14077520370483398, "step": 4060, "valid_targets_mean": 5069.5, "valid_targets_min": 2002 }, { "epoch": 6.177811550151976, "grad_norm": 0.43274533973618445, "learning_rate": 1.663923264706373e-06, "loss": 0.1329, "loss_nan_ranks": 0, "loss_rank_avg": 0.14554743468761444, "step": 4065, "valid_targets_mean": 5077.8, "valid_targets_min": 519 }, { "epoch": 6.185410334346504, "grad_norm": 0.47582107432910764, "learning_rate": 1.6337882487504452e-06, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.14857840538024902, "step": 4070, "valid_targets_mean": 4424.7, "valid_targets_min": 674 }, { "epoch": 6.193009118541034, "grad_norm": 0.5274167558239128, "learning_rate": 1.603916993291048e-06, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.14230819046497345, "step": 4075, "valid_targets_mean": 3961.1, "valid_targets_min": 654 }, { "epoch": 6.2006079027355625, "grad_norm": 0.49913070570635226, "learning_rate": 1.5743099273146967e-06, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.1440865695476532, "step": 4080, "valid_targets_mean": 5009.5, "valid_targets_min": 444 }, { "epoch": 6.208206686930091, "grad_norm": 0.4571022258136094, "learning_rate": 1.5449674760138344e-06, "loss": 0.1355, "loss_nan_ranks": 0, "loss_rank_avg": 0.1474510282278061, "step": 4085, "valid_targets_mean": 4348.4, "valid_targets_min": 770 }, { "epoch": 6.21580547112462, "grad_norm": 0.4714848047264726, "learning_rate": 1.5158900607807248e-06, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.16296353936195374, "step": 4090, "valid_targets_mean": 4949.5, "valid_targets_min": 694 }, { "epoch": 6.223404255319149, "grad_norm": 0.4322780542533103, "learning_rate": 1.4870780992013956e-06, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.13294166326522827, "step": 4095, "valid_targets_mean": 4950.1, "valid_targets_min": 329 }, { "epoch": 6.231003039513678, "grad_norm": 0.5464674366866006, "learning_rate": 1.4585320050496531e-06, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.15174424648284912, "step": 4100, "valid_targets_mean": 4007.2, "valid_targets_min": 834 }, { "epoch": 6.238601823708207, "grad_norm": 0.42685774893365297, "learning_rate": 1.4302521882811316e-06, "loss": 0.1441, "loss_nan_ranks": 0, "loss_rank_avg": 0.1383514404296875, "step": 4105, "valid_targets_mean": 5403.9, "valid_targets_min": 918 }, { "epoch": 6.246200607902735, "grad_norm": 0.5366963612937214, "learning_rate": 1.4022390550274034e-06, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.15787436068058014, "step": 4110, "valid_targets_mean": 3990.0, "valid_targets_min": 434 }, { "epoch": 6.253799392097265, "grad_norm": 0.46724324680744234, "learning_rate": 1.3744930075901563e-06, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.14154699444770813, "step": 4115, "valid_targets_mean": 4727.9, "valid_targets_min": 588 }, { "epoch": 6.261398176291793, "grad_norm": 0.41711994711720174, "learning_rate": 1.3470144444354061e-06, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.1419452279806137, "step": 4120, "valid_targets_mean": 5510.2, "valid_targets_min": 713 }, { "epoch": 6.268996960486322, "grad_norm": 0.5220642496809625, "learning_rate": 1.3198037601877789e-06, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.1353391706943512, "step": 4125, "valid_targets_mean": 4115.4, "valid_targets_min": 450 }, { "epoch": 6.276595744680851, "grad_norm": 0.4939240759429581, "learning_rate": 1.2928613456248473e-06, "loss": 0.1614, "loss_nan_ranks": 0, "loss_rank_avg": 0.15414312481880188, "step": 4130, "valid_targets_mean": 5176.1, "valid_targets_min": 571 }, { "epoch": 6.28419452887538, "grad_norm": 0.442808139834025, "learning_rate": 1.266187587671508e-06, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.15302585065364838, "step": 4135, "valid_targets_mean": 5258.6, "valid_targets_min": 2495 }, { "epoch": 6.291793313069909, "grad_norm": 0.4548322696937593, "learning_rate": 1.2397828693944346e-06, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.14306071400642395, "step": 4140, "valid_targets_mean": 4863.1, "valid_targets_min": 1948 }, { "epoch": 6.2993920972644375, "grad_norm": 0.46459072507225524, "learning_rate": 1.2136475699965766e-06, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.1553143858909607, "step": 4145, "valid_targets_mean": 4614.7, "valid_targets_min": 816 }, { "epoch": 6.306990881458967, "grad_norm": 0.4740383536049804, "learning_rate": 1.1877820648117045e-06, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.13636600971221924, "step": 4150, "valid_targets_mean": 4426.7, "valid_targets_min": 668 }, { "epoch": 6.314589665653496, "grad_norm": 0.6354900899788738, "learning_rate": 1.162186725299026e-06, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.155159130692482, "step": 4155, "valid_targets_mean": 3329.7, "valid_targets_min": 585 }, { "epoch": 6.322188449848024, "grad_norm": 0.4835553520976796, "learning_rate": 1.1368619190378527e-06, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.17658662796020508, "step": 4160, "valid_targets_mean": 4895.8, "valid_targets_min": 1482 }, { "epoch": 6.329787234042553, "grad_norm": 0.4554986467408132, "learning_rate": 1.1118080097223194e-06, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.15265491604804993, "step": 4165, "valid_targets_mean": 5167.2, "valid_targets_min": 1292 }, { "epoch": 6.3373860182370825, "grad_norm": 0.41973694830585506, "learning_rate": 1.0870253571561595e-06, "loss": 0.1551, "loss_nan_ranks": 0, "loss_rank_avg": 0.12299495190382004, "step": 4170, "valid_targets_mean": 4780.7, "valid_targets_min": 970 }, { "epoch": 6.344984802431611, "grad_norm": 0.5118900681918644, "learning_rate": 1.0625143172475404e-06, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.15326988697052002, "step": 4175, "valid_targets_mean": 4208.6, "valid_targets_min": 636 }, { "epoch": 6.35258358662614, "grad_norm": 0.49642090601129557, "learning_rate": 1.0382752420039455e-06, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.15455183386802673, "step": 4180, "valid_targets_mean": 4102.3, "valid_targets_min": 997 }, { "epoch": 6.360182370820668, "grad_norm": 0.45380918848581747, "learning_rate": 1.0143084795271329e-06, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.15013962984085083, "step": 4185, "valid_targets_mean": 4628.6, "valid_targets_min": 1572 }, { "epoch": 6.367781155015198, "grad_norm": 0.5198176682483998, "learning_rate": 9.906143740081232e-07, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.15279626846313477, "step": 4190, "valid_targets_mean": 3914.1, "valid_targets_min": 365 }, { "epoch": 6.375379939209727, "grad_norm": 0.4840441603322201, "learning_rate": 9.671932657222593e-07, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.14245177805423737, "step": 4195, "valid_targets_mean": 4812.6, "valid_targets_min": 370 }, { "epoch": 6.382978723404255, "grad_norm": 0.49127649884609786, "learning_rate": 9.440454910243235e-07, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.1520758867263794, "step": 4200, "valid_targets_mean": 4315.1, "valid_targets_min": 517 }, { "epoch": 6.390577507598784, "grad_norm": 0.4383379165078549, "learning_rate": 9.211713823437063e-07, "loss": 0.135, "loss_nan_ranks": 0, "loss_rank_avg": 0.1275199055671692, "step": 4205, "valid_targets_mean": 5704.6, "valid_targets_min": 581 }, { "epoch": 6.398176291793313, "grad_norm": 0.5022657150694129, "learning_rate": 8.985712681796288e-07, "loss": 0.1528, "loss_nan_ranks": 0, "loss_rank_avg": 0.17914274334907532, "step": 4210, "valid_targets_mean": 4508.4, "valid_targets_min": 640 }, { "epoch": 6.405775075987842, "grad_norm": 0.443057452645931, "learning_rate": 8.762454730964265e-07, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.15875935554504395, "step": 4215, "valid_targets_mean": 5279.9, "valid_targets_min": 972 }, { "epoch": 6.413373860182371, "grad_norm": 0.5449589653106505, "learning_rate": 8.541943177188882e-07, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.14582566916942596, "step": 4220, "valid_targets_mean": 4343.2, "valid_targets_min": 892 }, { "epoch": 6.420972644376899, "grad_norm": 0.4997679647771693, "learning_rate": 8.324181187276581e-07, "loss": 0.1643, "loss_nan_ranks": 0, "loss_rank_avg": 0.15510517358779907, "step": 4225, "valid_targets_mean": 4085.7, "valid_targets_min": 912 }, { "epoch": 6.428571428571429, "grad_norm": 0.44678133251760943, "learning_rate": 8.109171888546763e-07, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.15751153230667114, "step": 4230, "valid_targets_mean": 5778.9, "valid_targets_min": 1954 }, { "epoch": 6.4361702127659575, "grad_norm": 0.46788177391921826, "learning_rate": 7.896918368786921e-07, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.15475589036941528, "step": 4235, "valid_targets_mean": 5169.8, "valid_targets_min": 398 }, { "epoch": 6.443768996960486, "grad_norm": 0.5529538967645823, "learning_rate": 7.687423676208361e-07, "loss": 0.1455, "loss_nan_ranks": 0, "loss_rank_avg": 0.13819439709186554, "step": 4240, "valid_targets_mean": 3202.6, "valid_targets_min": 528 }, { "epoch": 6.451367781155016, "grad_norm": 0.5420949591531663, "learning_rate": 7.480690819402348e-07, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.1723976731300354, "step": 4245, "valid_targets_mean": 3846.0, "valid_targets_min": 630 }, { "epoch": 6.458966565349544, "grad_norm": 0.46741861641823984, "learning_rate": 7.276722767296873e-07, "loss": 0.1677, "loss_nan_ranks": 0, "loss_rank_avg": 0.1849384605884552, "step": 4250, "valid_targets_mean": 5119.9, "valid_targets_min": 883 }, { "epoch": 6.466565349544073, "grad_norm": 0.4582713436855528, "learning_rate": 7.075522449114158e-07, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.15820877254009247, "step": 4255, "valid_targets_mean": 5030.8, "valid_targets_min": 802 }, { "epoch": 6.474164133738602, "grad_norm": 0.5211860109572727, "learning_rate": 6.877092754328419e-07, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.13718628883361816, "step": 4260, "valid_targets_mean": 3807.9, "valid_targets_min": 845 }, { "epoch": 6.481762917933131, "grad_norm": 0.45451059770584273, "learning_rate": 6.681436532624474e-07, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.1656309813261032, "step": 4265, "valid_targets_mean": 5183.2, "valid_targets_min": 1002 }, { "epoch": 6.48936170212766, "grad_norm": 0.47843071748812777, "learning_rate": 6.488556593856809e-07, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.150562584400177, "step": 4270, "valid_targets_mean": 4543.6, "valid_targets_min": 656 }, { "epoch": 6.496960486322188, "grad_norm": 0.5319539824885515, "learning_rate": 6.298455708009176e-07, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.15512758493423462, "step": 4275, "valid_targets_mean": 3799.5, "valid_targets_min": 395 }, { "epoch": 6.504559270516717, "grad_norm": 0.4705596941066166, "learning_rate": 6.111136605154877e-07, "loss": 0.1457, "loss_nan_ranks": 0, "loss_rank_avg": 0.16856907308101654, "step": 4280, "valid_targets_mean": 4642.4, "valid_targets_min": 589 }, { "epoch": 6.5121580547112465, "grad_norm": 0.46141711207212177, "learning_rate": 5.926601975417501e-07, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.17225798964500427, "step": 4285, "valid_targets_mean": 4939.4, "valid_targets_min": 706 }, { "epoch": 6.519756838905775, "grad_norm": 0.4495104074555779, "learning_rate": 5.744854468932315e-07, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.1445414125919342, "step": 4290, "valid_targets_mean": 4603.4, "valid_targets_min": 810 }, { "epoch": 6.527355623100304, "grad_norm": 0.5733777706336946, "learning_rate": 5.565896695808203e-07, "loss": 0.1705, "loss_nan_ranks": 0, "loss_rank_avg": 0.16275358200073242, "step": 4295, "valid_targets_mean": 4785.0, "valid_targets_min": 599 }, { "epoch": 6.5349544072948325, "grad_norm": 0.8991578623134154, "learning_rate": 5.389731226090189e-07, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.14771892130374908, "step": 4300, "valid_targets_mean": 4996.3, "valid_targets_min": 981 }, { "epoch": 6.542553191489362, "grad_norm": 0.4730812664882942, "learning_rate": 5.216360589722546e-07, "loss": 0.134, "loss_nan_ranks": 0, "loss_rank_avg": 0.12634432315826416, "step": 4305, "valid_targets_mean": 4793.1, "valid_targets_min": 689 }, { "epoch": 6.550151975683891, "grad_norm": 0.7912559796750507, "learning_rate": 5.045787276512371e-07, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.14239290356636047, "step": 4310, "valid_targets_mean": 4268.8, "valid_targets_min": 558 }, { "epoch": 6.557750759878419, "grad_norm": 0.5029546562969596, "learning_rate": 4.878013736093979e-07, "loss": 0.1436, "loss_nan_ranks": 0, "loss_rank_avg": 0.1558806449174881, "step": 4315, "valid_targets_mean": 4656.5, "valid_targets_min": 767 }, { "epoch": 6.565349544072948, "grad_norm": 0.4604621873568329, "learning_rate": 4.713042377893562e-07, "loss": 0.1377, "loss_nan_ranks": 0, "loss_rank_avg": 0.1444740742444992, "step": 4320, "valid_targets_mean": 4422.7, "valid_targets_min": 346 }, { "epoch": 6.572948328267477, "grad_norm": 0.4561980791707648, "learning_rate": 4.550875571094726e-07, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.14359544217586517, "step": 4325, "valid_targets_mean": 4979.9, "valid_targets_min": 2820 }, { "epoch": 6.580547112462006, "grad_norm": 0.47209358910428856, "learning_rate": 4.391515644604383e-07, "loss": 0.1502, "loss_nan_ranks": 0, "loss_rank_avg": 0.1348213255405426, "step": 4330, "valid_targets_mean": 4494.7, "valid_targets_min": 589 }, { "epoch": 6.588145896656535, "grad_norm": 0.4994707929739602, "learning_rate": 4.2349648870193103e-07, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.15195885300636292, "step": 4335, "valid_targets_mean": 4239.8, "valid_targets_min": 307 }, { "epoch": 6.595744680851064, "grad_norm": 0.44042761045131223, "learning_rate": 4.081225546593337e-07, "loss": 0.1513, "loss_nan_ranks": 0, "loss_rank_avg": 0.129265695810318, "step": 4340, "valid_targets_mean": 5283.0, "valid_targets_min": 1159 }, { "epoch": 6.603343465045593, "grad_norm": 0.47257646281879734, "learning_rate": 3.9302998312049865e-07, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.14243176579475403, "step": 4345, "valid_targets_mean": 5513.4, "valid_targets_min": 1072 }, { "epoch": 6.6109422492401215, "grad_norm": 0.5058368728464357, "learning_rate": 3.782189908325817e-07, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.14209382236003876, "step": 4350, "valid_targets_mean": 4845.4, "valid_targets_min": 876 }, { "epoch": 6.61854103343465, "grad_norm": 0.7222155225557564, "learning_rate": 3.636897904989312e-07, "loss": 0.1581, "loss_nan_ranks": 0, "loss_rank_avg": 0.17290833592414856, "step": 4355, "valid_targets_mean": 5422.5, "valid_targets_min": 833 }, { "epoch": 6.62613981762918, "grad_norm": 0.5233180981965705, "learning_rate": 3.494425907760235e-07, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.1492675244808197, "step": 4360, "valid_targets_mean": 4823.8, "valid_targets_min": 1224 }, { "epoch": 6.633738601823708, "grad_norm": 0.5428953839010765, "learning_rate": 3.3547759627047927e-07, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.16122207045555115, "step": 4365, "valid_targets_mean": 3899.6, "valid_targets_min": 753 }, { "epoch": 6.641337386018237, "grad_norm": 0.4419180172745714, "learning_rate": 3.2179500753611423e-07, "loss": 0.1436, "loss_nan_ranks": 0, "loss_rank_avg": 0.135797381401062, "step": 4370, "valid_targets_mean": 5275.6, "valid_targets_min": 861 }, { "epoch": 6.648936170212766, "grad_norm": 0.4922555679423693, "learning_rate": 3.0839502107106625e-07, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.13909777998924255, "step": 4375, "valid_targets_mean": 3951.1, "valid_targets_min": 702 }, { "epoch": 6.656534954407295, "grad_norm": 0.5087072512502506, "learning_rate": 2.952778293149705e-07, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.16498416662216187, "step": 4380, "valid_targets_mean": 4312.6, "valid_targets_min": 429 }, { "epoch": 6.664133738601824, "grad_norm": 0.4560459158918358, "learning_rate": 2.8244362064619777e-07, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.13717833161354065, "step": 4385, "valid_targets_mean": 5210.4, "valid_targets_min": 864 }, { "epoch": 6.671732522796352, "grad_norm": 0.5227653302420172, "learning_rate": 2.698925793791407e-07, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.13961048424243927, "step": 4390, "valid_targets_mean": 4236.1, "valid_targets_min": 534 }, { "epoch": 6.679331306990882, "grad_norm": 0.6213258302004528, "learning_rate": 2.576248857615826e-07, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.14259956777095795, "step": 4395, "valid_targets_mean": 4035.6, "valid_targets_min": 752 }, { "epoch": 6.686930091185411, "grad_norm": 0.4688652989866426, "learning_rate": 2.4564071597209304e-07, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.15681865811347961, "step": 4400, "valid_targets_mean": 4584.2, "valid_targets_min": 869 }, { "epoch": 6.694528875379939, "grad_norm": 0.44005419382672806, "learning_rate": 2.3394024211750964e-07, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.1523476541042328, "step": 4405, "valid_targets_mean": 4952.2, "valid_targets_min": 646 }, { "epoch": 6.702127659574468, "grad_norm": 0.5205262877358279, "learning_rate": 2.2252363223045358e-07, "loss": 0.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.16646242141723633, "step": 4410, "valid_targets_mean": 4151.1, "valid_targets_min": 820 }, { "epoch": 6.7097264437689965, "grad_norm": 0.40766981515095174, "learning_rate": 2.1139105026693586e-07, "loss": 0.139, "loss_nan_ranks": 0, "loss_rank_avg": 0.11196255683898926, "step": 4415, "valid_targets_mean": 5557.6, "valid_targets_min": 2410 }, { "epoch": 6.717325227963526, "grad_norm": 0.4673986831108265, "learning_rate": 2.0054265610397916e-07, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.1210668534040451, "step": 4420, "valid_targets_mean": 3992.8, "valid_targets_min": 936 }, { "epoch": 6.724924012158055, "grad_norm": 0.5619671678982381, "learning_rate": 1.8997860553733981e-07, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.17317882180213928, "step": 4425, "valid_targets_mean": 3874.4, "valid_targets_min": 446 }, { "epoch": 6.732522796352583, "grad_norm": 0.4280630319229206, "learning_rate": 1.7969905027926504e-07, "loss": 0.1758, "loss_nan_ranks": 0, "loss_rank_avg": 0.1904495656490326, "step": 4430, "valid_targets_mean": 6671.5, "valid_targets_min": 907 }, { "epoch": 6.740121580547113, "grad_norm": 0.44122684787277994, "learning_rate": 1.6970413795631025e-07, "loss": 0.1528, "loss_nan_ranks": 0, "loss_rank_avg": 0.14559206366539001, "step": 4435, "valid_targets_mean": 5373.0, "valid_targets_min": 595 }, { "epoch": 6.7477203647416415, "grad_norm": 0.5080820811124032, "learning_rate": 1.5999401210722075e-07, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.1340736597776413, "step": 4440, "valid_targets_mean": 3668.2, "valid_targets_min": 694 }, { "epoch": 6.75531914893617, "grad_norm": 0.5257059339394762, "learning_rate": 1.5056881218088016e-07, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.15984541177749634, "step": 4445, "valid_targets_mean": 4337.5, "valid_targets_min": 498 }, { "epoch": 6.762917933130699, "grad_norm": 0.43327223465331344, "learning_rate": 1.4142867353428514e-07, "loss": 0.1488, "loss_nan_ranks": 0, "loss_rank_avg": 0.157816082239151, "step": 4450, "valid_targets_mean": 5491.9, "valid_targets_min": 827 }, { "epoch": 6.770516717325228, "grad_norm": 0.50219861891989, "learning_rate": 1.3257372743063157e-07, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.11714717745780945, "step": 4455, "valid_targets_mean": 3812.8, "valid_targets_min": 502 }, { "epoch": 6.778115501519757, "grad_norm": 0.45055666905824504, "learning_rate": 1.2400410103740045e-07, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.14584630727767944, "step": 4460, "valid_targets_mean": 5178.9, "valid_targets_min": 516 }, { "epoch": 6.785714285714286, "grad_norm": 0.43952764279896794, "learning_rate": 1.157199174245549e-07, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.13095200061798096, "step": 4465, "valid_targets_mean": 5314.9, "valid_targets_min": 1217 }, { "epoch": 6.793313069908814, "grad_norm": 0.4738968512497199, "learning_rate": 1.0772129556275268e-07, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.12924160063266754, "step": 4470, "valid_targets_mean": 4845.8, "valid_targets_min": 843 }, { "epoch": 6.800911854103344, "grad_norm": 0.5060295374260998, "learning_rate": 1.0000835032165645e-07, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.1658594310283661, "step": 4475, "valid_targets_mean": 4230.7, "valid_targets_min": 915 }, { "epoch": 6.808510638297872, "grad_norm": 0.4466023053432, "learning_rate": 9.258119246826625e-08, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.1489754319190979, "step": 4480, "valid_targets_mean": 5316.6, "valid_targets_min": 2627 }, { "epoch": 6.816109422492401, "grad_norm": 0.46338292936158193, "learning_rate": 8.543992866534734e-08, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.14392951130867004, "step": 4485, "valid_targets_mean": 4956.6, "valid_targets_min": 409 }, { "epoch": 6.823708206686931, "grad_norm": 0.5158394667496263, "learning_rate": 7.858466146988042e-08, "loss": 0.1488, "loss_nan_ranks": 0, "loss_rank_avg": 0.16497617959976196, "step": 4490, "valid_targets_mean": 4279.7, "valid_targets_min": 775 }, { "epoch": 6.831306990881459, "grad_norm": 0.42417696152695383, "learning_rate": 7.201548933160275e-08, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.14127472043037415, "step": 4495, "valid_targets_mean": 5479.2, "valid_targets_min": 2631 }, { "epoch": 6.838905775075988, "grad_norm": 0.5211912905058261, "learning_rate": 6.573250659158481e-08, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.14878888428211212, "step": 4500, "valid_targets_mean": 4435.9, "valid_targets_min": 2412 }, { "epoch": 6.8465045592705165, "grad_norm": 0.43147229360794226, "learning_rate": 5.973580348088259e-08, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.15211549401283264, "step": 4505, "valid_targets_mean": 5367.4, "valid_targets_min": 2364 }, { "epoch": 6.854103343465045, "grad_norm": 0.4561025698955299, "learning_rate": 5.4025466119234094e-08, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.13766488432884216, "step": 4510, "valid_targets_mean": 5133.6, "valid_targets_min": 655 }, { "epoch": 6.861702127659575, "grad_norm": 0.4670200688124053, "learning_rate": 4.860157651383146e-08, "loss": 0.1457, "loss_nan_ranks": 0, "loss_rank_avg": 0.12196432799100876, "step": 4515, "valid_targets_mean": 5354.1, "valid_targets_min": 1941 }, { "epoch": 6.869300911854103, "grad_norm": 0.46811141014194185, "learning_rate": 4.346421255813527e-08, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.1508735716342926, "step": 4520, "valid_targets_mean": 4876.9, "valid_targets_min": 647 }, { "epoch": 6.876899696048632, "grad_norm": 0.5309409348069238, "learning_rate": 3.8613448030759836e-08, "loss": 0.1449, "loss_nan_ranks": 0, "loss_rank_avg": 0.1319991499185562, "step": 4525, "valid_targets_mean": 4153.0, "valid_targets_min": 558 }, { "epoch": 6.8844984802431615, "grad_norm": 0.4583034610783906, "learning_rate": 3.404935259441633e-08, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.1385440230369568, "step": 4530, "valid_targets_mean": 5040.1, "valid_targets_min": 666 }, { "epoch": 6.89209726443769, "grad_norm": 0.5760708842558298, "learning_rate": 2.977199179490686e-08, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.16344650089740753, "step": 4535, "valid_targets_mean": 4789.9, "valid_targets_min": 774 }, { "epoch": 6.899696048632219, "grad_norm": 0.5268446726565859, "learning_rate": 2.5781427060183052e-08, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.1606959104537964, "step": 4540, "valid_targets_mean": 4283.8, "valid_targets_min": 229 }, { "epoch": 6.907294832826747, "grad_norm": 0.4734646023589767, "learning_rate": 2.2077715699468928e-08, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.14003373682498932, "step": 4545, "valid_targets_mean": 4974.8, "valid_targets_min": 773 }, { "epoch": 6.914893617021277, "grad_norm": 0.4360796739556199, "learning_rate": 1.8660910902434936e-08, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.12974536418914795, "step": 4550, "valid_targets_mean": 5910.8, "valid_targets_min": 1114 }, { "epoch": 6.922492401215806, "grad_norm": 0.48684145305746557, "learning_rate": 1.5531061738436327e-08, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.15198959410190582, "step": 4555, "valid_targets_mean": 3936.3, "valid_targets_min": 1779 }, { "epoch": 6.930091185410334, "grad_norm": 0.5091294127835059, "learning_rate": 1.2688213155802598e-08, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.1628214567899704, "step": 4560, "valid_targets_mean": 4214.5, "valid_targets_min": 683 }, { "epoch": 6.937689969604863, "grad_norm": 0.43005172219863, "learning_rate": 1.0132405981195804e-08, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.13487809896469116, "step": 4565, "valid_targets_mean": 5104.1, "valid_targets_min": 2548 }, { "epoch": 6.945288753799392, "grad_norm": 0.5851616543398429, "learning_rate": 7.863676919031005e-09, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.13807334005832672, "step": 4570, "valid_targets_mean": 4572.6, "valid_targets_min": 792 }, { "epoch": 6.952887537993921, "grad_norm": 0.5007425137471639, "learning_rate": 5.882058550932268e-09, "loss": 0.1427, "loss_nan_ranks": 0, "loss_rank_avg": 0.1591353416442871, "step": 4575, "valid_targets_mean": 3956.2, "valid_targets_min": 447 }, { "epoch": 6.96048632218845, "grad_norm": 0.5253135197553259, "learning_rate": 4.187579335281911e-09, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.16565826535224915, "step": 4580, "valid_targets_mean": 3869.7, "valid_targets_min": 1117 }, { "epoch": 6.968085106382979, "grad_norm": 0.5136974200238252, "learning_rate": 2.780263606805278e-09, "loss": 0.1449, "loss_nan_ranks": 0, "loss_rank_avg": 0.1372585892677307, "step": 4585, "valid_targets_mean": 4006.6, "valid_targets_min": 538 }, { "epoch": 6.975683890577508, "grad_norm": 0.5478996499330996, "learning_rate": 1.6601315762154735e-09, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.1610221564769745, "step": 4590, "valid_targets_mean": 4602.3, "valid_targets_min": 741 }, { "epoch": 6.9832826747720365, "grad_norm": 0.48873947966074016, "learning_rate": 8.271993299358017e-10, "loss": 0.169, "loss_nan_ranks": 0, "loss_rank_avg": 0.16153308749198914, "step": 4595, "valid_targets_mean": 4922.5, "valid_targets_min": 589 }, { "epoch": 6.990881458966565, "grad_norm": 0.484585895107589, "learning_rate": 2.814788298532989e-10, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.14617104828357697, "step": 4600, "valid_targets_mean": 4203.9, "valid_targets_min": 714 }, { "epoch": 6.998480243161094, "grad_norm": 0.4567401537531439, "learning_rate": 2.2977913158861444e-11, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.15201044082641602, "step": 4605, "valid_targets_mean": 5189.9, "valid_targets_min": 511 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.1645904779434204, "step": 4606, "total_flos": 1702570888593408.0, "train_loss": 0.19200077259858897, "train_runtime": 28350.7795, "train_samples_per_second": 2.597, "train_steps_per_second": 0.162, "valid_targets_mean": 3879.8, "valid_targets_min": 728 } ], "logging_steps": 5, "max_steps": 4606, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1702570888593408.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }