{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 4004, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.008741258741258742, "grad_norm": 6.891807865886709, "learning_rate": 3.990024937655861e-07, "loss": 0.7806, "loss_nan_ranks": 0, "loss_rank_avg": 0.688166618347168, "step": 5, "valid_targets_mean": 4434.8, "valid_targets_min": 1164 }, { "epoch": 0.017482517482517484, "grad_norm": 10.07235768114182, "learning_rate": 8.977556109725687e-07, "loss": 0.7949, "loss_nan_ranks": 0, "loss_rank_avg": 0.6993734836578369, "step": 10, "valid_targets_mean": 2489.4, "valid_targets_min": 760 }, { "epoch": 0.026223776223776224, "grad_norm": 9.371443623670519, "learning_rate": 1.396508728179551e-06, "loss": 0.8104, "loss_nan_ranks": 0, "loss_rank_avg": 0.8695156574249268, "step": 15, "valid_targets_mean": 3041.5, "valid_targets_min": 1109 }, { "epoch": 0.03496503496503497, "grad_norm": 5.8828558878845, "learning_rate": 1.8952618453865338e-06, "loss": 0.7645, "loss_nan_ranks": 0, "loss_rank_avg": 0.820339024066925, "step": 20, "valid_targets_mean": 5423.1, "valid_targets_min": 1087 }, { "epoch": 0.043706293706293704, "grad_norm": 4.921738857282242, "learning_rate": 2.3940149625935166e-06, "loss": 0.7558, "loss_nan_ranks": 0, "loss_rank_avg": 0.75657057762146, "step": 25, "valid_targets_mean": 4129.1, "valid_targets_min": 1235 }, { "epoch": 0.05244755244755245, "grad_norm": 3.1722389939987297, "learning_rate": 2.892768079800499e-06, "loss": 0.7613, "loss_nan_ranks": 0, "loss_rank_avg": 0.7961629033088684, "step": 30, "valid_targets_mean": 5228.2, "valid_targets_min": 1258 }, { "epoch": 0.06118881118881119, "grad_norm": 2.483826973866041, "learning_rate": 3.391521197007482e-06, "loss": 0.6789, "loss_nan_ranks": 0, "loss_rank_avg": 0.6847758293151855, "step": 35, "valid_targets_mean": 3565.4, "valid_targets_min": 1135 }, { "epoch": 0.06993006993006994, "grad_norm": 1.7214635926067359, "learning_rate": 3.890274314214464e-06, "loss": 0.6961, "loss_nan_ranks": 0, "loss_rank_avg": 0.6839813590049744, "step": 40, "valid_targets_mean": 4050.9, "valid_targets_min": 1743 }, { "epoch": 0.07867132867132867, "grad_norm": 1.4291208613040705, "learning_rate": 4.389027431421446e-06, "loss": 0.6516, "loss_nan_ranks": 0, "loss_rank_avg": 0.7264044284820557, "step": 45, "valid_targets_mean": 4053.4, "valid_targets_min": 795 }, { "epoch": 0.08741258741258741, "grad_norm": 1.1744063794805446, "learning_rate": 4.887780548628429e-06, "loss": 0.6135, "loss_nan_ranks": 0, "loss_rank_avg": 0.5638917684555054, "step": 50, "valid_targets_mean": 2825.8, "valid_targets_min": 1378 }, { "epoch": 0.09615384615384616, "grad_norm": 1.27848851631508, "learning_rate": 5.386533665835411e-06, "loss": 0.6698, "loss_nan_ranks": 0, "loss_rank_avg": 0.8109359741210938, "step": 55, "valid_targets_mean": 6348.3, "valid_targets_min": 1256 }, { "epoch": 0.1048951048951049, "grad_norm": 0.880099323037957, "learning_rate": 5.885286783042394e-06, "loss": 0.6445, "loss_nan_ranks": 0, "loss_rank_avg": 0.6418143510818481, "step": 60, "valid_targets_mean": 5170.8, "valid_targets_min": 775 }, { "epoch": 0.11363636363636363, "grad_norm": 0.8423522806449167, "learning_rate": 6.384039900249377e-06, "loss": 0.5967, "loss_nan_ranks": 0, "loss_rank_avg": 0.6989394426345825, "step": 65, "valid_targets_mean": 4292.8, "valid_targets_min": 1137 }, { "epoch": 0.12237762237762238, "grad_norm": 0.8774344604276414, "learning_rate": 6.882793017456359e-06, "loss": 0.5712, "loss_nan_ranks": 0, "loss_rank_avg": 0.5156315565109253, "step": 70, "valid_targets_mean": 3363.1, "valid_targets_min": 1000 }, { "epoch": 0.13111888111888112, "grad_norm": 0.7471525308366247, "learning_rate": 7.381546134663342e-06, "loss": 0.5889, "loss_nan_ranks": 0, "loss_rank_avg": 0.524969220161438, "step": 75, "valid_targets_mean": 3267.2, "valid_targets_min": 437 }, { "epoch": 0.13986013986013987, "grad_norm": 0.6351105968482974, "learning_rate": 7.880299251870324e-06, "loss": 0.5783, "loss_nan_ranks": 0, "loss_rank_avg": 0.5628579258918762, "step": 80, "valid_targets_mean": 4445.7, "valid_targets_min": 1269 }, { "epoch": 0.1486013986013986, "grad_norm": 0.8435486850711871, "learning_rate": 8.379052369077308e-06, "loss": 0.5584, "loss_nan_ranks": 0, "loss_rank_avg": 0.5862073302268982, "step": 85, "valid_targets_mean": 3406.3, "valid_targets_min": 1195 }, { "epoch": 0.15734265734265734, "grad_norm": 0.7027259715932884, "learning_rate": 8.87780548628429e-06, "loss": 0.5716, "loss_nan_ranks": 0, "loss_rank_avg": 0.5122252702713013, "step": 90, "valid_targets_mean": 3020.4, "valid_targets_min": 816 }, { "epoch": 0.1660839160839161, "grad_norm": 0.7143768069579088, "learning_rate": 9.376558603491272e-06, "loss": 0.5652, "loss_nan_ranks": 0, "loss_rank_avg": 0.5643905401229858, "step": 95, "valid_targets_mean": 3280.6, "valid_targets_min": 1458 }, { "epoch": 0.17482517482517482, "grad_norm": 0.6466673146750979, "learning_rate": 9.875311720698254e-06, "loss": 0.5271, "loss_nan_ranks": 0, "loss_rank_avg": 0.5161752700805664, "step": 100, "valid_targets_mean": 3466.4, "valid_targets_min": 785 }, { "epoch": 0.18356643356643357, "grad_norm": 0.660607431222328, "learning_rate": 1.0374064837905238e-05, "loss": 0.5565, "loss_nan_ranks": 0, "loss_rank_avg": 0.49148479104042053, "step": 105, "valid_targets_mean": 2937.3, "valid_targets_min": 967 }, { "epoch": 0.19230769230769232, "grad_norm": 0.6418923782026298, "learning_rate": 1.087281795511222e-05, "loss": 0.4982, "loss_nan_ranks": 0, "loss_rank_avg": 0.53751540184021, "step": 110, "valid_targets_mean": 4915.1, "valid_targets_min": 753 }, { "epoch": 0.20104895104895104, "grad_norm": 0.5772065562262413, "learning_rate": 1.1371571072319202e-05, "loss": 0.4941, "loss_nan_ranks": 0, "loss_rank_avg": 0.5409708023071289, "step": 115, "valid_targets_mean": 4977.4, "valid_targets_min": 1187 }, { "epoch": 0.2097902097902098, "grad_norm": 0.6801379276243148, "learning_rate": 1.1870324189526186e-05, "loss": 0.4966, "loss_nan_ranks": 0, "loss_rank_avg": 0.5502436757087708, "step": 120, "valid_targets_mean": 4482.5, "valid_targets_min": 771 }, { "epoch": 0.21853146853146854, "grad_norm": 0.6133787753502925, "learning_rate": 1.2369077306733168e-05, "loss": 0.5088, "loss_nan_ranks": 0, "loss_rank_avg": 0.45697876811027527, "step": 125, "valid_targets_mean": 3453.1, "valid_targets_min": 1168 }, { "epoch": 0.22727272727272727, "grad_norm": 0.7592541102494601, "learning_rate": 1.286783042394015e-05, "loss": 0.4966, "loss_nan_ranks": 0, "loss_rank_avg": 0.4945298135280609, "step": 130, "valid_targets_mean": 5048.1, "valid_targets_min": 1529 }, { "epoch": 0.23601398601398602, "grad_norm": 0.6366182167764396, "learning_rate": 1.3366583541147134e-05, "loss": 0.4939, "loss_nan_ranks": 0, "loss_rank_avg": 0.5059365034103394, "step": 135, "valid_targets_mean": 4097.1, "valid_targets_min": 1112 }, { "epoch": 0.24475524475524477, "grad_norm": 0.6564205667008085, "learning_rate": 1.3865336658354116e-05, "loss": 0.4725, "loss_nan_ranks": 0, "loss_rank_avg": 0.44329914450645447, "step": 140, "valid_targets_mean": 2867.4, "valid_targets_min": 1213 }, { "epoch": 0.2534965034965035, "grad_norm": 0.6724554034077109, "learning_rate": 1.4364089775561098e-05, "loss": 0.538, "loss_nan_ranks": 0, "loss_rank_avg": 0.4999472200870514, "step": 145, "valid_targets_mean": 4216.0, "valid_targets_min": 1142 }, { "epoch": 0.26223776223776224, "grad_norm": 0.7059030471238626, "learning_rate": 1.486284289276808e-05, "loss": 0.4688, "loss_nan_ranks": 0, "loss_rank_avg": 0.48053932189941406, "step": 150, "valid_targets_mean": 2904.5, "valid_targets_min": 954 }, { "epoch": 0.270979020979021, "grad_norm": 0.7125138132476857, "learning_rate": 1.5361596009975064e-05, "loss": 0.499, "loss_nan_ranks": 0, "loss_rank_avg": 0.581404983997345, "step": 155, "valid_targets_mean": 4037.4, "valid_targets_min": 428 }, { "epoch": 0.27972027972027974, "grad_norm": 0.728117797766979, "learning_rate": 1.5860349127182046e-05, "loss": 0.4432, "loss_nan_ranks": 0, "loss_rank_avg": 0.4301885962486267, "step": 160, "valid_targets_mean": 2771.1, "valid_targets_min": 1129 }, { "epoch": 0.28846153846153844, "grad_norm": 0.715988515093435, "learning_rate": 1.635910224438903e-05, "loss": 0.4658, "loss_nan_ranks": 0, "loss_rank_avg": 0.4865019917488098, "step": 165, "valid_targets_mean": 3270.8, "valid_targets_min": 783 }, { "epoch": 0.2972027972027972, "grad_norm": 0.6269860955107454, "learning_rate": 1.685785536159601e-05, "loss": 0.4362, "loss_nan_ranks": 0, "loss_rank_avg": 0.4705418646335602, "step": 170, "valid_targets_mean": 4284.6, "valid_targets_min": 1122 }, { "epoch": 0.30594405594405594, "grad_norm": 0.5592398328135262, "learning_rate": 1.7356608478802993e-05, "loss": 0.4659, "loss_nan_ranks": 0, "loss_rank_avg": 0.3761853873729706, "step": 175, "valid_targets_mean": 3507.1, "valid_targets_min": 711 }, { "epoch": 0.3146853146853147, "grad_norm": 0.6467612787611225, "learning_rate": 1.7855361596009978e-05, "loss": 0.4857, "loss_nan_ranks": 0, "loss_rank_avg": 0.5388031005859375, "step": 180, "valid_targets_mean": 4472.5, "valid_targets_min": 1251 }, { "epoch": 0.32342657342657344, "grad_norm": 0.7059874120353821, "learning_rate": 1.835411471321696e-05, "loss": 0.4413, "loss_nan_ranks": 0, "loss_rank_avg": 0.4448562562465668, "step": 185, "valid_targets_mean": 3762.6, "valid_targets_min": 317 }, { "epoch": 0.3321678321678322, "grad_norm": 0.647197969313476, "learning_rate": 1.8852867830423942e-05, "loss": 0.4846, "loss_nan_ranks": 0, "loss_rank_avg": 0.5174081921577454, "step": 190, "valid_targets_mean": 4593.6, "valid_targets_min": 848 }, { "epoch": 0.3409090909090909, "grad_norm": 0.758407351151443, "learning_rate": 1.9351620947630925e-05, "loss": 0.4638, "loss_nan_ranks": 0, "loss_rank_avg": 0.4045215845108032, "step": 195, "valid_targets_mean": 2296.8, "valid_targets_min": 870 }, { "epoch": 0.34965034965034963, "grad_norm": 0.6647262744061739, "learning_rate": 1.9850374064837907e-05, "loss": 0.452, "loss_nan_ranks": 0, "loss_rank_avg": 0.4018682539463043, "step": 200, "valid_targets_mean": 3484.7, "valid_targets_min": 1374 }, { "epoch": 0.3583916083916084, "grad_norm": 0.8052379949927564, "learning_rate": 2.034912718204489e-05, "loss": 0.5022, "loss_nan_ranks": 0, "loss_rank_avg": 0.4757809638977051, "step": 205, "valid_targets_mean": 2731.2, "valid_targets_min": 1124 }, { "epoch": 0.36713286713286714, "grad_norm": 0.5730191757062828, "learning_rate": 2.084788029925187e-05, "loss": 0.4553, "loss_nan_ranks": 0, "loss_rank_avg": 0.49919718503952026, "step": 210, "valid_targets_mean": 5203.2, "valid_targets_min": 1011 }, { "epoch": 0.3758741258741259, "grad_norm": 0.6122316092766614, "learning_rate": 2.1346633416458853e-05, "loss": 0.461, "loss_nan_ranks": 0, "loss_rank_avg": 0.5063073635101318, "step": 215, "valid_targets_mean": 6397.0, "valid_targets_min": 1352 }, { "epoch": 0.38461538461538464, "grad_norm": 0.7049095990494619, "learning_rate": 2.1845386533665835e-05, "loss": 0.416, "loss_nan_ranks": 0, "loss_rank_avg": 0.5339525938034058, "step": 220, "valid_targets_mean": 4158.1, "valid_targets_min": 823 }, { "epoch": 0.39335664335664333, "grad_norm": 0.698438091999467, "learning_rate": 2.2344139650872817e-05, "loss": 0.4574, "loss_nan_ranks": 0, "loss_rank_avg": 0.47370338439941406, "step": 225, "valid_targets_mean": 3506.1, "valid_targets_min": 1179 }, { "epoch": 0.4020979020979021, "grad_norm": 0.7054393747626264, "learning_rate": 2.28428927680798e-05, "loss": 0.4607, "loss_nan_ranks": 0, "loss_rank_avg": 0.4713825285434723, "step": 230, "valid_targets_mean": 3467.7, "valid_targets_min": 769 }, { "epoch": 0.41083916083916083, "grad_norm": 0.6398523387870552, "learning_rate": 2.3341645885286785e-05, "loss": 0.4693, "loss_nan_ranks": 0, "loss_rank_avg": 0.49769261479377747, "step": 235, "valid_targets_mean": 5616.6, "valid_targets_min": 1339 }, { "epoch": 0.4195804195804196, "grad_norm": 0.5779595979100703, "learning_rate": 2.3840399002493767e-05, "loss": 0.4295, "loss_nan_ranks": 0, "loss_rank_avg": 0.42991095781326294, "step": 240, "valid_targets_mean": 4796.9, "valid_targets_min": 1399 }, { "epoch": 0.42832167832167833, "grad_norm": 0.7018424514021866, "learning_rate": 2.433915211970075e-05, "loss": 0.4287, "loss_nan_ranks": 0, "loss_rank_avg": 0.416814386844635, "step": 245, "valid_targets_mean": 3066.3, "valid_targets_min": 1091 }, { "epoch": 0.4370629370629371, "grad_norm": 0.7070083860196137, "learning_rate": 2.483790523690773e-05, "loss": 0.4089, "loss_nan_ranks": 0, "loss_rank_avg": 0.42583611607551575, "step": 250, "valid_targets_mean": 3095.8, "valid_targets_min": 836 }, { "epoch": 0.4458041958041958, "grad_norm": 0.6542255655325461, "learning_rate": 2.5336658354114713e-05, "loss": 0.4766, "loss_nan_ranks": 0, "loss_rank_avg": 0.4974190890789032, "step": 255, "valid_targets_mean": 4516.5, "valid_targets_min": 1431 }, { "epoch": 0.45454545454545453, "grad_norm": 0.6057280619187766, "learning_rate": 2.5835411471321695e-05, "loss": 0.4346, "loss_nan_ranks": 0, "loss_rank_avg": 0.494473934173584, "step": 260, "valid_targets_mean": 4743.2, "valid_targets_min": 1768 }, { "epoch": 0.4632867132867133, "grad_norm": 0.6576098745294991, "learning_rate": 2.6334164588528677e-05, "loss": 0.4003, "loss_nan_ranks": 0, "loss_rank_avg": 0.39938753843307495, "step": 265, "valid_targets_mean": 3158.4, "valid_targets_min": 1073 }, { "epoch": 0.47202797202797203, "grad_norm": 0.6101915400033449, "learning_rate": 2.6832917705735663e-05, "loss": 0.4526, "loss_nan_ranks": 0, "loss_rank_avg": 0.4094006419181824, "step": 270, "valid_targets_mean": 4226.7, "valid_targets_min": 1197 }, { "epoch": 0.4807692307692308, "grad_norm": 0.692943572411887, "learning_rate": 2.7331670822942645e-05, "loss": 0.4704, "loss_nan_ranks": 0, "loss_rank_avg": 0.42553043365478516, "step": 275, "valid_targets_mean": 3468.1, "valid_targets_min": 866 }, { "epoch": 0.48951048951048953, "grad_norm": 0.625051535199143, "learning_rate": 2.7830423940149627e-05, "loss": 0.4102, "loss_nan_ranks": 0, "loss_rank_avg": 0.4416755139827728, "step": 280, "valid_targets_mean": 4131.4, "valid_targets_min": 274 }, { "epoch": 0.4982517482517482, "grad_norm": 0.6202235346478298, "learning_rate": 2.832917705735661e-05, "loss": 0.4464, "loss_nan_ranks": 0, "loss_rank_avg": 0.38613349199295044, "step": 285, "valid_targets_mean": 3556.7, "valid_targets_min": 1975 }, { "epoch": 0.506993006993007, "grad_norm": 0.6373806668498091, "learning_rate": 2.882793017456359e-05, "loss": 0.4648, "loss_nan_ranks": 0, "loss_rank_avg": 0.3658190369606018, "step": 290, "valid_targets_mean": 3424.1, "valid_targets_min": 985 }, { "epoch": 0.5157342657342657, "grad_norm": 0.6404836592194673, "learning_rate": 2.9326683291770573e-05, "loss": 0.3999, "loss_nan_ranks": 0, "loss_rank_avg": 0.4423462748527527, "step": 295, "valid_targets_mean": 3966.9, "valid_targets_min": 699 }, { "epoch": 0.5244755244755245, "grad_norm": 0.6065384985472947, "learning_rate": 2.982543640897756e-05, "loss": 0.402, "loss_nan_ranks": 0, "loss_rank_avg": 0.478157639503479, "step": 300, "valid_targets_mean": 4951.2, "valid_targets_min": 794 }, { "epoch": 0.5332167832167832, "grad_norm": 0.7363666663898127, "learning_rate": 3.032418952618454e-05, "loss": 0.4199, "loss_nan_ranks": 0, "loss_rank_avg": 0.44249227643013, "step": 305, "valid_targets_mean": 3142.7, "valid_targets_min": 350 }, { "epoch": 0.541958041958042, "grad_norm": 0.7419524259349666, "learning_rate": 3.082294264339152e-05, "loss": 0.4473, "loss_nan_ranks": 0, "loss_rank_avg": 0.3787216246128082, "step": 310, "valid_targets_mean": 2529.6, "valid_targets_min": 593 }, { "epoch": 0.5506993006993007, "grad_norm": 0.6373826151069447, "learning_rate": 3.13216957605985e-05, "loss": 0.4175, "loss_nan_ranks": 0, "loss_rank_avg": 0.48238128423690796, "step": 315, "valid_targets_mean": 4511.8, "valid_targets_min": 1360 }, { "epoch": 0.5594405594405595, "grad_norm": 0.6890339528272231, "learning_rate": 3.182044887780549e-05, "loss": 0.4172, "loss_nan_ranks": 0, "loss_rank_avg": 0.4121536612510681, "step": 320, "valid_targets_mean": 3423.4, "valid_targets_min": 361 }, { "epoch": 0.5681818181818182, "grad_norm": 0.6709193485672122, "learning_rate": 3.231920199501247e-05, "loss": 0.4201, "loss_nan_ranks": 0, "loss_rank_avg": 0.4338151216506958, "step": 325, "valid_targets_mean": 3460.5, "valid_targets_min": 1175 }, { "epoch": 0.5769230769230769, "grad_norm": 0.5691860103331635, "learning_rate": 3.281795511221945e-05, "loss": 0.4425, "loss_nan_ranks": 0, "loss_rank_avg": 0.4696723520755768, "step": 330, "valid_targets_mean": 4651.1, "valid_targets_min": 1325 }, { "epoch": 0.5856643356643356, "grad_norm": 0.6081921585343787, "learning_rate": 3.331670822942644e-05, "loss": 0.4207, "loss_nan_ranks": 0, "loss_rank_avg": 0.46315813064575195, "step": 335, "valid_targets_mean": 4476.0, "valid_targets_min": 1014 }, { "epoch": 0.5944055944055944, "grad_norm": 0.6569386219652944, "learning_rate": 3.3815461346633416e-05, "loss": 0.4259, "loss_nan_ranks": 0, "loss_rank_avg": 0.4307020902633667, "step": 340, "valid_targets_mean": 3833.4, "valid_targets_min": 942 }, { "epoch": 0.6031468531468531, "grad_norm": 0.5939332314153571, "learning_rate": 3.43142144638404e-05, "loss": 0.4181, "loss_nan_ranks": 0, "loss_rank_avg": 0.4571363925933838, "step": 345, "valid_targets_mean": 4945.1, "valid_targets_min": 970 }, { "epoch": 0.6118881118881119, "grad_norm": 0.5969183422034433, "learning_rate": 3.481296758104738e-05, "loss": 0.4408, "loss_nan_ranks": 0, "loss_rank_avg": 0.4501033127307892, "step": 350, "valid_targets_mean": 4973.1, "valid_targets_min": 1044 }, { "epoch": 0.6206293706293706, "grad_norm": 0.5757241278002854, "learning_rate": 3.5311720698254365e-05, "loss": 0.4381, "loss_nan_ranks": 0, "loss_rank_avg": 0.43396443128585815, "step": 355, "valid_targets_mean": 4245.8, "valid_targets_min": 1144 }, { "epoch": 0.6293706293706294, "grad_norm": 0.6280624127149288, "learning_rate": 3.581047381546135e-05, "loss": 0.4111, "loss_nan_ranks": 0, "loss_rank_avg": 0.3709952235221863, "step": 360, "valid_targets_mean": 3450.9, "valid_targets_min": 1038 }, { "epoch": 0.6381118881118881, "grad_norm": 0.6272407181268593, "learning_rate": 3.630922693266833e-05, "loss": 0.4238, "loss_nan_ranks": 0, "loss_rank_avg": 0.4287092685699463, "step": 365, "valid_targets_mean": 3760.8, "valid_targets_min": 1263 }, { "epoch": 0.6468531468531469, "grad_norm": 0.6303444859879423, "learning_rate": 3.6807980049875315e-05, "loss": 0.4292, "loss_nan_ranks": 0, "loss_rank_avg": 0.4412212371826172, "step": 370, "valid_targets_mean": 3570.2, "valid_targets_min": 632 }, { "epoch": 0.6555944055944056, "grad_norm": 0.5953844799248368, "learning_rate": 3.7306733167082294e-05, "loss": 0.3885, "loss_nan_ranks": 0, "loss_rank_avg": 0.43160712718963623, "step": 375, "valid_targets_mean": 4197.4, "valid_targets_min": 1396 }, { "epoch": 0.6643356643356644, "grad_norm": 0.6082707171096963, "learning_rate": 3.780548628428928e-05, "loss": 0.4052, "loss_nan_ranks": 0, "loss_rank_avg": 0.3460230529308319, "step": 380, "valid_targets_mean": 3363.0, "valid_targets_min": 872 }, { "epoch": 0.6730769230769231, "grad_norm": 0.5998396388984467, "learning_rate": 3.8304239401496265e-05, "loss": 0.3892, "loss_nan_ranks": 0, "loss_rank_avg": 0.4442782998085022, "step": 385, "valid_targets_mean": 4488.0, "valid_targets_min": 396 }, { "epoch": 0.6818181818181818, "grad_norm": 0.6607949283944162, "learning_rate": 3.8802992518703244e-05, "loss": 0.3803, "loss_nan_ranks": 0, "loss_rank_avg": 0.35880744457244873, "step": 390, "valid_targets_mean": 2970.6, "valid_targets_min": 1071 }, { "epoch": 0.6905594405594405, "grad_norm": 0.6900570931097955, "learning_rate": 3.930174563591023e-05, "loss": 0.4064, "loss_nan_ranks": 0, "loss_rank_avg": 0.36735618114471436, "step": 395, "valid_targets_mean": 3114.1, "valid_targets_min": 1095 }, { "epoch": 0.6993006993006993, "grad_norm": 0.6914449468836832, "learning_rate": 3.980049875311721e-05, "loss": 0.3688, "loss_nan_ranks": 0, "loss_rank_avg": 0.2671054005622864, "step": 400, "valid_targets_mean": 2244.2, "valid_targets_min": 875 }, { "epoch": 0.708041958041958, "grad_norm": 0.7160530816069505, "learning_rate": 3.999993157520847e-05, "loss": 0.413, "loss_nan_ranks": 0, "loss_rank_avg": 0.5022163391113281, "step": 405, "valid_targets_mean": 5052.9, "valid_targets_min": 659 }, { "epoch": 0.7167832167832168, "grad_norm": 0.8302002805431459, "learning_rate": 3.999951342540017e-05, "loss": 0.4308, "loss_nan_ranks": 0, "loss_rank_avg": 0.48281511664390564, "step": 410, "valid_targets_mean": 4652.4, "valid_targets_min": 913 }, { "epoch": 0.7255244755244755, "grad_norm": 0.5546189149897846, "learning_rate": 3.999871514749473e-05, "loss": 0.4438, "loss_nan_ranks": 0, "loss_rank_avg": 0.3389652669429779, "step": 415, "valid_targets_mean": 4212.8, "valid_targets_min": 758 }, { "epoch": 0.7342657342657343, "grad_norm": 0.5634394054527263, "learning_rate": 3.999753675666491e-05, "loss": 0.4093, "loss_nan_ranks": 0, "loss_rank_avg": 0.41193175315856934, "step": 420, "valid_targets_mean": 5020.0, "valid_targets_min": 885 }, { "epoch": 0.743006993006993, "grad_norm": 0.7004352845216515, "learning_rate": 3.9995978275308226e-05, "loss": 0.4024, "loss_nan_ranks": 0, "loss_rank_avg": 0.4134072959423065, "step": 425, "valid_targets_mean": 3430.8, "valid_targets_min": 1156 }, { "epoch": 0.7517482517482518, "grad_norm": 0.6196320289647665, "learning_rate": 3.999403973304654e-05, "loss": 0.4477, "loss_nan_ranks": 0, "loss_rank_avg": 0.3583190441131592, "step": 430, "valid_targets_mean": 3033.9, "valid_targets_min": 1023 }, { "epoch": 0.7604895104895105, "grad_norm": 0.5773913116859302, "learning_rate": 3.999172116672545e-05, "loss": 0.4322, "loss_nan_ranks": 0, "loss_rank_avg": 0.397724449634552, "step": 435, "valid_targets_mean": 4305.8, "valid_targets_min": 857 }, { "epoch": 0.7692307692307693, "grad_norm": 0.9368889840219, "learning_rate": 3.9989022620413646e-05, "loss": 0.3866, "loss_nan_ranks": 0, "loss_rank_avg": 0.43847835063934326, "step": 440, "valid_targets_mean": 4250.9, "valid_targets_min": 1030 }, { "epoch": 0.777972027972028, "grad_norm": 0.6324915742383318, "learning_rate": 3.998594414540204e-05, "loss": 0.4222, "loss_nan_ranks": 0, "loss_rank_avg": 0.2982059121131897, "step": 445, "valid_targets_mean": 2808.2, "valid_targets_min": 1264 }, { "epoch": 0.7867132867132867, "grad_norm": 0.7217580076816469, "learning_rate": 3.99824858002028e-05, "loss": 0.3705, "loss_nan_ranks": 0, "loss_rank_avg": 0.43571165204048157, "step": 450, "valid_targets_mean": 3194.4, "valid_targets_min": 765 }, { "epoch": 0.7954545454545454, "grad_norm": 0.6237816031652519, "learning_rate": 3.9978647650548225e-05, "loss": 0.3564, "loss_nan_ranks": 0, "loss_rank_avg": 0.3463501036167145, "step": 455, "valid_targets_mean": 3051.4, "valid_targets_min": 911 }, { "epoch": 0.8041958041958042, "grad_norm": 0.6681795392176033, "learning_rate": 3.9974429769389524e-05, "loss": 0.3839, "loss_nan_ranks": 0, "loss_rank_avg": 0.3593922555446625, "step": 460, "valid_targets_mean": 3530.2, "valid_targets_min": 1062 }, { "epoch": 0.8129370629370629, "grad_norm": 0.6468833105433451, "learning_rate": 3.996983223689541e-05, "loss": 0.4033, "loss_nan_ranks": 0, "loss_rank_avg": 0.3399583101272583, "step": 465, "valid_targets_mean": 2962.4, "valid_targets_min": 941 }, { "epoch": 0.8216783216783217, "grad_norm": 0.5620199704651588, "learning_rate": 3.9964855140450556e-05, "loss": 0.4159, "loss_nan_ranks": 0, "loss_rank_avg": 0.43714678287506104, "step": 470, "valid_targets_mean": 5177.6, "valid_targets_min": 400 }, { "epoch": 0.8304195804195804, "grad_norm": 0.6050684953003372, "learning_rate": 3.995949857465399e-05, "loss": 0.3659, "loss_nan_ranks": 0, "loss_rank_avg": 0.40957096219062805, "step": 475, "valid_targets_mean": 3481.8, "valid_targets_min": 907 }, { "epoch": 0.8391608391608392, "grad_norm": 0.5881967704006619, "learning_rate": 3.995376264131723e-05, "loss": 0.4496, "loss_nan_ranks": 0, "loss_rank_avg": 0.4586448073387146, "step": 480, "valid_targets_mean": 4609.4, "valid_targets_min": 875 }, { "epoch": 0.8479020979020979, "grad_norm": 0.5322379740150757, "learning_rate": 3.994764744946242e-05, "loss": 0.3688, "loss_nan_ranks": 0, "loss_rank_avg": 0.3586678206920624, "step": 485, "valid_targets_mean": 4380.9, "valid_targets_min": 988 }, { "epoch": 0.8566433566433567, "grad_norm": 0.5525711150756555, "learning_rate": 3.994115311532018e-05, "loss": 0.3889, "loss_nan_ranks": 0, "loss_rank_avg": 0.3657156229019165, "step": 490, "valid_targets_mean": 4059.6, "valid_targets_min": 776 }, { "epoch": 0.8653846153846154, "grad_norm": 0.6513120586241753, "learning_rate": 3.993427976232748e-05, "loss": 0.3798, "loss_nan_ranks": 0, "loss_rank_avg": 0.41130882501602173, "step": 495, "valid_targets_mean": 3188.6, "valid_targets_min": 1226 }, { "epoch": 0.8741258741258742, "grad_norm": 0.6127418213610771, "learning_rate": 3.99270275211252e-05, "loss": 0.4165, "loss_nan_ranks": 0, "loss_rank_avg": 0.4457509219646454, "step": 500, "valid_targets_mean": 4294.4, "valid_targets_min": 1023 }, { "epoch": 0.8828671328671329, "grad_norm": 0.6484091198476236, "learning_rate": 3.9919396529555754e-05, "loss": 0.4581, "loss_nan_ranks": 0, "loss_rank_avg": 0.44694262742996216, "step": 505, "valid_targets_mean": 3536.8, "valid_targets_min": 1392 }, { "epoch": 0.8916083916083916, "grad_norm": 0.630930600673457, "learning_rate": 3.991138693266037e-05, "loss": 0.3405, "loss_nan_ranks": 0, "loss_rank_avg": 0.3340379595756531, "step": 510, "valid_targets_mean": 2815.2, "valid_targets_min": 1008 }, { "epoch": 0.9003496503496503, "grad_norm": 0.6303251542828444, "learning_rate": 3.990299888267639e-05, "loss": 0.4278, "loss_nan_ranks": 0, "loss_rank_avg": 0.4999693036079407, "step": 515, "valid_targets_mean": 5249.6, "valid_targets_min": 1123 }, { "epoch": 0.9090909090909091, "grad_norm": 0.6382900314128872, "learning_rate": 3.9894232539034376e-05, "loss": 0.4116, "loss_nan_ranks": 0, "loss_rank_avg": 0.39463382959365845, "step": 520, "valid_targets_mean": 3450.0, "valid_targets_min": 721 }, { "epoch": 0.9178321678321678, "grad_norm": 0.5751517540128765, "learning_rate": 3.9885088068355046e-05, "loss": 0.4414, "loss_nan_ranks": 0, "loss_rank_avg": 0.4512973427772522, "step": 525, "valid_targets_mean": 5112.5, "valid_targets_min": 1534 }, { "epoch": 0.9265734265734266, "grad_norm": 0.7081469703641994, "learning_rate": 3.9875565644446165e-05, "loss": 0.4415, "loss_nan_ranks": 0, "loss_rank_avg": 0.4004817306995392, "step": 530, "valid_targets_mean": 3352.9, "valid_targets_min": 1239 }, { "epoch": 0.9353146853146853, "grad_norm": 0.644292943390024, "learning_rate": 3.986566544829915e-05, "loss": 0.3654, "loss_nan_ranks": 0, "loss_rank_avg": 0.3852795958518982, "step": 535, "valid_targets_mean": 3494.4, "valid_targets_min": 1279 }, { "epoch": 0.9440559440559441, "grad_norm": 0.5674453210768845, "learning_rate": 3.9855387668085733e-05, "loss": 0.3847, "loss_nan_ranks": 0, "loss_rank_avg": 0.3958588242530823, "step": 540, "valid_targets_mean": 4133.1, "valid_targets_min": 1497 }, { "epoch": 0.9527972027972028, "grad_norm": 0.6005492272047183, "learning_rate": 3.984473249915432e-05, "loss": 0.3475, "loss_nan_ranks": 0, "loss_rank_avg": 0.4054728150367737, "step": 545, "valid_targets_mean": 3535.9, "valid_targets_min": 1910 }, { "epoch": 0.9615384615384616, "grad_norm": 0.5958464349073712, "learning_rate": 3.983370014402629e-05, "loss": 0.3792, "loss_nan_ranks": 0, "loss_rank_avg": 0.3395378589630127, "step": 550, "valid_targets_mean": 4115.0, "valid_targets_min": 924 }, { "epoch": 0.9702797202797203, "grad_norm": 0.5549227602894283, "learning_rate": 3.982229081239214e-05, "loss": 0.4286, "loss_nan_ranks": 0, "loss_rank_avg": 0.4644068479537964, "step": 555, "valid_targets_mean": 5402.5, "valid_targets_min": 860 }, { "epoch": 0.9790209790209791, "grad_norm": 0.5798046099495293, "learning_rate": 3.981050472110753e-05, "loss": 0.3703, "loss_nan_ranks": 0, "loss_rank_avg": 0.38240253925323486, "step": 560, "valid_targets_mean": 3724.3, "valid_targets_min": 1237 }, { "epoch": 0.9877622377622378, "grad_norm": 0.6238998765833637, "learning_rate": 3.979834209418914e-05, "loss": 0.4027, "loss_nan_ranks": 0, "loss_rank_avg": 0.42617619037628174, "step": 565, "valid_targets_mean": 4521.6, "valid_targets_min": 740 }, { "epoch": 0.9965034965034965, "grad_norm": 0.6024006428537647, "learning_rate": 3.97858031628104e-05, "loss": 0.4082, "loss_nan_ranks": 0, "loss_rank_avg": 0.49112826585769653, "step": 570, "valid_targets_mean": 5095.2, "valid_targets_min": 1146 }, { "epoch": 1.0052447552447552, "grad_norm": 0.6342997589440736, "learning_rate": 3.977288816529711e-05, "loss": 0.3258, "loss_nan_ranks": 0, "loss_rank_avg": 0.3129345178604126, "step": 575, "valid_targets_mean": 2719.0, "valid_targets_min": 968 }, { "epoch": 1.013986013986014, "grad_norm": 0.629458660323066, "learning_rate": 3.975959734712293e-05, "loss": 0.406, "loss_nan_ranks": 0, "loss_rank_avg": 0.3763844668865204, "step": 580, "valid_targets_mean": 3271.1, "valid_targets_min": 402 }, { "epoch": 1.0227272727272727, "grad_norm": 0.656404561523582, "learning_rate": 3.974593096090465e-05, "loss": 0.3476, "loss_nan_ranks": 0, "loss_rank_avg": 0.31588298082351685, "step": 585, "valid_targets_mean": 2591.9, "valid_targets_min": 659 }, { "epoch": 1.0314685314685315, "grad_norm": 0.7256823083367988, "learning_rate": 3.973188926639749e-05, "loss": 0.3918, "loss_nan_ranks": 0, "loss_rank_avg": 0.45462703704833984, "step": 590, "valid_targets_mean": 3205.2, "valid_targets_min": 1217 }, { "epoch": 1.0402097902097902, "grad_norm": 0.5895144169036058, "learning_rate": 3.971747253049004e-05, "loss": 0.381, "loss_nan_ranks": 0, "loss_rank_avg": 0.3712193965911865, "step": 595, "valid_targets_mean": 3694.0, "valid_targets_min": 1084 }, { "epoch": 1.048951048951049, "grad_norm": 0.5690400741815232, "learning_rate": 3.9702681027199315e-05, "loss": 0.3814, "loss_nan_ranks": 0, "loss_rank_avg": 0.427038311958313, "step": 600, "valid_targets_mean": 4761.9, "valid_targets_min": 1074 }, { "epoch": 1.0576923076923077, "grad_norm": 0.638796668052871, "learning_rate": 3.968751503766544e-05, "loss": 0.3895, "loss_nan_ranks": 0, "loss_rank_avg": 0.3525705337524414, "step": 605, "valid_targets_mean": 3294.1, "valid_targets_min": 1100 }, { "epoch": 1.0664335664335665, "grad_norm": 0.5612529799321073, "learning_rate": 3.967197485014637e-05, "loss": 0.3967, "loss_nan_ranks": 0, "loss_rank_avg": 0.40732014179229736, "step": 610, "valid_targets_mean": 4946.8, "valid_targets_min": 829 }, { "epoch": 1.0751748251748252, "grad_norm": 0.5332511823970404, "learning_rate": 3.9656060760012386e-05, "loss": 0.3887, "loss_nan_ranks": 0, "loss_rank_avg": 0.3988763093948364, "step": 615, "valid_targets_mean": 4778.2, "valid_targets_min": 1161 }, { "epoch": 1.083916083916084, "grad_norm": 0.9907300506794291, "learning_rate": 3.9639773069740484e-05, "loss": 0.3474, "loss_nan_ranks": 0, "loss_rank_avg": 0.348149836063385, "step": 620, "valid_targets_mean": 3704.6, "valid_targets_min": 1498 }, { "epoch": 1.0926573426573427, "grad_norm": 0.6489040626377737, "learning_rate": 3.9623112088908627e-05, "loss": 0.3851, "loss_nan_ranks": 0, "loss_rank_avg": 0.22918564081192017, "step": 625, "valid_targets_mean": 2000.0, "valid_targets_min": 864 }, { "epoch": 1.1013986013986015, "grad_norm": 0.5178066275559241, "learning_rate": 3.960607813418987e-05, "loss": 0.3858, "loss_nan_ranks": 0, "loss_rank_avg": 0.4411054849624634, "step": 630, "valid_targets_mean": 6213.5, "valid_targets_min": 1224 }, { "epoch": 1.1101398601398602, "grad_norm": 0.586299273251672, "learning_rate": 3.9588671529346345e-05, "loss": 0.3361, "loss_nan_ranks": 0, "loss_rank_avg": 0.4047016203403473, "step": 635, "valid_targets_mean": 4316.3, "valid_targets_min": 1014 }, { "epoch": 1.118881118881119, "grad_norm": 0.6006735013024012, "learning_rate": 3.957089260522306e-05, "loss": 0.347, "loss_nan_ranks": 0, "loss_rank_avg": 0.3549342155456543, "step": 640, "valid_targets_mean": 3763.6, "valid_targets_min": 1124 }, { "epoch": 1.1276223776223777, "grad_norm": 0.6863014700797007, "learning_rate": 3.9552741699741674e-05, "loss": 0.3996, "loss_nan_ranks": 0, "loss_rank_avg": 0.452499657869339, "step": 645, "valid_targets_mean": 3432.2, "valid_targets_min": 281 }, { "epoch": 1.1363636363636362, "grad_norm": 0.6285631579650135, "learning_rate": 3.953421915789403e-05, "loss": 0.3744, "loss_nan_ranks": 0, "loss_rank_avg": 0.3433941602706909, "step": 650, "valid_targets_mean": 2940.2, "valid_targets_min": 727 }, { "epoch": 1.145104895104895, "grad_norm": 0.6198040249923603, "learning_rate": 3.9515325331735635e-05, "loss": 0.3474, "loss_nan_ranks": 0, "loss_rank_avg": 0.36902672052383423, "step": 655, "valid_targets_mean": 3038.7, "valid_targets_min": 1422 }, { "epoch": 1.1538461538461537, "grad_norm": 0.5020755508723698, "learning_rate": 3.949606058037893e-05, "loss": 0.3811, "loss_nan_ranks": 0, "loss_rank_avg": 0.3350529670715332, "step": 660, "valid_targets_mean": 4884.1, "valid_targets_min": 1339 }, { "epoch": 1.1625874125874125, "grad_norm": 0.5538973265752763, "learning_rate": 3.947642526998649e-05, "loss": 0.357, "loss_nan_ranks": 0, "loss_rank_avg": 0.38185301423072815, "step": 665, "valid_targets_mean": 4053.4, "valid_targets_min": 711 }, { "epoch": 1.1713286713286712, "grad_norm": 0.6390899954407651, "learning_rate": 3.945641977376404e-05, "loss": 0.3731, "loss_nan_ranks": 0, "loss_rank_avg": 0.4220157265663147, "step": 670, "valid_targets_mean": 4628.8, "valid_targets_min": 1091 }, { "epoch": 1.18006993006993, "grad_norm": 0.6411330384913675, "learning_rate": 3.94360444719534e-05, "loss": 0.4001, "loss_nan_ranks": 0, "loss_rank_avg": 0.4042211174964905, "step": 675, "valid_targets_mean": 3807.4, "valid_targets_min": 1606 }, { "epoch": 1.1888111888111887, "grad_norm": 0.6039498968928956, "learning_rate": 3.941529975182524e-05, "loss": 0.3622, "loss_nan_ranks": 0, "loss_rank_avg": 0.40398502349853516, "step": 680, "valid_targets_mean": 4085.2, "valid_targets_min": 831 }, { "epoch": 1.1975524475524475, "grad_norm": 0.5877952077296495, "learning_rate": 3.939418600767168e-05, "loss": 0.3757, "loss_nan_ranks": 0, "loss_rank_avg": 0.4611789584159851, "step": 685, "valid_targets_mean": 4750.3, "valid_targets_min": 1151 }, { "epoch": 1.2062937062937062, "grad_norm": 0.6355903559851636, "learning_rate": 3.937270364079886e-05, "loss": 0.3513, "loss_nan_ranks": 0, "loss_rank_avg": 0.31703072786331177, "step": 690, "valid_targets_mean": 3618.4, "valid_targets_min": 1137 }, { "epoch": 1.215034965034965, "grad_norm": 0.6128675990146162, "learning_rate": 3.935085305951929e-05, "loss": 0.3937, "loss_nan_ranks": 0, "loss_rank_avg": 0.4473511874675751, "step": 695, "valid_targets_mean": 3876.3, "valid_targets_min": 1234 }, { "epoch": 1.2237762237762237, "grad_norm": 0.6112543941773279, "learning_rate": 3.932863467914405e-05, "loss": 0.359, "loss_nan_ranks": 0, "loss_rank_avg": 0.36574071645736694, "step": 700, "valid_targets_mean": 3475.4, "valid_targets_min": 898 }, { "epoch": 1.2325174825174825, "grad_norm": 0.6808146656666811, "learning_rate": 3.930604892197496e-05, "loss": 0.3789, "loss_nan_ranks": 0, "loss_rank_avg": 0.4020303785800934, "step": 705, "valid_targets_mean": 3257.4, "valid_targets_min": 904 }, { "epoch": 1.2412587412587412, "grad_norm": 0.6143751077595933, "learning_rate": 3.9283096217296496e-05, "loss": 0.3558, "loss_nan_ranks": 0, "loss_rank_avg": 0.38672855496406555, "step": 710, "valid_targets_mean": 3559.6, "valid_targets_min": 933 }, { "epoch": 1.25, "grad_norm": 0.638690578066305, "learning_rate": 3.925977700136768e-05, "loss": 0.3882, "loss_nan_ranks": 0, "loss_rank_avg": 0.39257192611694336, "step": 715, "valid_targets_mean": 3589.1, "valid_targets_min": 940 }, { "epoch": 1.2587412587412588, "grad_norm": 0.5457598428008629, "learning_rate": 3.923609171741374e-05, "loss": 0.3654, "loss_nan_ranks": 0, "loss_rank_avg": 0.3970078229904175, "step": 720, "valid_targets_mean": 4277.0, "valid_targets_min": 286 }, { "epoch": 1.2674825174825175, "grad_norm": 0.502276044700275, "learning_rate": 3.921204081561774e-05, "loss": 0.3799, "loss_nan_ranks": 0, "loss_rank_avg": 0.30176183581352234, "step": 725, "valid_targets_mean": 4076.9, "valid_targets_min": 875 }, { "epoch": 1.2762237762237763, "grad_norm": 0.6472659228715367, "learning_rate": 3.918762475311197e-05, "loss": 0.4084, "loss_nan_ranks": 0, "loss_rank_avg": 0.4843234419822693, "step": 730, "valid_targets_mean": 4021.4, "valid_targets_min": 1101 }, { "epoch": 1.284965034965035, "grad_norm": 0.5283842836058, "learning_rate": 3.91628439939693e-05, "loss": 0.3659, "loss_nan_ranks": 0, "loss_rank_avg": 0.3728162348270416, "step": 735, "valid_targets_mean": 4352.0, "valid_targets_min": 954 }, { "epoch": 1.2937062937062938, "grad_norm": 0.5966704473150931, "learning_rate": 3.913769900919431e-05, "loss": 0.3566, "loss_nan_ranks": 0, "loss_rank_avg": 0.38558197021484375, "step": 740, "valid_targets_mean": 5053.8, "valid_targets_min": 1163 }, { "epoch": 1.3024475524475525, "grad_norm": 0.6138554581865869, "learning_rate": 3.91121902767144e-05, "loss": 0.3435, "loss_nan_ranks": 0, "loss_rank_avg": 0.3052510619163513, "step": 745, "valid_targets_mean": 3518.2, "valid_targets_min": 1127 }, { "epoch": 1.3111888111888113, "grad_norm": 0.6487462123963363, "learning_rate": 3.908631828137067e-05, "loss": 0.4114, "loss_nan_ranks": 0, "loss_rank_avg": 0.4444257318973541, "step": 750, "valid_targets_mean": 4018.6, "valid_targets_min": 836 }, { "epoch": 1.31993006993007, "grad_norm": 0.508254488406239, "learning_rate": 3.9060083514908695e-05, "loss": 0.4277, "loss_nan_ranks": 0, "loss_rank_avg": 0.42669036984443665, "step": 755, "valid_targets_mean": 5763.0, "valid_targets_min": 1080 }, { "epoch": 1.3286713286713288, "grad_norm": 0.48404850385049064, "learning_rate": 3.903348647596919e-05, "loss": 0.3673, "loss_nan_ranks": 0, "loss_rank_avg": 0.42117491364479065, "step": 760, "valid_targets_mean": 6734.8, "valid_targets_min": 1439 }, { "epoch": 1.3374125874125875, "grad_norm": 0.5928130214677121, "learning_rate": 3.900652767007855e-05, "loss": 0.363, "loss_nan_ranks": 0, "loss_rank_avg": 0.3812492787837982, "step": 765, "valid_targets_mean": 5822.9, "valid_targets_min": 844 }, { "epoch": 1.3461538461538463, "grad_norm": 0.6239373645782617, "learning_rate": 3.8979207609639225e-05, "loss": 0.3715, "loss_nan_ranks": 0, "loss_rank_avg": 0.4304284155368805, "step": 770, "valid_targets_mean": 4057.4, "valid_targets_min": 816 }, { "epoch": 1.354895104895105, "grad_norm": 0.5195351816200816, "learning_rate": 3.8951526813919975e-05, "loss": 0.3717, "loss_nan_ranks": 0, "loss_rank_avg": 0.30584895610809326, "step": 775, "valid_targets_mean": 4133.8, "valid_targets_min": 1393 }, { "epoch": 1.3636363636363638, "grad_norm": 0.602430063013215, "learning_rate": 3.8923485809046006e-05, "loss": 0.3618, "loss_nan_ranks": 0, "loss_rank_avg": 0.43198758363723755, "step": 780, "valid_targets_mean": 5221.6, "valid_targets_min": 865 }, { "epoch": 1.3723776223776225, "grad_norm": 0.5793853580026894, "learning_rate": 3.889508512798898e-05, "loss": 0.3733, "loss_nan_ranks": 0, "loss_rank_avg": 0.375804603099823, "step": 785, "valid_targets_mean": 3890.5, "valid_targets_min": 1119 }, { "epoch": 1.381118881118881, "grad_norm": 0.6283176928865934, "learning_rate": 3.886632531055687e-05, "loss": 0.3507, "loss_nan_ranks": 0, "loss_rank_avg": 0.36522990465164185, "step": 790, "valid_targets_mean": 2879.0, "valid_targets_min": 914 }, { "epoch": 1.3898601398601398, "grad_norm": 0.5586170363792717, "learning_rate": 3.883720690338372e-05, "loss": 0.3915, "loss_nan_ranks": 0, "loss_rank_avg": 0.36750155687332153, "step": 795, "valid_targets_mean": 3684.4, "valid_targets_min": 1034 }, { "epoch": 1.3986013986013985, "grad_norm": 0.5971605319742396, "learning_rate": 3.880773045991921e-05, "loss": 0.3822, "loss_nan_ranks": 0, "loss_rank_avg": 0.31041955947875977, "step": 800, "valid_targets_mean": 3070.0, "valid_targets_min": 405 }, { "epoch": 1.4073426573426573, "grad_norm": 0.5992895435680253, "learning_rate": 3.8777896540418204e-05, "loss": 0.3407, "loss_nan_ranks": 0, "loss_rank_avg": 0.3061218559741974, "step": 805, "valid_targets_mean": 2962.3, "valid_targets_min": 1200 }, { "epoch": 1.416083916083916, "grad_norm": 0.5163991467972393, "learning_rate": 3.874770571193004e-05, "loss": 0.3634, "loss_nan_ranks": 0, "loss_rank_avg": 0.4339129328727722, "step": 810, "valid_targets_mean": 6174.8, "valid_targets_min": 2106 }, { "epoch": 1.4248251748251748, "grad_norm": 0.5915515016899537, "learning_rate": 3.871715854828779e-05, "loss": 0.3775, "loss_nan_ranks": 0, "loss_rank_avg": 0.3776523470878601, "step": 815, "valid_targets_mean": 4111.8, "valid_targets_min": 986 }, { "epoch": 1.4335664335664335, "grad_norm": 0.5746894134419273, "learning_rate": 3.8686255630097346e-05, "loss": 0.3695, "loss_nan_ranks": 0, "loss_rank_avg": 0.3666810989379883, "step": 820, "valid_targets_mean": 3390.7, "valid_targets_min": 1340 }, { "epoch": 1.4423076923076923, "grad_norm": 0.6144270484363288, "learning_rate": 3.8654997544726374e-05, "loss": 0.3715, "loss_nan_ranks": 0, "loss_rank_avg": 0.38752689957618713, "step": 825, "valid_targets_mean": 3446.4, "valid_targets_min": 1126 }, { "epoch": 1.451048951048951, "grad_norm": 0.5922060872547307, "learning_rate": 3.862338488629314e-05, "loss": 0.3757, "loss_nan_ranks": 0, "loss_rank_avg": 0.34740880131721497, "step": 830, "valid_targets_mean": 4006.9, "valid_targets_min": 991 }, { "epoch": 1.4597902097902098, "grad_norm": 0.6002301065901973, "learning_rate": 3.859141825565525e-05, "loss": 0.3843, "loss_nan_ranks": 0, "loss_rank_avg": 0.35890963673591614, "step": 835, "valid_targets_mean": 3065.4, "valid_targets_min": 1571 }, { "epoch": 1.4685314685314685, "grad_norm": 0.6051255681472264, "learning_rate": 3.855909826039822e-05, "loss": 0.3499, "loss_nan_ranks": 0, "loss_rank_avg": 0.3590480089187622, "step": 840, "valid_targets_mean": 2918.1, "valid_targets_min": 1159 }, { "epoch": 1.4772727272727273, "grad_norm": 0.46918016708384985, "learning_rate": 3.852642551482391e-05, "loss": 0.3998, "loss_nan_ranks": 0, "loss_rank_avg": 0.3891509175300598, "step": 845, "valid_targets_mean": 5518.4, "valid_targets_min": 794 }, { "epoch": 1.486013986013986, "grad_norm": 0.5672184897056678, "learning_rate": 3.849340063993884e-05, "loss": 0.3841, "loss_nan_ranks": 0, "loss_rank_avg": 0.46270751953125, "step": 850, "valid_targets_mean": 5028.8, "valid_targets_min": 1013 }, { "epoch": 1.4947552447552448, "grad_norm": 0.6032267971221293, "learning_rate": 3.8460024263442446e-05, "loss": 0.3907, "loss_nan_ranks": 0, "loss_rank_avg": 0.36976176500320435, "step": 855, "valid_targets_mean": 3296.6, "valid_targets_min": 295 }, { "epoch": 1.5034965034965035, "grad_norm": 0.5937950046708127, "learning_rate": 3.842629701971507e-05, "loss": 0.3838, "loss_nan_ranks": 0, "loss_rank_avg": 0.3807605504989624, "step": 860, "valid_targets_mean": 3674.1, "valid_targets_min": 866 }, { "epoch": 1.512237762237762, "grad_norm": 0.5638487866108519, "learning_rate": 3.839221954980596e-05, "loss": 0.3611, "loss_nan_ranks": 0, "loss_rank_avg": 0.35325905680656433, "step": 865, "valid_targets_mean": 3803.4, "valid_targets_min": 397 }, { "epoch": 1.5209790209790208, "grad_norm": 0.5702323841541543, "learning_rate": 3.835779250142108e-05, "loss": 0.3512, "loss_nan_ranks": 0, "loss_rank_avg": 0.34167003631591797, "step": 870, "valid_targets_mean": 3481.8, "valid_targets_min": 992 }, { "epoch": 1.5297202797202796, "grad_norm": 0.5291286455210686, "learning_rate": 3.8323016528910746e-05, "loss": 0.3859, "loss_nan_ranks": 0, "loss_rank_avg": 0.3847964107990265, "step": 875, "valid_targets_mean": 4120.1, "valid_targets_min": 1221 }, { "epoch": 1.5384615384615383, "grad_norm": 0.6275254868035214, "learning_rate": 3.828789229325726e-05, "loss": 0.3926, "loss_nan_ranks": 0, "loss_rank_avg": 0.42605069279670715, "step": 880, "valid_targets_mean": 4082.6, "valid_targets_min": 865 }, { "epoch": 1.547202797202797, "grad_norm": 0.5396398856381337, "learning_rate": 3.8252420462062315e-05, "loss": 0.3914, "loss_nan_ranks": 0, "loss_rank_avg": 0.36167097091674805, "step": 885, "valid_targets_mean": 4174.7, "valid_targets_min": 1224 }, { "epoch": 1.5559440559440558, "grad_norm": 0.47910903259168275, "learning_rate": 3.8216601709534284e-05, "loss": 0.3922, "loss_nan_ranks": 0, "loss_rank_avg": 0.3376033306121826, "step": 890, "valid_targets_mean": 5025.0, "valid_targets_min": 1179 }, { "epoch": 1.5646853146853146, "grad_norm": 0.5073648171270649, "learning_rate": 3.818043671647545e-05, "loss": 0.368, "loss_nan_ranks": 0, "loss_rank_avg": 0.39315563440322876, "step": 895, "valid_targets_mean": 5091.6, "valid_targets_min": 286 }, { "epoch": 1.5734265734265733, "grad_norm": 0.6352472398575295, "learning_rate": 3.814392617026904e-05, "loss": 0.3474, "loss_nan_ranks": 0, "loss_rank_avg": 0.42686229944229126, "step": 900, "valid_targets_mean": 4175.8, "valid_targets_min": 783 }, { "epoch": 1.582167832167832, "grad_norm": 0.6935854438042858, "learning_rate": 3.810707076486616e-05, "loss": 0.3934, "loss_nan_ranks": 0, "loss_rank_avg": 0.27806347608566284, "step": 905, "valid_targets_mean": 2418.1, "valid_targets_min": 745 }, { "epoch": 1.5909090909090908, "grad_norm": 0.6454560477570744, "learning_rate": 3.80698712007726e-05, "loss": 0.3393, "loss_nan_ranks": 0, "loss_rank_avg": 0.40068015456199646, "step": 910, "valid_targets_mean": 3282.2, "valid_targets_min": 1009 }, { "epoch": 1.5996503496503496, "grad_norm": 0.71255907929696, "learning_rate": 3.8032328185035535e-05, "loss": 0.3491, "loss_nan_ranks": 0, "loss_rank_avg": 0.38632285594940186, "step": 915, "valid_targets_mean": 2531.9, "valid_targets_min": 1153 }, { "epoch": 1.6083916083916083, "grad_norm": 0.6583779603016164, "learning_rate": 3.7994442431230096e-05, "loss": 0.3722, "loss_nan_ranks": 0, "loss_rank_avg": 0.3876379430294037, "step": 920, "valid_targets_mean": 2792.9, "valid_targets_min": 721 }, { "epoch": 1.617132867132867, "grad_norm": 0.548264282270815, "learning_rate": 3.7956214659445764e-05, "loss": 0.332, "loss_nan_ranks": 0, "loss_rank_avg": 0.3522208034992218, "step": 925, "valid_targets_mean": 3671.8, "valid_targets_min": 1283 }, { "epoch": 1.6258741258741258, "grad_norm": 0.5866905542029235, "learning_rate": 3.7917645596272734e-05, "loss": 0.3874, "loss_nan_ranks": 0, "loss_rank_avg": 0.3922966420650482, "step": 930, "valid_targets_mean": 3553.9, "valid_targets_min": 753 }, { "epoch": 1.6346153846153846, "grad_norm": 0.48891096645703447, "learning_rate": 3.7878735974788056e-05, "loss": 0.3726, "loss_nan_ranks": 0, "loss_rank_avg": 0.4203706383705139, "step": 935, "valid_targets_mean": 5460.0, "valid_targets_min": 1274 }, { "epoch": 1.6433566433566433, "grad_norm": 0.5973489726719953, "learning_rate": 3.783948653454176e-05, "loss": 0.3664, "loss_nan_ranks": 0, "loss_rank_avg": 0.3803213834762573, "step": 940, "valid_targets_mean": 3419.8, "valid_targets_min": 1239 }, { "epoch": 1.652097902097902, "grad_norm": 0.5931207818844045, "learning_rate": 3.779989802154273e-05, "loss": 0.3846, "loss_nan_ranks": 0, "loss_rank_avg": 0.4405151903629303, "step": 945, "valid_targets_mean": 4785.6, "valid_targets_min": 703 }, { "epoch": 1.6608391608391608, "grad_norm": 0.49894822325713817, "learning_rate": 3.7759971188244594e-05, "loss": 0.3649, "loss_nan_ranks": 0, "loss_rank_avg": 0.3540881276130676, "step": 950, "valid_targets_mean": 4723.8, "valid_targets_min": 1461 }, { "epoch": 1.6695804195804196, "grad_norm": 0.5865370598515728, "learning_rate": 3.771970679353135e-05, "loss": 0.3366, "loss_nan_ranks": 0, "loss_rank_avg": 0.2708732485771179, "step": 955, "valid_targets_mean": 2668.8, "valid_targets_min": 1174 }, { "epoch": 1.6783216783216783, "grad_norm": 0.5791850182023949, "learning_rate": 3.767910560270303e-05, "loss": 0.3523, "loss_nan_ranks": 0, "loss_rank_avg": 0.3443334102630615, "step": 960, "valid_targets_mean": 3261.9, "valid_targets_min": 317 }, { "epoch": 1.687062937062937, "grad_norm": 0.6093901195497682, "learning_rate": 3.763816838746107e-05, "loss": 0.3395, "loss_nan_ranks": 0, "loss_rank_avg": 0.3926513195037842, "step": 965, "valid_targets_mean": 3403.4, "valid_targets_min": 860 }, { "epoch": 1.6958041958041958, "grad_norm": 0.5919210341830557, "learning_rate": 3.759689592589367e-05, "loss": 0.3628, "loss_nan_ranks": 0, "loss_rank_avg": 0.31532764434814453, "step": 970, "valid_targets_mean": 2884.4, "valid_targets_min": 1038 }, { "epoch": 1.7045454545454546, "grad_norm": 0.5817284643320272, "learning_rate": 3.755528900246106e-05, "loss": 0.3591, "loss_nan_ranks": 0, "loss_rank_avg": 0.3037341237068176, "step": 975, "valid_targets_mean": 2825.8, "valid_targets_min": 1070 }, { "epoch": 1.7132867132867133, "grad_norm": 0.5981859182760877, "learning_rate": 3.7513348407980483e-05, "loss": 0.4053, "loss_nan_ranks": 0, "loss_rank_avg": 0.34905627369880676, "step": 980, "valid_targets_mean": 3172.6, "valid_targets_min": 1304 }, { "epoch": 1.722027972027972, "grad_norm": 0.5243877796252934, "learning_rate": 3.747107493961126e-05, "loss": 0.3649, "loss_nan_ranks": 0, "loss_rank_avg": 0.44003045558929443, "step": 985, "valid_targets_mean": 6281.9, "valid_targets_min": 1602 }, { "epoch": 1.7307692307692308, "grad_norm": 0.6888200590905601, "learning_rate": 3.7428469400839604e-05, "loss": 0.3172, "loss_nan_ranks": 0, "loss_rank_avg": 0.27428072690963745, "step": 990, "valid_targets_mean": 2553.9, "valid_targets_min": 908 }, { "epoch": 1.7395104895104896, "grad_norm": 0.6562142049594524, "learning_rate": 3.738553260146332e-05, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.36127781867980957, "step": 995, "valid_targets_mean": 3028.3, "valid_targets_min": 938 }, { "epoch": 1.7482517482517483, "grad_norm": 0.6242645620698037, "learning_rate": 3.734226535757647e-05, "loss": 0.3666, "loss_nan_ranks": 0, "loss_rank_avg": 0.4239537715911865, "step": 1000, "valid_targets_mean": 3935.4, "valid_targets_min": 1225 }, { "epoch": 1.756993006993007, "grad_norm": 0.48728283464574973, "learning_rate": 3.729866849155381e-05, "loss": 0.326, "loss_nan_ranks": 0, "loss_rank_avg": 0.388911634683609, "step": 1005, "valid_targets_mean": 5385.4, "valid_targets_min": 1104 }, { "epoch": 1.7657342657342658, "grad_norm": 0.6342231197385638, "learning_rate": 3.7254742832035174e-05, "loss": 0.3811, "loss_nan_ranks": 0, "loss_rank_avg": 0.3924434185028076, "step": 1010, "valid_targets_mean": 3746.3, "valid_targets_min": 1110 }, { "epoch": 1.7744755244755246, "grad_norm": 0.5552439867083838, "learning_rate": 3.721048921390975e-05, "loss": 0.3546, "loss_nan_ranks": 0, "loss_rank_avg": 0.32628345489501953, "step": 1015, "valid_targets_mean": 2988.6, "valid_targets_min": 1117 }, { "epoch": 1.7832167832167833, "grad_norm": 0.5174881529638417, "learning_rate": 3.716590847830019e-05, "loss": 0.3405, "loss_nan_ranks": 0, "loss_rank_avg": 0.4475651979446411, "step": 1020, "valid_targets_mean": 5184.8, "valid_targets_min": 1395 }, { "epoch": 1.791958041958042, "grad_norm": 0.5747806673287248, "learning_rate": 3.712100147254662e-05, "loss": 0.3569, "loss_nan_ranks": 0, "loss_rank_avg": 0.31613489985466003, "step": 1025, "valid_targets_mean": 3144.9, "valid_targets_min": 1323 }, { "epoch": 1.8006993006993008, "grad_norm": 0.5455829057478265, "learning_rate": 3.707576905019053e-05, "loss": 0.3623, "loss_nan_ranks": 0, "loss_rank_avg": 0.33471807837486267, "step": 1030, "valid_targets_mean": 3088.8, "valid_targets_min": 857 }, { "epoch": 1.8094405594405596, "grad_norm": 0.6517636899008046, "learning_rate": 3.703021207095856e-05, "loss": 0.3776, "loss_nan_ranks": 0, "loss_rank_avg": 0.38492679595947266, "step": 1035, "valid_targets_mean": 2833.6, "valid_targets_min": 894 }, { "epoch": 1.8181818181818183, "grad_norm": 0.5801054629631718, "learning_rate": 3.6984331400746184e-05, "loss": 0.3721, "loss_nan_ranks": 0, "loss_rank_avg": 0.3238530457019806, "step": 1040, "valid_targets_mean": 3322.8, "valid_targets_min": 985 }, { "epoch": 1.8269230769230769, "grad_norm": 0.5586861505293964, "learning_rate": 3.693812791160121e-05, "loss": 0.3558, "loss_nan_ranks": 0, "loss_rank_avg": 0.3880930542945862, "step": 1045, "valid_targets_mean": 3823.8, "valid_targets_min": 1197 }, { "epoch": 1.8356643356643356, "grad_norm": 0.6145308306637935, "learning_rate": 3.6891602481707207e-05, "loss": 0.3266, "loss_nan_ranks": 0, "loss_rank_avg": 0.3544296622276306, "step": 1050, "valid_targets_mean": 3499.2, "valid_targets_min": 1000 }, { "epoch": 1.8444055944055944, "grad_norm": 0.58907820308691, "learning_rate": 3.684475599536687e-05, "loss": 0.3682, "loss_nan_ranks": 0, "loss_rank_avg": 0.4255306124687195, "step": 1055, "valid_targets_mean": 5237.4, "valid_targets_min": 1340 }, { "epoch": 1.8531468531468531, "grad_norm": 0.5015996234360681, "learning_rate": 3.6797589342985126e-05, "loss": 0.3616, "loss_nan_ranks": 0, "loss_rank_avg": 0.37960782647132874, "step": 1060, "valid_targets_mean": 4262.1, "valid_targets_min": 910 }, { "epoch": 1.8618881118881119, "grad_norm": 0.5260945935702037, "learning_rate": 3.6750103421052286e-05, "loss": 0.3365, "loss_nan_ranks": 0, "loss_rank_avg": 0.37209346890449524, "step": 1065, "valid_targets_mean": 4495.8, "valid_targets_min": 1369 }, { "epoch": 1.8706293706293706, "grad_norm": 0.5542537902859789, "learning_rate": 3.670229913212696e-05, "loss": 0.38, "loss_nan_ranks": 0, "loss_rank_avg": 0.42989593744277954, "step": 1070, "valid_targets_mean": 5143.3, "valid_targets_min": 1686 }, { "epoch": 1.8793706293706294, "grad_norm": 0.5321301926401418, "learning_rate": 3.6654177384818936e-05, "loss": 0.3785, "loss_nan_ranks": 0, "loss_rank_avg": 0.4028235673904419, "step": 1075, "valid_targets_mean": 4950.6, "valid_targets_min": 1291 }, { "epoch": 1.8881118881118881, "grad_norm": 0.584447522220945, "learning_rate": 3.6605739093771854e-05, "loss": 0.3795, "loss_nan_ranks": 0, "loss_rank_avg": 0.37142544984817505, "step": 1080, "valid_targets_mean": 3263.2, "valid_targets_min": 795 }, { "epoch": 1.8968531468531469, "grad_norm": 0.5350619514142159, "learning_rate": 3.6556985179645905e-05, "loss": 0.3577, "loss_nan_ranks": 0, "loss_rank_avg": 0.41316014528274536, "step": 1085, "valid_targets_mean": 4889.9, "valid_targets_min": 1222 }, { "epoch": 1.9055944055944056, "grad_norm": 0.5814069068694546, "learning_rate": 3.6507916569100255e-05, "loss": 0.3466, "loss_nan_ranks": 0, "loss_rank_avg": 0.3615434169769287, "step": 1090, "valid_targets_mean": 2938.7, "valid_targets_min": 1106 }, { "epoch": 1.9143356643356644, "grad_norm": 0.6849481252444816, "learning_rate": 3.645853419477547e-05, "loss": 0.3651, "loss_nan_ranks": 0, "loss_rank_avg": 0.258215069770813, "step": 1095, "valid_targets_mean": 2303.6, "valid_targets_min": 344 }, { "epoch": 1.9230769230769231, "grad_norm": 0.5454940887177128, "learning_rate": 3.640883899527579e-05, "loss": 0.3889, "loss_nan_ranks": 0, "loss_rank_avg": 0.38337862491607666, "step": 1100, "valid_targets_mean": 4225.1, "valid_targets_min": 1207 }, { "epoch": 1.9318181818181817, "grad_norm": 0.5879298330740542, "learning_rate": 3.6358831915151276e-05, "loss": 0.3781, "loss_nan_ranks": 0, "loss_rank_avg": 0.5195822715759277, "step": 1105, "valid_targets_mean": 5530.6, "valid_targets_min": 896 }, { "epoch": 1.9405594405594404, "grad_norm": 0.5232477468919542, "learning_rate": 3.630851390487985e-05, "loss": 0.3618, "loss_nan_ranks": 0, "loss_rank_avg": 0.32636207342147827, "step": 1110, "valid_targets_mean": 3888.2, "valid_targets_min": 1052 }, { "epoch": 1.9493006993006992, "grad_norm": 0.5356916033918182, "learning_rate": 3.625788592084926e-05, "loss": 0.3587, "loss_nan_ranks": 0, "loss_rank_avg": 0.3277405798435211, "step": 1115, "valid_targets_mean": 3823.6, "valid_targets_min": 408 }, { "epoch": 1.958041958041958, "grad_norm": 0.5544913344651682, "learning_rate": 3.620694892533889e-05, "loss": 0.3694, "loss_nan_ranks": 0, "loss_rank_avg": 0.42964452505111694, "step": 1120, "valid_targets_mean": 4196.4, "valid_targets_min": 1248 }, { "epoch": 1.9667832167832167, "grad_norm": 0.558219067439635, "learning_rate": 3.615570388650144e-05, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.38968485593795776, "step": 1125, "valid_targets_mean": 3462.7, "valid_targets_min": 870 }, { "epoch": 1.9755244755244754, "grad_norm": 0.5275189202715219, "learning_rate": 3.610415177834457e-05, "loss": 0.3589, "loss_nan_ranks": 0, "loss_rank_avg": 0.42595839500427246, "step": 1130, "valid_targets_mean": 4739.6, "valid_targets_min": 880 }, { "epoch": 1.9842657342657342, "grad_norm": 0.5691050784475108, "learning_rate": 3.605229358071236e-05, "loss": 0.3618, "loss_nan_ranks": 0, "loss_rank_avg": 0.39064157009124756, "step": 1135, "valid_targets_mean": 3912.1, "valid_targets_min": 1217 }, { "epoch": 1.993006993006993, "grad_norm": 0.5388771565097371, "learning_rate": 3.600013027926667e-05, "loss": 0.3487, "loss_nan_ranks": 0, "loss_rank_avg": 0.2591717839241028, "step": 1140, "valid_targets_mean": 3237.1, "valid_targets_min": 1415 }, { "epoch": 2.0017482517482517, "grad_norm": 0.5553503636171387, "learning_rate": 3.594766286546847e-05, "loss": 0.3646, "loss_nan_ranks": 0, "loss_rank_avg": 0.32958346605300903, "step": 1145, "valid_targets_mean": 3299.1, "valid_targets_min": 890 }, { "epoch": 2.0104895104895104, "grad_norm": 0.6240329555824098, "learning_rate": 3.589489233655891e-05, "loss": 0.3581, "loss_nan_ranks": 0, "loss_rank_avg": 0.3101613521575928, "step": 1150, "valid_targets_mean": 3488.4, "valid_targets_min": 910 }, { "epoch": 2.019230769230769, "grad_norm": 0.5394247078220722, "learning_rate": 3.5841819695540446e-05, "loss": 0.35, "loss_nan_ranks": 0, "loss_rank_avg": 0.3253103196620941, "step": 1155, "valid_targets_mean": 3960.2, "valid_targets_min": 1113 }, { "epoch": 2.027972027972028, "grad_norm": 0.5536721946245187, "learning_rate": 3.5788445951157705e-05, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.2637212872505188, "step": 1160, "valid_targets_mean": 3050.2, "valid_targets_min": 1087 }, { "epoch": 2.0367132867132867, "grad_norm": 0.5495101580283069, "learning_rate": 3.5734772117878376e-05, "loss": 0.3411, "loss_nan_ranks": 0, "loss_rank_avg": 0.286973237991333, "step": 1165, "valid_targets_mean": 3388.9, "valid_targets_min": 1085 }, { "epoch": 2.0454545454545454, "grad_norm": 0.7159443153475205, "learning_rate": 3.568079921587388e-05, "loss": 0.3789, "loss_nan_ranks": 0, "loss_rank_avg": 0.396413117647171, "step": 1170, "valid_targets_mean": 4071.5, "valid_targets_min": 1321 }, { "epoch": 2.054195804195804, "grad_norm": 0.5091694275857868, "learning_rate": 3.5626528271000004e-05, "loss": 0.3309, "loss_nan_ranks": 0, "loss_rank_avg": 0.26522356271743774, "step": 1175, "valid_targets_mean": 3710.6, "valid_targets_min": 1186 }, { "epoch": 2.062937062937063, "grad_norm": 0.5494408643701906, "learning_rate": 3.557196031477739e-05, "loss": 0.3245, "loss_nan_ranks": 0, "loss_rank_avg": 0.26861274242401123, "step": 1180, "valid_targets_mean": 3189.2, "valid_targets_min": 444 }, { "epoch": 2.0716783216783217, "grad_norm": 0.5642588272002523, "learning_rate": 3.551709638437193e-05, "loss": 0.3679, "loss_nan_ranks": 0, "loss_rank_avg": 0.4018964469432831, "step": 1185, "valid_targets_mean": 4603.7, "valid_targets_min": 1275 }, { "epoch": 2.0804195804195804, "grad_norm": 0.6029948726748001, "learning_rate": 3.546193752257509e-05, "loss": 0.3367, "loss_nan_ranks": 0, "loss_rank_avg": 0.4047200679779053, "step": 1190, "valid_targets_mean": 3797.2, "valid_targets_min": 1575 }, { "epoch": 2.089160839160839, "grad_norm": 0.6765562020479058, "learning_rate": 3.540648477778401e-05, "loss": 0.3233, "loss_nan_ranks": 0, "loss_rank_avg": 0.2479398250579834, "step": 1195, "valid_targets_mean": 2208.5, "valid_targets_min": 864 }, { "epoch": 2.097902097902098, "grad_norm": 0.6399857417560751, "learning_rate": 3.535073920398167e-05, "loss": 0.3357, "loss_nan_ranks": 0, "loss_rank_avg": 0.3365986943244934, "step": 1200, "valid_targets_mean": 4008.9, "valid_targets_min": 780 }, { "epoch": 2.1066433566433567, "grad_norm": 0.5423206989158699, "learning_rate": 3.5294701860716773e-05, "loss": 0.3223, "loss_nan_ranks": 0, "loss_rank_avg": 0.36652547121047974, "step": 1205, "valid_targets_mean": 4254.9, "valid_targets_min": 1298 }, { "epoch": 2.1153846153846154, "grad_norm": 0.5548106930603924, "learning_rate": 3.523837381308369e-05, "loss": 0.3519, "loss_nan_ranks": 0, "loss_rank_avg": 0.28331395983695984, "step": 1210, "valid_targets_mean": 3385.2, "valid_targets_min": 814 }, { "epoch": 2.124125874125874, "grad_norm": 0.5212164148919388, "learning_rate": 3.518175613170212e-05, "loss": 0.3265, "loss_nan_ranks": 0, "loss_rank_avg": 0.29387807846069336, "step": 1215, "valid_targets_mean": 3507.8, "valid_targets_min": 286 }, { "epoch": 2.132867132867133, "grad_norm": 0.5973253477387896, "learning_rate": 3.512484989269683e-05, "loss": 0.3086, "loss_nan_ranks": 0, "loss_rank_avg": 0.33061522245407104, "step": 1220, "valid_targets_mean": 3305.0, "valid_targets_min": 1372 }, { "epoch": 2.1416083916083917, "grad_norm": 0.6309218234838987, "learning_rate": 3.506765617767715e-05, "loss": 0.3305, "loss_nan_ranks": 0, "loss_rank_avg": 0.3732965588569641, "step": 1225, "valid_targets_mean": 3301.4, "valid_targets_min": 721 }, { "epoch": 2.1503496503496504, "grad_norm": 0.5574659734718239, "learning_rate": 3.501017607371644e-05, "loss": 0.3393, "loss_nan_ranks": 0, "loss_rank_avg": 0.31696557998657227, "step": 1230, "valid_targets_mean": 3856.6, "valid_targets_min": 785 }, { "epoch": 2.159090909090909, "grad_norm": 0.5329453873399369, "learning_rate": 3.4952410673331394e-05, "loss": 0.3115, "loss_nan_ranks": 0, "loss_rank_avg": 0.3600800335407257, "step": 1235, "valid_targets_mean": 4775.6, "valid_targets_min": 749 }, { "epoch": 2.167832167832168, "grad_norm": 0.8114793310805336, "learning_rate": 3.489436107446131e-05, "loss": 0.3408, "loss_nan_ranks": 0, "loss_rank_avg": 0.3316611051559448, "step": 1240, "valid_targets_mean": 4332.1, "valid_targets_min": 1436 }, { "epoch": 2.1765734265734267, "grad_norm": 0.6006878212399688, "learning_rate": 3.483602838044722e-05, "loss": 0.3194, "loss_nan_ranks": 0, "loss_rank_avg": 0.3003237247467041, "step": 1245, "valid_targets_mean": 3266.6, "valid_targets_min": 1159 }, { "epoch": 2.1853146853146854, "grad_norm": 0.6353674050757039, "learning_rate": 3.477741370001088e-05, "loss": 0.3026, "loss_nan_ranks": 0, "loss_rank_avg": 0.36900120973587036, "step": 1250, "valid_targets_mean": 3345.0, "valid_targets_min": 1196 }, { "epoch": 2.194055944055944, "grad_norm": 0.5737740743381646, "learning_rate": 3.471851814723375e-05, "loss": 0.3521, "loss_nan_ranks": 0, "loss_rank_avg": 0.3949390649795532, "step": 1255, "valid_targets_mean": 3930.3, "valid_targets_min": 1197 }, { "epoch": 2.202797202797203, "grad_norm": 0.552663490793486, "learning_rate": 3.4659342841535795e-05, "loss": 0.3548, "loss_nan_ranks": 0, "loss_rank_avg": 0.371884286403656, "step": 1260, "valid_targets_mean": 4117.4, "valid_targets_min": 1068 }, { "epoch": 2.2115384615384617, "grad_norm": 0.6384782410157998, "learning_rate": 3.459988890765418e-05, "loss": 0.369, "loss_nan_ranks": 0, "loss_rank_avg": 0.3499044179916382, "step": 1265, "valid_targets_mean": 4232.2, "valid_targets_min": 1426 }, { "epoch": 2.2202797202797204, "grad_norm": 0.5746738157396588, "learning_rate": 3.454015747562194e-05, "loss": 0.2951, "loss_nan_ranks": 0, "loss_rank_avg": 0.34578144550323486, "step": 1270, "valid_targets_mean": 3794.6, "valid_targets_min": 1139 }, { "epoch": 2.229020979020979, "grad_norm": 0.5054542749499512, "learning_rate": 3.448014968074648e-05, "loss": 0.3199, "loss_nan_ranks": 0, "loss_rank_avg": 0.2880406081676483, "step": 1275, "valid_targets_mean": 4538.5, "valid_targets_min": 1731 }, { "epoch": 2.237762237762238, "grad_norm": 0.5818466658704541, "learning_rate": 3.4419866663587985e-05, "loss": 0.3404, "loss_nan_ranks": 0, "loss_rank_avg": 0.3284459114074707, "step": 1280, "valid_targets_mean": 3571.0, "valid_targets_min": 1487 }, { "epoch": 2.2465034965034967, "grad_norm": 0.4995232658017769, "learning_rate": 3.4359309569937766e-05, "loss": 0.3373, "loss_nan_ranks": 0, "loss_rank_avg": 0.297016978263855, "step": 1285, "valid_targets_mean": 4168.3, "valid_targets_min": 1398 }, { "epoch": 2.2552447552447554, "grad_norm": 0.5808033797273252, "learning_rate": 3.429847955079646e-05, "loss": 0.3706, "loss_nan_ranks": 0, "loss_rank_avg": 0.32967421412467957, "step": 1290, "valid_targets_mean": 3232.4, "valid_targets_min": 933 }, { "epoch": 2.263986013986014, "grad_norm": 0.551203626753292, "learning_rate": 3.4237377762352166e-05, "loss": 0.3053, "loss_nan_ranks": 0, "loss_rank_avg": 0.30884337425231934, "step": 1295, "valid_targets_mean": 3447.6, "valid_targets_min": 1581 }, { "epoch": 2.2727272727272725, "grad_norm": 0.6298591338426267, "learning_rate": 3.4176005365958484e-05, "loss": 0.3233, "loss_nan_ranks": 0, "loss_rank_avg": 0.3573980927467346, "step": 1300, "valid_targets_mean": 3034.1, "valid_targets_min": 870 }, { "epoch": 2.2814685314685317, "grad_norm": 0.543847122853011, "learning_rate": 3.4114363528112376e-05, "loss": 0.361, "loss_nan_ranks": 0, "loss_rank_avg": 0.35683882236480713, "step": 1305, "valid_targets_mean": 4214.3, "valid_targets_min": 250 }, { "epoch": 2.29020979020979, "grad_norm": 0.5493972333043645, "learning_rate": 3.40524534204321e-05, "loss": 0.3097, "loss_nan_ranks": 0, "loss_rank_avg": 0.3217867314815521, "step": 1310, "valid_targets_mean": 4069.3, "valid_targets_min": 1209 }, { "epoch": 2.298951048951049, "grad_norm": 0.5790482571574604, "learning_rate": 3.399027621963484e-05, "loss": 0.3362, "loss_nan_ranks": 0, "loss_rank_avg": 0.3702848255634308, "step": 1315, "valid_targets_mean": 3910.4, "valid_targets_min": 1270 }, { "epoch": 2.3076923076923075, "grad_norm": 0.5521276510177341, "learning_rate": 3.392783310751441e-05, "loss": 0.342, "loss_nan_ranks": 0, "loss_rank_avg": 0.3059583306312561, "step": 1320, "valid_targets_mean": 3604.1, "valid_targets_min": 783 }, { "epoch": 2.3164335664335667, "grad_norm": 0.6269207847914563, "learning_rate": 3.3865125270918735e-05, "loss": 0.3392, "loss_nan_ranks": 0, "loss_rank_avg": 0.30475157499313354, "step": 1325, "valid_targets_mean": 2917.2, "valid_targets_min": 340 }, { "epoch": 2.325174825174825, "grad_norm": 0.6239842100481497, "learning_rate": 3.380215390172736e-05, "loss": 0.3013, "loss_nan_ranks": 0, "loss_rank_avg": 0.23520943522453308, "step": 1330, "valid_targets_mean": 2649.5, "valid_targets_min": 902 }, { "epoch": 2.3339160839160837, "grad_norm": 0.786197683842576, "learning_rate": 3.373892019682874e-05, "loss": 0.3944, "loss_nan_ranks": 0, "loss_rank_avg": 0.4770873785018921, "step": 1335, "valid_targets_mean": 5682.6, "valid_targets_min": 857 }, { "epoch": 2.3426573426573425, "grad_norm": 0.5897989134852589, "learning_rate": 3.36754253580975e-05, "loss": 0.3396, "loss_nan_ranks": 0, "loss_rank_avg": 0.41615045070648193, "step": 1340, "valid_targets_mean": 4481.4, "valid_targets_min": 1026 }, { "epoch": 2.3513986013986012, "grad_norm": 0.5033226934658113, "learning_rate": 3.361167059237162e-05, "loss": 0.4161, "loss_nan_ranks": 0, "loss_rank_avg": 0.3581768870353699, "step": 1345, "valid_targets_mean": 4554.1, "valid_targets_min": 1684 }, { "epoch": 2.36013986013986, "grad_norm": 0.6251621961865819, "learning_rate": 3.354765711142946e-05, "loss": 0.3507, "loss_nan_ranks": 0, "loss_rank_avg": 0.3330328166484833, "step": 1350, "valid_targets_mean": 3935.3, "valid_targets_min": 826 }, { "epoch": 2.3688811188811187, "grad_norm": 0.543210210337472, "learning_rate": 3.348338613196678e-05, "loss": 0.3605, "loss_nan_ranks": 0, "loss_rank_avg": 0.37580981850624084, "step": 1355, "valid_targets_mean": 4101.4, "valid_targets_min": 1062 }, { "epoch": 2.3776223776223775, "grad_norm": 1.263978205574014, "learning_rate": 3.341885887557353e-05, "loss": 0.3516, "loss_nan_ranks": 0, "loss_rank_avg": 0.3562210500240326, "step": 1360, "valid_targets_mean": 3485.2, "valid_targets_min": 1030 }, { "epoch": 2.3863636363636362, "grad_norm": 0.5891510875039799, "learning_rate": 3.3354076568710715e-05, "loss": 0.3245, "loss_nan_ranks": 0, "loss_rank_avg": 0.29343318939208984, "step": 1365, "valid_targets_mean": 3082.8, "valid_targets_min": 745 }, { "epoch": 2.395104895104895, "grad_norm": 0.6049119497188193, "learning_rate": 3.328904044268705e-05, "loss": 0.3184, "loss_nan_ranks": 0, "loss_rank_avg": 0.3105580806732178, "step": 1370, "valid_targets_mean": 3080.9, "valid_targets_min": 774 }, { "epoch": 2.4038461538461537, "grad_norm": 0.5211424331279453, "learning_rate": 3.322375173363554e-05, "loss": 0.3088, "loss_nan_ranks": 0, "loss_rank_avg": 0.2609102129936218, "step": 1375, "valid_targets_mean": 3569.1, "valid_targets_min": 1052 }, { "epoch": 2.4125874125874125, "grad_norm": 0.4570911075451314, "learning_rate": 3.315821168249002e-05, "loss": 0.3583, "loss_nan_ranks": 0, "loss_rank_avg": 0.34511393308639526, "step": 1380, "valid_targets_mean": 5819.4, "valid_targets_min": 1308 }, { "epoch": 2.4213286713286712, "grad_norm": 0.6915681486907906, "learning_rate": 3.309242153496154e-05, "loss": 0.3087, "loss_nan_ranks": 0, "loss_rank_avg": 0.31641054153442383, "step": 1385, "valid_targets_mean": 2650.2, "valid_targets_min": 1219 }, { "epoch": 2.43006993006993, "grad_norm": 0.5044835103913676, "learning_rate": 3.3026382541514706e-05, "loss": 0.36, "loss_nan_ranks": 0, "loss_rank_avg": 0.3088311553001404, "step": 1390, "valid_targets_mean": 4296.8, "valid_targets_min": 1167 }, { "epoch": 2.4388111888111887, "grad_norm": 0.5352841239256858, "learning_rate": 3.29600959573439e-05, "loss": 0.3652, "loss_nan_ranks": 0, "loss_rank_avg": 0.3440842032432556, "step": 1395, "valid_targets_mean": 4173.2, "valid_targets_min": 1070 }, { "epoch": 2.4475524475524475, "grad_norm": 0.5386197966301163, "learning_rate": 3.289356304234942e-05, "loss": 0.3521, "loss_nan_ranks": 0, "loss_rank_avg": 0.2736024558544159, "step": 1400, "valid_targets_mean": 3539.0, "valid_targets_min": 942 }, { "epoch": 2.4562937062937062, "grad_norm": 0.5671969479135336, "learning_rate": 3.2826785061113564e-05, "loss": 0.3211, "loss_nan_ranks": 0, "loss_rank_avg": 0.3724323809146881, "step": 1405, "valid_targets_mean": 3864.0, "valid_targets_min": 1121 }, { "epoch": 2.465034965034965, "grad_norm": 0.5827298416516434, "learning_rate": 3.275976328287654e-05, "loss": 0.3485, "loss_nan_ranks": 0, "loss_rank_avg": 0.29571932554244995, "step": 1410, "valid_targets_mean": 3138.4, "valid_targets_min": 915 }, { "epoch": 2.4737762237762237, "grad_norm": 0.5047580511144616, "learning_rate": 3.269249898151241e-05, "loss": 0.3293, "loss_nan_ranks": 0, "loss_rank_avg": 0.3644856810569763, "step": 1415, "valid_targets_mean": 4450.2, "valid_targets_min": 1031 }, { "epoch": 2.4825174825174825, "grad_norm": 0.5540884026688192, "learning_rate": 3.262499343550481e-05, "loss": 0.333, "loss_nan_ranks": 0, "loss_rank_avg": 0.30576711893081665, "step": 1420, "valid_targets_mean": 3474.9, "valid_targets_min": 1176 }, { "epoch": 2.4912587412587412, "grad_norm": 0.6282355274552387, "learning_rate": 3.25572479279227e-05, "loss": 0.3045, "loss_nan_ranks": 0, "loss_rank_avg": 0.2186950147151947, "step": 1425, "valid_targets_mean": 2447.4, "valid_targets_min": 1368 }, { "epoch": 2.5, "grad_norm": 0.46532594589288007, "learning_rate": 3.2489263746395946e-05, "loss": 0.3, "loss_nan_ranks": 0, "loss_rank_avg": 0.2158913016319275, "step": 1430, "valid_targets_mean": 4137.2, "valid_targets_min": 1300 }, { "epoch": 2.5087412587412588, "grad_norm": 0.515624368170962, "learning_rate": 3.242104218309087e-05, "loss": 0.2997, "loss_nan_ranks": 0, "loss_rank_avg": 0.311441570520401, "step": 1435, "valid_targets_mean": 4209.9, "valid_targets_min": 1573 }, { "epoch": 2.5174825174825175, "grad_norm": 0.4745417190069869, "learning_rate": 3.235258453468566e-05, "loss": 0.3833, "loss_nan_ranks": 0, "loss_rank_avg": 0.4018992781639099, "step": 1440, "valid_targets_mean": 5670.8, "valid_targets_min": 913 }, { "epoch": 2.5262237762237763, "grad_norm": 0.5077390838148781, "learning_rate": 3.2283892102345753e-05, "loss": 0.3265, "loss_nan_ranks": 0, "loss_rank_avg": 0.335680216550827, "step": 1445, "valid_targets_mean": 4140.2, "valid_targets_min": 1754 }, { "epoch": 2.534965034965035, "grad_norm": 0.6332018264920871, "learning_rate": 3.2214966191699103e-05, "loss": 0.3041, "loss_nan_ranks": 0, "loss_rank_avg": 0.21595916152000427, "step": 1450, "valid_targets_mean": 2705.9, "valid_targets_min": 1154 }, { "epoch": 2.5437062937062938, "grad_norm": 0.48385050928663215, "learning_rate": 3.2145808112811346e-05, "loss": 0.3308, "loss_nan_ranks": 0, "loss_rank_avg": 0.2742727994918823, "step": 1455, "valid_targets_mean": 4247.0, "valid_targets_min": 745 }, { "epoch": 2.5524475524475525, "grad_norm": 0.5577007979771508, "learning_rate": 3.207641918016089e-05, "loss": 0.3286, "loss_nan_ranks": 0, "loss_rank_avg": 0.3233272135257721, "step": 1460, "valid_targets_mean": 3605.4, "valid_targets_min": 1827 }, { "epoch": 2.5611888111888113, "grad_norm": 0.5872688946896231, "learning_rate": 3.200680071261399e-05, "loss": 0.3435, "loss_nan_ranks": 0, "loss_rank_avg": 0.3883779048919678, "step": 1465, "valid_targets_mean": 4236.3, "valid_targets_min": 1237 }, { "epoch": 2.56993006993007, "grad_norm": 0.5103628984175301, "learning_rate": 3.1936954033399604e-05, "loss": 0.3338, "loss_nan_ranks": 0, "loss_rank_avg": 0.3114474415779114, "step": 1470, "valid_targets_mean": 4111.7, "valid_targets_min": 1671 }, { "epoch": 2.5786713286713288, "grad_norm": 0.540599739633964, "learning_rate": 3.1866880470084295e-05, "loss": 0.3184, "loss_nan_ranks": 0, "loss_rank_avg": 0.346377968788147, "step": 1475, "valid_targets_mean": 3915.7, "valid_targets_min": 1226 }, { "epoch": 2.5874125874125875, "grad_norm": 0.5182722420558209, "learning_rate": 3.1796581354546986e-05, "loss": 0.3422, "loss_nan_ranks": 0, "loss_rank_avg": 0.365431010723114, "step": 1480, "valid_targets_mean": 4607.2, "valid_targets_min": 1553 }, { "epoch": 2.5961538461538463, "grad_norm": 0.5325618536519481, "learning_rate": 3.172605802295363e-05, "loss": 0.3141, "loss_nan_ranks": 0, "loss_rank_avg": 0.3091772794723511, "step": 1485, "valid_targets_mean": 3804.9, "valid_targets_min": 1206 }, { "epoch": 2.604895104895105, "grad_norm": 0.5080776916603383, "learning_rate": 3.165531181573183e-05, "loss": 0.3577, "loss_nan_ranks": 0, "loss_rank_avg": 0.29155874252319336, "step": 1490, "valid_targets_mean": 3623.9, "valid_targets_min": 1234 }, { "epoch": 2.6136363636363638, "grad_norm": 0.5493133795695918, "learning_rate": 3.158434407754536e-05, "loss": 0.3224, "loss_nan_ranks": 0, "loss_rank_avg": 0.37722280621528625, "step": 1495, "valid_targets_mean": 4509.4, "valid_targets_min": 1005 }, { "epoch": 2.6223776223776225, "grad_norm": 0.4760962427482821, "learning_rate": 3.15131561572686e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.33894044160842896, "step": 1500, "valid_targets_mean": 5020.0, "valid_targets_min": 1178 }, { "epoch": 2.6311188811188813, "grad_norm": 0.5909610512631924, "learning_rate": 3.14417494079609e-05, "loss": 0.324, "loss_nan_ranks": 0, "loss_rank_avg": 0.2644537389278412, "step": 1505, "valid_targets_mean": 2790.8, "valid_targets_min": 1458 }, { "epoch": 2.63986013986014, "grad_norm": 0.4867929709499423, "learning_rate": 3.137012518684087e-05, "loss": 0.335, "loss_nan_ranks": 0, "loss_rank_avg": 0.3499234914779663, "step": 1510, "valid_targets_mean": 5411.1, "valid_targets_min": 844 }, { "epoch": 2.6486013986013988, "grad_norm": 0.6312052243485106, "learning_rate": 3.129828485526056e-05, "loss": 0.3713, "loss_nan_ranks": 0, "loss_rank_avg": 0.35967153310775757, "step": 1515, "valid_targets_mean": 4242.8, "valid_targets_min": 1373 }, { "epoch": 2.6573426573426575, "grad_norm": 0.4836028803777569, "learning_rate": 3.122622977867963e-05, "loss": 0.3551, "loss_nan_ranks": 0, "loss_rank_avg": 0.3933538794517517, "step": 1520, "valid_targets_mean": 6016.8, "valid_targets_min": 778 }, { "epoch": 2.666083916083916, "grad_norm": 0.48888711002835405, "learning_rate": 3.1153961326639364e-05, "loss": 0.3507, "loss_nan_ranks": 0, "loss_rank_avg": 0.3524247705936432, "step": 1525, "valid_targets_mean": 4931.2, "valid_targets_min": 1005 }, { "epoch": 2.674825174825175, "grad_norm": 0.6089357100371079, "learning_rate": 3.1081480872736625e-05, "loss": 0.3383, "loss_nan_ranks": 0, "loss_rank_avg": 0.44115176796913147, "step": 1530, "valid_targets_mean": 4462.6, "valid_targets_min": 1632 }, { "epoch": 2.6835664335664333, "grad_norm": 0.4578837646445128, "learning_rate": 3.1008789794597776e-05, "loss": 0.338, "loss_nan_ranks": 0, "loss_rank_avg": 0.351039856672287, "step": 1535, "valid_targets_mean": 5812.1, "valid_targets_min": 1240 }, { "epoch": 2.6923076923076925, "grad_norm": 0.41101789198349736, "learning_rate": 3.0935889473852504e-05, "loss": 0.3161, "loss_nan_ranks": 0, "loss_rank_avg": 0.27018117904663086, "step": 1540, "valid_targets_mean": 5820.7, "valid_targets_min": 937 }, { "epoch": 2.701048951048951, "grad_norm": 0.532122890158766, "learning_rate": 3.086278129610752e-05, "loss": 0.3155, "loss_nan_ranks": 0, "loss_rank_avg": 0.39900821447372437, "step": 1545, "valid_targets_mean": 5061.4, "valid_targets_min": 939 }, { "epoch": 2.70979020979021, "grad_norm": 0.558531282366923, "learning_rate": 3.078946665092026e-05, "loss": 0.3141, "loss_nan_ranks": 0, "loss_rank_avg": 0.24225279688835144, "step": 1550, "valid_targets_mean": 2957.4, "valid_targets_min": 1131 }, { "epoch": 2.7185314685314683, "grad_norm": 0.5109631555447813, "learning_rate": 3.071594693177245e-05, "loss": 0.3675, "loss_nan_ranks": 0, "loss_rank_avg": 0.4015381336212158, "step": 1555, "valid_targets_mean": 4465.8, "valid_targets_min": 828 }, { "epoch": 2.7272727272727275, "grad_norm": 0.536961938759069, "learning_rate": 3.064222353604364e-05, "loss": 0.3344, "loss_nan_ranks": 0, "loss_rank_avg": 0.278196781873703, "step": 1560, "valid_targets_mean": 3323.1, "valid_targets_min": 1201 }, { "epoch": 2.736013986013986, "grad_norm": 0.6246699552933006, "learning_rate": 3.056829786498462e-05, "loss": 0.3385, "loss_nan_ranks": 0, "loss_rank_avg": 0.3288848400115967, "step": 1565, "valid_targets_mean": 3083.0, "valid_targets_min": 430 }, { "epoch": 2.744755244755245, "grad_norm": 0.606461060216546, "learning_rate": 3.0494171323690806e-05, "loss": 0.3127, "loss_nan_ranks": 0, "loss_rank_avg": 0.2629588842391968, "step": 1570, "valid_targets_mean": 2680.1, "valid_targets_min": 1377 }, { "epoch": 2.7534965034965033, "grad_norm": 0.5680548667160676, "learning_rate": 3.041984532107554e-05, "loss": 0.3302, "loss_nan_ranks": 0, "loss_rank_avg": 0.23354268074035645, "step": 1575, "valid_targets_mean": 2878.9, "valid_targets_min": 1391 }, { "epoch": 2.762237762237762, "grad_norm": 0.4888929142446612, "learning_rate": 3.0345321269843277e-05, "loss": 0.3359, "loss_nan_ranks": 0, "loss_rank_avg": 0.3905789256095886, "step": 1580, "valid_targets_mean": 5311.2, "valid_targets_min": 894 }, { "epoch": 2.770979020979021, "grad_norm": 0.4913581565807214, "learning_rate": 3.0270600586462778e-05, "loss": 0.335, "loss_nan_ranks": 0, "loss_rank_avg": 0.3499818742275238, "step": 1585, "valid_targets_mean": 5184.2, "valid_targets_min": 1497 }, { "epoch": 2.7797202797202796, "grad_norm": 0.6229148339552479, "learning_rate": 3.019568469114015e-05, "loss": 0.3432, "loss_nan_ranks": 0, "loss_rank_avg": 0.4142291843891144, "step": 1590, "valid_targets_mean": 3948.3, "valid_targets_min": 1096 }, { "epoch": 2.7884615384615383, "grad_norm": 0.4869929533107764, "learning_rate": 3.012057500779187e-05, "loss": 0.3461, "loss_nan_ranks": 0, "loss_rank_avg": 0.3251883387565613, "step": 1595, "valid_targets_mean": 4624.6, "valid_targets_min": 1304 }, { "epoch": 2.797202797202797, "grad_norm": 0.5826642414041437, "learning_rate": 3.0045272964017716e-05, "loss": 0.343, "loss_nan_ranks": 0, "loss_rank_avg": 0.36511659622192383, "step": 1600, "valid_targets_mean": 4380.1, "valid_targets_min": 278 }, { "epoch": 2.805944055944056, "grad_norm": 0.519436625480804, "learning_rate": 2.996977999107365e-05, "loss": 0.3224, "loss_nan_ranks": 0, "loss_rank_avg": 0.34158188104629517, "step": 1605, "valid_targets_mean": 4013.6, "valid_targets_min": 1457 }, { "epoch": 2.8146853146853146, "grad_norm": 0.5696670222694973, "learning_rate": 2.989409752384458e-05, "loss": 0.3291, "loss_nan_ranks": 0, "loss_rank_avg": 0.3094896972179413, "step": 1610, "valid_targets_mean": 3533.7, "valid_targets_min": 991 }, { "epoch": 2.8234265734265733, "grad_norm": 0.5347638782980102, "learning_rate": 2.9818227000817118e-05, "loss": 0.3289, "loss_nan_ranks": 0, "loss_rank_avg": 0.28824296593666077, "step": 1615, "valid_targets_mean": 3428.8, "valid_targets_min": 1488 }, { "epoch": 2.832167832167832, "grad_norm": 0.5142694431369366, "learning_rate": 2.9742169864052228e-05, "loss": 0.3058, "loss_nan_ranks": 0, "loss_rank_avg": 0.33047711849212646, "step": 1620, "valid_targets_mean": 3887.8, "valid_targets_min": 1383 }, { "epoch": 2.840909090909091, "grad_norm": 0.5251206238823921, "learning_rate": 2.9665927559157806e-05, "loss": 0.3305, "loss_nan_ranks": 0, "loss_rank_avg": 0.36617588996887207, "step": 1625, "valid_targets_mean": 5211.3, "valid_targets_min": 900 }, { "epoch": 2.8496503496503496, "grad_norm": 0.6372098783365453, "learning_rate": 2.9589501535261225e-05, "loss": 0.3314, "loss_nan_ranks": 0, "loss_rank_avg": 0.3497511148452759, "step": 1630, "valid_targets_mean": 2946.0, "valid_targets_min": 867 }, { "epoch": 2.8583916083916083, "grad_norm": 0.50501773040429, "learning_rate": 2.9512893244981787e-05, "loss": 0.3475, "loss_nan_ranks": 0, "loss_rank_avg": 0.32178816199302673, "step": 1635, "valid_targets_mean": 4174.2, "valid_targets_min": 1037 }, { "epoch": 2.867132867132867, "grad_norm": 0.6092809892942609, "learning_rate": 2.9436104144403077e-05, "loss": 0.3566, "loss_nan_ranks": 0, "loss_rank_avg": 0.37956398725509644, "step": 1640, "valid_targets_mean": 3658.4, "valid_targets_min": 1280 }, { "epoch": 2.875874125874126, "grad_norm": 0.49333402495352063, "learning_rate": 2.935913569304535e-05, "loss": 0.3413, "loss_nan_ranks": 0, "loss_rank_avg": 0.31394535303115845, "step": 1645, "valid_targets_mean": 4416.7, "valid_targets_min": 1183 }, { "epoch": 2.8846153846153846, "grad_norm": 0.6289070209634252, "learning_rate": 2.9281989353837746e-05, "loss": 0.3338, "loss_nan_ranks": 0, "loss_rank_avg": 0.2899363338947296, "step": 1650, "valid_targets_mean": 2902.4, "valid_targets_min": 1459 }, { "epoch": 2.8933566433566433, "grad_norm": 0.889407629295206, "learning_rate": 2.9204666593090497e-05, "loss": 0.3377, "loss_nan_ranks": 0, "loss_rank_avg": 0.40736573934555054, "step": 1655, "valid_targets_mean": 3440.2, "valid_targets_min": 1080 }, { "epoch": 2.902097902097902, "grad_norm": 0.5530560757360455, "learning_rate": 2.9127168880467046e-05, "loss": 0.3024, "loss_nan_ranks": 0, "loss_rank_avg": 0.23936739563941956, "step": 1660, "valid_targets_mean": 2988.8, "valid_targets_min": 1192 }, { "epoch": 2.910839160839161, "grad_norm": 0.4627722312735592, "learning_rate": 2.904949768895613e-05, "loss": 0.3629, "loss_nan_ranks": 0, "loss_rank_avg": 0.38242220878601074, "step": 1665, "valid_targets_mean": 5788.4, "valid_targets_min": 1672 }, { "epoch": 2.9195804195804196, "grad_norm": 0.5282100795632996, "learning_rate": 2.8971654494843787e-05, "loss": 0.3452, "loss_nan_ranks": 0, "loss_rank_avg": 0.3152114748954773, "step": 1670, "valid_targets_mean": 3547.1, "valid_targets_min": 1059 }, { "epoch": 2.9283216783216783, "grad_norm": 0.5555470512379443, "learning_rate": 2.8893640777685262e-05, "loss": 0.3549, "loss_nan_ranks": 0, "loss_rank_avg": 0.2666780948638916, "step": 1675, "valid_targets_mean": 2986.2, "valid_targets_min": 1327 }, { "epoch": 2.937062937062937, "grad_norm": 0.73170673641065, "learning_rate": 2.8815458020276926e-05, "loss": 0.3402, "loss_nan_ranks": 0, "loss_rank_avg": 0.34276720881462097, "step": 1680, "valid_targets_mean": 3467.1, "valid_targets_min": 1189 }, { "epoch": 2.945804195804196, "grad_norm": 0.5551173357470257, "learning_rate": 2.873710770862808e-05, "loss": 0.2935, "loss_nan_ranks": 0, "loss_rank_avg": 0.39830976724624634, "step": 1685, "valid_targets_mean": 4390.9, "valid_targets_min": 1355 }, { "epoch": 2.9545454545454546, "grad_norm": 0.5429468572998486, "learning_rate": 2.865859133193269e-05, "loss": 0.3495, "loss_nan_ranks": 0, "loss_rank_avg": 0.35579365491867065, "step": 1690, "valid_targets_mean": 4104.4, "valid_targets_min": 867 }, { "epoch": 2.9632867132867133, "grad_norm": 0.588815970444589, "learning_rate": 2.857991038254111e-05, "loss": 0.3557, "loss_nan_ranks": 0, "loss_rank_avg": 0.29141175746917725, "step": 1695, "valid_targets_mean": 2931.9, "valid_targets_min": 831 }, { "epoch": 2.972027972027972, "grad_norm": 0.530558546752831, "learning_rate": 2.8501066355931706e-05, "loss": 0.3188, "loss_nan_ranks": 0, "loss_rank_avg": 0.2682480812072754, "step": 1700, "valid_targets_mean": 3245.7, "valid_targets_min": 923 }, { "epoch": 2.980769230769231, "grad_norm": 0.5237411811728068, "learning_rate": 2.8422060750682415e-05, "loss": 0.3317, "loss_nan_ranks": 0, "loss_rank_avg": 0.32749104499816895, "step": 1705, "valid_targets_mean": 3853.8, "valid_targets_min": 1482 }, { "epoch": 2.9895104895104896, "grad_norm": 0.5573031127069092, "learning_rate": 2.8342895068442294e-05, "loss": 0.3687, "loss_nan_ranks": 0, "loss_rank_avg": 0.4529867172241211, "step": 1710, "valid_targets_mean": 5293.9, "valid_targets_min": 880 }, { "epoch": 2.9982517482517483, "grad_norm": 0.5866186073439474, "learning_rate": 2.8263570813902964e-05, "loss": 0.3628, "loss_nan_ranks": 0, "loss_rank_avg": 0.4375874400138855, "step": 1715, "valid_targets_mean": 4802.0, "valid_targets_min": 1091 }, { "epoch": 3.006993006993007, "grad_norm": 0.5593741909162024, "learning_rate": 2.8184089494769996e-05, "loss": 0.336, "loss_nan_ranks": 0, "loss_rank_avg": 0.30689311027526855, "step": 1720, "valid_targets_mean": 3870.9, "valid_targets_min": 1023 }, { "epoch": 3.015734265734266, "grad_norm": 0.6875702773552215, "learning_rate": 2.8104452621734276e-05, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.24441856145858765, "step": 1725, "valid_targets_mean": 2328.2, "valid_targets_min": 785 }, { "epoch": 3.0244755244755246, "grad_norm": 0.6701000204338885, "learning_rate": 2.8024661708443283e-05, "loss": 0.3066, "loss_nan_ranks": 0, "loss_rank_avg": 0.27847230434417725, "step": 1730, "valid_targets_mean": 2640.6, "valid_targets_min": 1097 }, { "epoch": 3.0332167832167833, "grad_norm": 0.5561404654820966, "learning_rate": 2.7944718271472307e-05, "loss": 0.3239, "loss_nan_ranks": 0, "loss_rank_avg": 0.2966724634170532, "step": 1735, "valid_targets_mean": 3719.1, "valid_targets_min": 1431 }, { "epoch": 3.041958041958042, "grad_norm": 0.5474562888952275, "learning_rate": 2.7864623830295644e-05, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.2625727951526642, "step": 1740, "valid_targets_mean": 3559.9, "valid_targets_min": 1339 }, { "epoch": 3.050699300699301, "grad_norm": 0.5467537174092281, "learning_rate": 2.778437990725772e-05, "loss": 0.3275, "loss_nan_ranks": 0, "loss_rank_avg": 0.32522091269493103, "step": 1745, "valid_targets_mean": 3952.1, "valid_targets_min": 1306 }, { "epoch": 3.0594405594405596, "grad_norm": 0.5837961644003972, "learning_rate": 2.770398802754411e-05, "loss": 0.3025, "loss_nan_ranks": 0, "loss_rank_avg": 0.27994534373283386, "step": 1750, "valid_targets_mean": 3050.2, "valid_targets_min": 1634 }, { "epoch": 3.0681818181818183, "grad_norm": 0.5722932789937027, "learning_rate": 2.762344971915261e-05, "loss": 0.2907, "loss_nan_ranks": 0, "loss_rank_avg": 0.3312224745750427, "step": 1755, "valid_targets_mean": 4157.8, "valid_targets_min": 1501 }, { "epoch": 3.076923076923077, "grad_norm": 0.5310388929296251, "learning_rate": 2.754276651286417e-05, "loss": 0.3043, "loss_nan_ranks": 0, "loss_rank_avg": 0.2896951735019684, "step": 1760, "valid_targets_mean": 3732.2, "valid_targets_min": 765 }, { "epoch": 3.085664335664336, "grad_norm": 0.5520914848544317, "learning_rate": 2.7461939942213764e-05, "loss": 0.3191, "loss_nan_ranks": 0, "loss_rank_avg": 0.2980251908302307, "step": 1765, "valid_targets_mean": 4002.0, "valid_targets_min": 1123 }, { "epoch": 3.0944055944055946, "grad_norm": 0.6542055095053531, "learning_rate": 2.7380971543461297e-05, "loss": 0.3217, "loss_nan_ranks": 0, "loss_rank_avg": 0.29861879348754883, "step": 1770, "valid_targets_mean": 5110.6, "valid_targets_min": 1737 }, { "epoch": 3.1031468531468533, "grad_norm": 0.5594852097545516, "learning_rate": 2.7299862855562388e-05, "loss": 0.344, "loss_nan_ranks": 0, "loss_rank_avg": 0.35483282804489136, "step": 1775, "valid_targets_mean": 4066.8, "valid_targets_min": 1142 }, { "epoch": 3.111888111888112, "grad_norm": 0.5118972220091799, "learning_rate": 2.7218615420139087e-05, "loss": 0.3169, "loss_nan_ranks": 0, "loss_rank_avg": 0.26075172424316406, "step": 1780, "valid_targets_mean": 3815.4, "valid_targets_min": 1091 }, { "epoch": 3.120629370629371, "grad_norm": 0.5806431136298092, "learning_rate": 2.7137230781450622e-05, "loss": 0.2855, "loss_nan_ranks": 0, "loss_rank_avg": 0.22283409535884857, "step": 1785, "valid_targets_mean": 2682.1, "valid_targets_min": 1586 }, { "epoch": 3.129370629370629, "grad_norm": 0.6888048962906062, "learning_rate": 2.705571048636402e-05, "loss": 0.324, "loss_nan_ranks": 0, "loss_rank_avg": 0.3880237936973572, "step": 1790, "valid_targets_mean": 4161.1, "valid_targets_min": 865 }, { "epoch": 3.138111888111888, "grad_norm": 0.5897865617319268, "learning_rate": 2.6974056084324714e-05, "loss": 0.2689, "loss_nan_ranks": 0, "loss_rank_avg": 0.19622839987277985, "step": 1795, "valid_targets_mean": 2572.1, "valid_targets_min": 1043 }, { "epoch": 3.1468531468531467, "grad_norm": 0.5139881969438773, "learning_rate": 2.689226912732708e-05, "loss": 0.3195, "loss_nan_ranks": 0, "loss_rank_avg": 0.310763955116272, "step": 1800, "valid_targets_mean": 4432.8, "valid_targets_min": 1740 }, { "epoch": 3.1555944055944054, "grad_norm": 0.6327514647943825, "learning_rate": 2.681035116988495e-05, "loss": 0.2854, "loss_nan_ranks": 0, "loss_rank_avg": 0.2328225076198578, "step": 1805, "valid_targets_mean": 2745.8, "valid_targets_min": 1203 }, { "epoch": 3.164335664335664, "grad_norm": 0.5786087357328902, "learning_rate": 2.672830376900207e-05, "loss": 0.2758, "loss_nan_ranks": 0, "loss_rank_avg": 0.21883933246135712, "step": 1810, "valid_targets_mean": 2616.9, "valid_targets_min": 791 }, { "epoch": 3.173076923076923, "grad_norm": 0.5982326471685516, "learning_rate": 2.6646128484142496e-05, "loss": 0.2805, "loss_nan_ranks": 0, "loss_rank_avg": 0.2592069208621979, "step": 1815, "valid_targets_mean": 2841.3, "valid_targets_min": 769 }, { "epoch": 3.1818181818181817, "grad_norm": 0.5077262037530513, "learning_rate": 2.6563826877200973e-05, "loss": 0.3337, "loss_nan_ranks": 0, "loss_rank_avg": 0.305428147315979, "step": 1820, "valid_targets_mean": 4644.9, "valid_targets_min": 870 }, { "epoch": 3.1905594405594404, "grad_norm": 0.5277249384140703, "learning_rate": 2.6481400512473216e-05, "loss": 0.3314, "loss_nan_ranks": 0, "loss_rank_avg": 0.3702384829521179, "step": 1825, "valid_targets_mean": 4858.6, "valid_targets_min": 1258 }, { "epoch": 3.199300699300699, "grad_norm": 0.5934305740478432, "learning_rate": 2.6398850956626185e-05, "loss": 0.3159, "loss_nan_ranks": 0, "loss_rank_avg": 0.3127822279930115, "step": 1830, "valid_targets_mean": 3075.4, "valid_targets_min": 1248 }, { "epoch": 3.208041958041958, "grad_norm": 0.5556627340017823, "learning_rate": 2.6316179778668342e-05, "loss": 0.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.27353787422180176, "step": 1835, "valid_targets_mean": 3647.0, "valid_targets_min": 875 }, { "epoch": 3.2167832167832167, "grad_norm": 0.6769529052233687, "learning_rate": 2.62333885499198e-05, "loss": 0.2963, "loss_nan_ranks": 0, "loss_rank_avg": 0.2421294003725052, "step": 1840, "valid_targets_mean": 2436.8, "valid_targets_min": 795 }, { "epoch": 3.2255244755244754, "grad_norm": 0.5674592394416891, "learning_rate": 2.6150478843982442e-05, "loss": 0.276, "loss_nan_ranks": 0, "loss_rank_avg": 0.2963680922985077, "step": 1845, "valid_targets_mean": 3300.4, "valid_targets_min": 1277 }, { "epoch": 3.234265734265734, "grad_norm": 0.4952708038181234, "learning_rate": 2.606745223671005e-05, "loss": 0.3533, "loss_nan_ranks": 0, "loss_rank_avg": 0.4648565649986267, "step": 1850, "valid_targets_mean": 6469.8, "valid_targets_min": 869 }, { "epoch": 3.243006993006993, "grad_norm": 0.503186087950448, "learning_rate": 2.5984310306178326e-05, "loss": 0.3144, "loss_nan_ranks": 0, "loss_rank_avg": 0.3806156516075134, "step": 1855, "valid_targets_mean": 5322.2, "valid_targets_min": 1201 }, { "epoch": 3.2517482517482517, "grad_norm": 0.5743530413508324, "learning_rate": 2.5901054632654915e-05, "loss": 0.3232, "loss_nan_ranks": 0, "loss_rank_avg": 0.3227553963661194, "step": 1860, "valid_targets_mean": 3967.1, "valid_targets_min": 911 }, { "epoch": 3.2604895104895104, "grad_norm": 0.5653915692401206, "learning_rate": 2.5817686798569344e-05, "loss": 0.3773, "loss_nan_ranks": 0, "loss_rank_avg": 0.45867377519607544, "step": 1865, "valid_targets_mean": 5937.1, "valid_targets_min": 1105 }, { "epoch": 3.269230769230769, "grad_norm": 0.5756883469118854, "learning_rate": 2.5734208388482978e-05, "loss": 0.3006, "loss_nan_ranks": 0, "loss_rank_avg": 0.24555999040603638, "step": 1870, "valid_targets_mean": 2718.0, "valid_targets_min": 956 }, { "epoch": 3.277972027972028, "grad_norm": 0.5740807872776593, "learning_rate": 2.565062098905887e-05, "loss": 0.3458, "loss_nan_ranks": 0, "loss_rank_avg": 0.2976549565792084, "step": 1875, "valid_targets_mean": 3536.9, "valid_targets_min": 1558 }, { "epoch": 3.2867132867132867, "grad_norm": 0.5351814557204507, "learning_rate": 2.556692618903163e-05, "loss": 0.2878, "loss_nan_ranks": 0, "loss_rank_avg": 0.23402386903762817, "step": 1880, "valid_targets_mean": 3553.0, "valid_targets_min": 1245 }, { "epoch": 3.2954545454545454, "grad_norm": 0.5347095217029892, "learning_rate": 2.548312557917721e-05, "loss": 0.3092, "loss_nan_ranks": 0, "loss_rank_avg": 0.37455683946609497, "step": 1885, "valid_targets_mean": 4354.1, "valid_targets_min": 1197 }, { "epoch": 3.304195804195804, "grad_norm": 0.5087532787953783, "learning_rate": 2.539922075228269e-05, "loss": 0.3, "loss_nan_ranks": 0, "loss_rank_avg": 0.28234240412712097, "step": 1890, "valid_targets_mean": 4121.2, "valid_targets_min": 1014 }, { "epoch": 3.312937062937063, "grad_norm": 0.6003931803373139, "learning_rate": 2.5315213303115965e-05, "loss": 0.3228, "loss_nan_ranks": 0, "loss_rank_avg": 0.31622016429901123, "step": 1895, "valid_targets_mean": 3575.1, "valid_targets_min": 1184 }, { "epoch": 3.3216783216783217, "grad_norm": 0.5324200090699127, "learning_rate": 2.5231104828395482e-05, "loss": 0.3376, "loss_nan_ranks": 0, "loss_rank_avg": 0.43272459506988525, "step": 1900, "valid_targets_mean": 4967.6, "valid_targets_min": 970 }, { "epoch": 3.3304195804195804, "grad_norm": 0.4644604979173125, "learning_rate": 2.5146896926759846e-05, "loss": 0.3405, "loss_nan_ranks": 0, "loss_rank_avg": 0.26517045497894287, "step": 1905, "valid_targets_mean": 4802.2, "valid_targets_min": 465 }, { "epoch": 3.339160839160839, "grad_norm": 0.5567107972295677, "learning_rate": 2.506259119873747e-05, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.2603760361671448, "step": 1910, "valid_targets_mean": 3453.2, "valid_targets_min": 1046 }, { "epoch": 3.347902097902098, "grad_norm": 0.5824511685174325, "learning_rate": 2.4978189246716138e-05, "loss": 0.3317, "loss_nan_ranks": 0, "loss_rank_avg": 0.3032684624195099, "step": 1915, "valid_targets_mean": 3675.1, "valid_targets_min": 1394 }, { "epoch": 3.3566433566433567, "grad_norm": 0.562852289563815, "learning_rate": 2.4893692674912546e-05, "loss": 0.3148, "loss_nan_ranks": 0, "loss_rank_avg": 0.27050256729125977, "step": 1920, "valid_targets_mean": 3446.0, "valid_targets_min": 1239 }, { "epoch": 3.3653846153846154, "grad_norm": 0.4985979591826673, "learning_rate": 2.480910308934182e-05, "loss": 0.3332, "loss_nan_ranks": 0, "loss_rank_avg": 0.3425469994544983, "step": 1925, "valid_targets_mean": 5447.1, "valid_targets_min": 1395 }, { "epoch": 3.374125874125874, "grad_norm": 0.5319686306642291, "learning_rate": 2.4724422097787e-05, "loss": 0.3131, "loss_nan_ranks": 0, "loss_rank_avg": 0.33209139108657837, "step": 1930, "valid_targets_mean": 4106.9, "valid_targets_min": 1241 }, { "epoch": 3.382867132867133, "grad_norm": 0.5452257512149177, "learning_rate": 2.463965130976843e-05, "loss": 0.3127, "loss_nan_ranks": 0, "loss_rank_avg": 0.25301462411880493, "step": 1935, "valid_targets_mean": 3712.9, "valid_targets_min": 1248 }, { "epoch": 3.3916083916083917, "grad_norm": 0.5994620335296995, "learning_rate": 2.455479233651324e-05, "loss": 0.3094, "loss_nan_ranks": 0, "loss_rank_avg": 0.3276280164718628, "step": 1940, "valid_targets_mean": 3709.6, "valid_targets_min": 1363 }, { "epoch": 3.4003496503496504, "grad_norm": 0.6461501673593458, "learning_rate": 2.4469846790924665e-05, "loss": 0.3061, "loss_nan_ranks": 0, "loss_rank_avg": 0.29547345638275146, "step": 1945, "valid_targets_mean": 2801.9, "valid_targets_min": 942 }, { "epoch": 3.409090909090909, "grad_norm": 0.6637610589856805, "learning_rate": 2.4384816287551417e-05, "loss": 0.3183, "loss_nan_ranks": 0, "loss_rank_avg": 0.2376343160867691, "step": 1950, "valid_targets_mean": 3314.5, "valid_targets_min": 844 }, { "epoch": 3.417832167832168, "grad_norm": 0.5781629714916717, "learning_rate": 2.429970244255699e-05, "loss": 0.3443, "loss_nan_ranks": 0, "loss_rank_avg": 0.4136093854904175, "step": 1955, "valid_targets_mean": 4240.6, "valid_targets_min": 904 }, { "epoch": 3.4265734265734267, "grad_norm": 0.6348556096389305, "learning_rate": 2.421450687368893e-05, "loss": 0.3334, "loss_nan_ranks": 0, "loss_rank_avg": 0.25327175855636597, "step": 1960, "valid_targets_mean": 2663.6, "valid_targets_min": 1247 }, { "epoch": 3.4353146853146854, "grad_norm": 0.5470950021821281, "learning_rate": 2.4129231200248127e-05, "loss": 0.2898, "loss_nan_ranks": 0, "loss_rank_avg": 0.31240352988243103, "step": 1965, "valid_targets_mean": 3655.2, "valid_targets_min": 844 }, { "epoch": 3.444055944055944, "grad_norm": 0.545174136340182, "learning_rate": 2.4043877043057967e-05, "loss": 0.3037, "loss_nan_ranks": 0, "loss_rank_avg": 0.3076508343219757, "step": 1970, "valid_targets_mean": 3656.6, "valid_targets_min": 1120 }, { "epoch": 3.452797202797203, "grad_norm": 0.548675450396162, "learning_rate": 2.3958446024433594e-05, "loss": 0.2763, "loss_nan_ranks": 0, "loss_rank_avg": 0.26705825328826904, "step": 1975, "valid_targets_mean": 3810.5, "valid_targets_min": 1198 }, { "epoch": 3.4615384615384617, "grad_norm": 0.5451879746136353, "learning_rate": 2.387293976815104e-05, "loss": 0.2967, "loss_nan_ranks": 0, "loss_rank_avg": 0.31972768902778625, "step": 1980, "valid_targets_mean": 4197.5, "valid_targets_min": 1083 }, { "epoch": 3.4702797202797204, "grad_norm": 0.5581621250486566, "learning_rate": 2.3787359899416368e-05, "loss": 0.3082, "loss_nan_ranks": 0, "loss_rank_avg": 0.3593602776527405, "step": 1985, "valid_targets_mean": 4509.0, "valid_targets_min": 1340 }, { "epoch": 3.479020979020979, "grad_norm": 0.7071170505697403, "learning_rate": 2.370170804483477e-05, "loss": 0.3123, "loss_nan_ranks": 0, "loss_rank_avg": 0.363255113363266, "step": 1990, "valid_targets_mean": 4484.3, "valid_targets_min": 988 }, { "epoch": 3.487762237762238, "grad_norm": 0.5953191456261493, "learning_rate": 2.3615985832379712e-05, "loss": 0.3395, "loss_nan_ranks": 0, "loss_rank_avg": 0.39135444164276123, "step": 1995, "valid_targets_mean": 4099.6, "valid_targets_min": 838 }, { "epoch": 3.4965034965034967, "grad_norm": 0.6266903019082694, "learning_rate": 2.353019489136188e-05, "loss": 0.3184, "loss_nan_ranks": 0, "loss_rank_avg": 0.35590970516204834, "step": 2000, "valid_targets_mean": 3606.8, "valid_targets_min": 934 }, { "epoch": 3.505244755244755, "grad_norm": 0.4764377794762096, "learning_rate": 2.344433685239831e-05, "loss": 0.329, "loss_nan_ranks": 0, "loss_rank_avg": 0.3431362509727478, "step": 2005, "valid_targets_mean": 6622.6, "valid_targets_min": 1105 }, { "epoch": 3.513986013986014, "grad_norm": 0.6304170909454058, "learning_rate": 2.335841334738136e-05, "loss": 0.3164, "loss_nan_ranks": 0, "loss_rank_avg": 0.29519712924957275, "step": 2010, "valid_targets_mean": 4467.6, "valid_targets_min": 1355 }, { "epoch": 3.5227272727272725, "grad_norm": 0.490952302275404, "learning_rate": 2.3272426009447672e-05, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.2910092771053314, "step": 2015, "valid_targets_mean": 5033.2, "valid_targets_min": 1287 }, { "epoch": 3.5314685314685317, "grad_norm": 0.6155323428675108, "learning_rate": 2.3186376472947168e-05, "loss": 0.3064, "loss_nan_ranks": 0, "loss_rank_avg": 0.2902764678001404, "step": 2020, "valid_targets_mean": 2894.0, "valid_targets_min": 740 }, { "epoch": 3.54020979020979, "grad_norm": 0.6025591175683395, "learning_rate": 2.3100266373411974e-05, "loss": 0.3453, "loss_nan_ranks": 0, "loss_rank_avg": 0.4039961099624634, "step": 2025, "valid_targets_mean": 4974.3, "valid_targets_min": 1085 }, { "epoch": 3.548951048951049, "grad_norm": 0.6541300455848044, "learning_rate": 2.3014097347525318e-05, "loss": 0.3228, "loss_nan_ranks": 0, "loss_rank_avg": 0.3308113217353821, "step": 2030, "valid_targets_mean": 2943.2, "valid_targets_min": 370 }, { "epoch": 3.5576923076923075, "grad_norm": 0.5772386978918906, "learning_rate": 2.292787103309044e-05, "loss": 0.313, "loss_nan_ranks": 0, "loss_rank_avg": 0.34256115555763245, "step": 2035, "valid_targets_mean": 3433.4, "valid_targets_min": 1081 }, { "epoch": 3.5664335664335667, "grad_norm": 0.5104371056143377, "learning_rate": 2.2841589068999458e-05, "loss": 0.3112, "loss_nan_ranks": 0, "loss_rank_avg": 0.2974053621292114, "step": 2040, "valid_targets_mean": 4280.6, "valid_targets_min": 1377 }, { "epoch": 3.575174825174825, "grad_norm": 0.537050676241048, "learning_rate": 2.2755253095202197e-05, "loss": 0.3329, "loss_nan_ranks": 0, "loss_rank_avg": 0.3554688096046448, "step": 2045, "valid_targets_mean": 4372.0, "valid_targets_min": 1054 }, { "epoch": 3.583916083916084, "grad_norm": 0.5208129965095871, "learning_rate": 2.2668864752675067e-05, "loss": 0.2975, "loss_nan_ranks": 0, "loss_rank_avg": 0.36728352308273315, "step": 2050, "valid_targets_mean": 4518.3, "valid_targets_min": 1222 }, { "epoch": 3.5926573426573425, "grad_norm": 0.5363774636487812, "learning_rate": 2.2582425683389815e-05, "loss": 0.3007, "loss_nan_ranks": 0, "loss_rank_avg": 0.2853674292564392, "step": 2055, "valid_targets_mean": 3562.8, "valid_targets_min": 632 }, { "epoch": 3.6013986013986012, "grad_norm": 0.5865618188816509, "learning_rate": 2.2495937530282368e-05, "loss": 0.3391, "loss_nan_ranks": 0, "loss_rank_avg": 0.34035515785217285, "step": 2060, "valid_targets_mean": 4121.7, "valid_targets_min": 778 }, { "epoch": 3.61013986013986, "grad_norm": 0.6378564206491916, "learning_rate": 2.240940193722157e-05, "loss": 0.3218, "loss_nan_ranks": 0, "loss_rank_avg": 0.33596569299697876, "step": 2065, "valid_targets_mean": 3544.1, "valid_targets_min": 295 }, { "epoch": 3.6188811188811187, "grad_norm": 0.8804204695385472, "learning_rate": 2.232282054897795e-05, "loss": 0.3141, "loss_nan_ranks": 0, "loss_rank_avg": 0.3685414791107178, "step": 2070, "valid_targets_mean": 3786.0, "valid_targets_min": 948 }, { "epoch": 3.6276223776223775, "grad_norm": 4.564250479592216, "learning_rate": 2.2236195011192465e-05, "loss": 0.309, "loss_nan_ranks": 0, "loss_rank_avg": 0.2899073362350464, "step": 2075, "valid_targets_mean": 3357.1, "valid_targets_min": 1336 }, { "epoch": 3.6363636363636362, "grad_norm": 0.635900091215057, "learning_rate": 2.2149526970345206e-05, "loss": 0.3144, "loss_nan_ranks": 0, "loss_rank_avg": 0.30170345306396484, "step": 2080, "valid_targets_mean": 2948.2, "valid_targets_min": 730 }, { "epoch": 3.645104895104895, "grad_norm": 0.5582750079594184, "learning_rate": 2.2062818073724132e-05, "loss": 0.2988, "loss_nan_ranks": 0, "loss_rank_avg": 0.24713920056819916, "step": 2085, "valid_targets_mean": 3688.3, "valid_targets_min": 1570 }, { "epoch": 3.6538461538461537, "grad_norm": 0.5603245581882423, "learning_rate": 2.197606996939373e-05, "loss": 0.3181, "loss_nan_ranks": 0, "loss_rank_avg": 0.3602690100669861, "step": 2090, "valid_targets_mean": 5358.8, "valid_targets_min": 1278 }, { "epoch": 3.6625874125874125, "grad_norm": 0.4738594919894474, "learning_rate": 2.1889284306163705e-05, "loss": 0.2993, "loss_nan_ranks": 0, "loss_rank_avg": 0.30577272176742554, "step": 2095, "valid_targets_mean": 4808.5, "valid_targets_min": 408 }, { "epoch": 3.6713286713286712, "grad_norm": 0.6366766240922407, "learning_rate": 2.1802462733557633e-05, "loss": 0.3392, "loss_nan_ranks": 0, "loss_rank_avg": 0.3579673767089844, "step": 2100, "valid_targets_mean": 5506.0, "valid_targets_min": 897 }, { "epoch": 3.68006993006993, "grad_norm": 0.6139697875303248, "learning_rate": 2.1715606901781632e-05, "loss": 0.3237, "loss_nan_ranks": 0, "loss_rank_avg": 0.33977657556533813, "step": 2105, "valid_targets_mean": 4469.7, "valid_targets_min": 813 }, { "epoch": 3.6888111888111887, "grad_norm": 0.5475120095818063, "learning_rate": 2.1628718461692958e-05, "loss": 0.2856, "loss_nan_ranks": 0, "loss_rank_avg": 0.2815313935279846, "step": 2110, "valid_targets_mean": 3470.9, "valid_targets_min": 1034 }, { "epoch": 3.6975524475524475, "grad_norm": 0.64206791153299, "learning_rate": 2.1541799064768657e-05, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.27947911620140076, "step": 2115, "valid_targets_mean": 2544.1, "valid_targets_min": 1200 }, { "epoch": 3.7062937062937062, "grad_norm": 0.5642192836007337, "learning_rate": 2.1454850363074185e-05, "loss": 0.3429, "loss_nan_ranks": 0, "loss_rank_avg": 0.26924845576286316, "step": 2120, "valid_targets_mean": 3421.4, "valid_targets_min": 700 }, { "epoch": 3.715034965034965, "grad_norm": 0.5687312412041607, "learning_rate": 2.1367874009231952e-05, "loss": 0.3134, "loss_nan_ranks": 0, "loss_rank_avg": 0.3756811022758484, "step": 2125, "valid_targets_mean": 4092.6, "valid_targets_min": 1091 }, { "epoch": 3.7237762237762237, "grad_norm": 0.5254319030668086, "learning_rate": 2.128087165638999e-05, "loss": 0.3382, "loss_nan_ranks": 0, "loss_rank_avg": 0.295890212059021, "step": 2130, "valid_targets_mean": 4654.0, "valid_targets_min": 1198 }, { "epoch": 3.7325174825174825, "grad_norm": 0.507350094446985, "learning_rate": 2.119384495819047e-05, "loss": 0.3169, "loss_nan_ranks": 0, "loss_rank_avg": 0.34149473905563354, "step": 2135, "valid_targets_mean": 4297.9, "valid_targets_min": 286 }, { "epoch": 3.7412587412587412, "grad_norm": 0.5874873776278813, "learning_rate": 2.1106795568738282e-05, "loss": 0.3242, "loss_nan_ranks": 0, "loss_rank_avg": 0.29470622539520264, "step": 2140, "valid_targets_mean": 3362.8, "valid_targets_min": 1310 }, { "epoch": 3.75, "grad_norm": 0.6344178553130709, "learning_rate": 2.1019725142569624e-05, "loss": 0.3454, "loss_nan_ranks": 0, "loss_rank_avg": 0.3341315686702728, "step": 2145, "valid_targets_mean": 4382.1, "valid_targets_min": 363 }, { "epoch": 3.7587412587412588, "grad_norm": 1.224454305795279, "learning_rate": 2.0932635334620538e-05, "loss": 0.3285, "loss_nan_ranks": 0, "loss_rank_avg": 0.3387570083141327, "step": 2150, "valid_targets_mean": 3175.1, "valid_targets_min": 1080 }, { "epoch": 3.7674825174825175, "grad_norm": 0.4946950905437756, "learning_rate": 2.084552780019543e-05, "loss": 0.2918, "loss_nan_ranks": 0, "loss_rank_avg": 0.261683851480484, "step": 2155, "valid_targets_mean": 4516.0, "valid_targets_min": 740 }, { "epoch": 3.7762237762237763, "grad_norm": 0.5650252780634637, "learning_rate": 2.075840419493565e-05, "loss": 0.2844, "loss_nan_ranks": 0, "loss_rank_avg": 0.26833733916282654, "step": 2160, "valid_targets_mean": 3376.2, "valid_targets_min": 885 }, { "epoch": 3.784965034965035, "grad_norm": 0.5530808312399973, "learning_rate": 2.0671266174787993e-05, "loss": 0.3636, "loss_nan_ranks": 0, "loss_rank_avg": 0.3434409201145172, "step": 2165, "valid_targets_mean": 3988.6, "valid_targets_min": 1309 }, { "epoch": 3.7937062937062938, "grad_norm": 0.5785171812014174, "learning_rate": 2.0584115395973255e-05, "loss": 0.3515, "loss_nan_ranks": 0, "loss_rank_avg": 0.41139060258865356, "step": 2170, "valid_targets_mean": 4776.5, "valid_targets_min": 1094 }, { "epoch": 3.8024475524475525, "grad_norm": 0.45557991298431744, "learning_rate": 2.049695351495472e-05, "loss": 0.3466, "loss_nan_ranks": 0, "loss_rank_avg": 0.3612552285194397, "step": 2175, "valid_targets_mean": 5962.0, "valid_targets_min": 1323 }, { "epoch": 3.8111888111888113, "grad_norm": 0.62555155861987, "learning_rate": 2.0409782188406683e-05, "loss": 0.3349, "loss_nan_ranks": 0, "loss_rank_avg": 0.27812838554382324, "step": 2180, "valid_targets_mean": 2643.1, "valid_targets_min": 396 }, { "epoch": 3.81993006993007, "grad_norm": 0.6924523922525574, "learning_rate": 2.032260307318298e-05, "loss": 0.3308, "loss_nan_ranks": 0, "loss_rank_avg": 0.29945462942123413, "step": 2185, "valid_targets_mean": 3498.6, "valid_targets_min": 1210 }, { "epoch": 3.8286713286713288, "grad_norm": 0.6015653998125049, "learning_rate": 2.0235417826285488e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.2896122336387634, "step": 2190, "valid_targets_mean": 2937.8, "valid_targets_min": 938 }, { "epoch": 3.8374125874125875, "grad_norm": 0.5861252074236171, "learning_rate": 2.0148228104832614e-05, "loss": 0.3066, "loss_nan_ranks": 0, "loss_rank_avg": 0.2773173153400421, "step": 2195, "valid_targets_mean": 3218.1, "valid_targets_min": 1289 }, { "epoch": 3.8461538461538463, "grad_norm": 0.531620088389809, "learning_rate": 2.0061035566027828e-05, "loss": 0.323, "loss_nan_ranks": 0, "loss_rank_avg": 0.29950347542762756, "step": 2200, "valid_targets_mean": 3860.1, "valid_targets_min": 1100 }, { "epoch": 3.854895104895105, "grad_norm": 0.4886301358801487, "learning_rate": 1.9973841867128137e-05, "loss": 0.3281, "loss_nan_ranks": 0, "loss_rank_avg": 0.36873340606689453, "step": 2205, "valid_targets_mean": 5673.1, "valid_targets_min": 437 }, { "epoch": 3.8636363636363638, "grad_norm": 0.5784230025210767, "learning_rate": 1.9886648665412612e-05, "loss": 0.3036, "loss_nan_ranks": 0, "loss_rank_avg": 0.36677759885787964, "step": 2210, "valid_targets_mean": 3799.9, "valid_targets_min": 885 }, { "epoch": 3.8723776223776225, "grad_norm": 0.6969081154876361, "learning_rate": 1.9799457618150847e-05, "loss": 0.3197, "loss_nan_ranks": 0, "loss_rank_avg": 0.35714465379714966, "step": 2215, "valid_targets_mean": 3011.3, "valid_targets_min": 857 }, { "epoch": 3.8811188811188813, "grad_norm": 0.597796061214715, "learning_rate": 1.9712270382571527e-05, "loss": 0.3395, "loss_nan_ranks": 0, "loss_rank_avg": 0.3203423023223877, "step": 2220, "valid_targets_mean": 3129.9, "valid_targets_min": 783 }, { "epoch": 3.88986013986014, "grad_norm": 0.5086711274830522, "learning_rate": 1.9625088615830852e-05, "loss": 0.2971, "loss_nan_ranks": 0, "loss_rank_avg": 0.30308815836906433, "step": 2225, "valid_targets_mean": 4242.3, "valid_targets_min": 870 }, { "epoch": 3.8986013986013988, "grad_norm": 0.5822116633636045, "learning_rate": 1.9537913974981093e-05, "loss": 0.3211, "loss_nan_ranks": 0, "loss_rank_avg": 0.33314594626426697, "step": 2230, "valid_targets_mean": 3820.7, "valid_targets_min": 2027 }, { "epoch": 3.9073426573426575, "grad_norm": 0.5836236703850111, "learning_rate": 1.9450748116939076e-05, "loss": 0.303, "loss_nan_ranks": 0, "loss_rank_avg": 0.3218787610530853, "step": 2235, "valid_targets_mean": 3663.4, "valid_targets_min": 902 }, { "epoch": 3.916083916083916, "grad_norm": 0.5924349660287784, "learning_rate": 1.936359269845471e-05, "loss": 0.295, "loss_nan_ranks": 0, "loss_rank_avg": 0.291001558303833, "step": 2240, "valid_targets_mean": 2916.3, "valid_targets_min": 836 }, { "epoch": 3.924825174825175, "grad_norm": 0.5459663099084542, "learning_rate": 1.927644937607944e-05, "loss": 0.3512, "loss_nan_ranks": 0, "loss_rank_avg": 0.33792153000831604, "step": 2245, "valid_targets_mean": 4093.5, "valid_targets_min": 1395 }, { "epoch": 3.9335664335664333, "grad_norm": 0.5193027045932389, "learning_rate": 1.9189319806134847e-05, "loss": 0.3393, "loss_nan_ranks": 0, "loss_rank_avg": 0.28675055503845215, "step": 2250, "valid_targets_mean": 3711.7, "valid_targets_min": 1220 }, { "epoch": 3.9423076923076925, "grad_norm": 0.5883356076136136, "learning_rate": 1.91022056446811e-05, "loss": 0.3205, "loss_nan_ranks": 0, "loss_rank_avg": 0.3391038179397583, "step": 2255, "valid_targets_mean": 3419.8, "valid_targets_min": 840 }, { "epoch": 3.951048951048951, "grad_norm": 0.5586868273562965, "learning_rate": 1.9015108547485494e-05, "loss": 0.3069, "loss_nan_ranks": 0, "loss_rank_avg": 0.262579083442688, "step": 2260, "valid_targets_mean": 3207.1, "valid_targets_min": 919 }, { "epoch": 3.95979020979021, "grad_norm": 0.5554339434479842, "learning_rate": 1.8928030169991006e-05, "loss": 0.3223, "loss_nan_ranks": 0, "loss_rank_avg": 0.24667473137378693, "step": 2265, "valid_targets_mean": 3612.5, "valid_targets_min": 1378 }, { "epoch": 3.9685314685314683, "grad_norm": 0.505303802479737, "learning_rate": 1.8840972167284797e-05, "loss": 0.3254, "loss_nan_ranks": 0, "loss_rank_avg": 0.35376450419425964, "step": 2270, "valid_targets_mean": 5061.0, "valid_targets_min": 1318 }, { "epoch": 3.9772727272727275, "grad_norm": 0.5448435256913293, "learning_rate": 1.8753936194066756e-05, "loss": 0.2858, "loss_nan_ranks": 0, "loss_rank_avg": 0.31435316801071167, "step": 2275, "valid_targets_mean": 3888.8, "valid_targets_min": 904 }, { "epoch": 3.986013986013986, "grad_norm": 0.5264911091118978, "learning_rate": 1.8666923904618098e-05, "loss": 0.3012, "loss_nan_ranks": 0, "loss_rank_avg": 0.27534744143486023, "step": 2280, "valid_targets_mean": 3623.6, "valid_targets_min": 1612 }, { "epoch": 3.994755244755245, "grad_norm": 0.7118360207165516, "learning_rate": 1.8579936952769842e-05, "loss": 0.3431, "loss_nan_ranks": 0, "loss_rank_avg": 0.30096369981765747, "step": 2285, "valid_targets_mean": 3708.7, "valid_targets_min": 1137 }, { "epoch": 4.003496503496503, "grad_norm": 0.5351169874979324, "learning_rate": 1.8492976991871432e-05, "loss": 0.2969, "loss_nan_ranks": 0, "loss_rank_avg": 0.2072516679763794, "step": 2290, "valid_targets_mean": 2993.5, "valid_targets_min": 1274 }, { "epoch": 4.0122377622377625, "grad_norm": 0.47553857464505833, "learning_rate": 1.840604567475932e-05, "loss": 0.2913, "loss_nan_ranks": 0, "loss_rank_avg": 0.2974964380264282, "step": 2295, "valid_targets_mean": 5104.4, "valid_targets_min": 310 }, { "epoch": 4.020979020979021, "grad_norm": 0.4899707307146761, "learning_rate": 1.8319144653725496e-05, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.23744121193885803, "step": 2300, "valid_targets_mean": 4422.4, "valid_targets_min": 1360 }, { "epoch": 4.02972027972028, "grad_norm": 0.6081271010604331, "learning_rate": 1.8232275580486132e-05, "loss": 0.2903, "loss_nan_ranks": 0, "loss_rank_avg": 0.2675149440765381, "step": 2305, "valid_targets_mean": 3177.8, "valid_targets_min": 758 }, { "epoch": 4.038461538461538, "grad_norm": 0.5181437168972942, "learning_rate": 1.8145440106150193e-05, "loss": 0.307, "loss_nan_ranks": 0, "loss_rank_avg": 0.31278491020202637, "step": 2310, "valid_targets_mean": 5048.5, "valid_targets_min": 1347 }, { "epoch": 4.0472027972027975, "grad_norm": 0.6091159221103379, "learning_rate": 1.8058639881188e-05, "loss": 0.2788, "loss_nan_ranks": 0, "loss_rank_avg": 0.32723408937454224, "step": 2315, "valid_targets_mean": 3590.0, "valid_targets_min": 1321 }, { "epoch": 4.055944055944056, "grad_norm": 0.5773222384218777, "learning_rate": 1.7971876555399897e-05, "loss": 0.2736, "loss_nan_ranks": 0, "loss_rank_avg": 0.3435593247413635, "step": 2320, "valid_targets_mean": 3994.2, "valid_targets_min": 1003 }, { "epoch": 4.064685314685315, "grad_norm": 0.5617194273901538, "learning_rate": 1.7885151777884923e-05, "loss": 0.2886, "loss_nan_ranks": 0, "loss_rank_avg": 0.3240012526512146, "step": 2325, "valid_targets_mean": 4003.6, "valid_targets_min": 1523 }, { "epoch": 4.073426573426573, "grad_norm": 0.5511985618275491, "learning_rate": 1.77984671970094e-05, "loss": 0.2761, "loss_nan_ranks": 0, "loss_rank_avg": 0.29591992497444153, "step": 2330, "valid_targets_mean": 5243.3, "valid_targets_min": 1455 }, { "epoch": 4.0821678321678325, "grad_norm": 0.593007324714538, "learning_rate": 1.7711824460375652e-05, "loss": 0.3108, "loss_nan_ranks": 0, "loss_rank_avg": 0.34284406900405884, "step": 2335, "valid_targets_mean": 3934.2, "valid_targets_min": 1201 }, { "epoch": 4.090909090909091, "grad_norm": 0.4665478716876811, "learning_rate": 1.7625225214790676e-05, "loss": 0.319, "loss_nan_ranks": 0, "loss_rank_avg": 0.3358380198478699, "step": 2340, "valid_targets_mean": 6468.1, "valid_targets_min": 1338 }, { "epoch": 4.09965034965035, "grad_norm": 0.6081324344603725, "learning_rate": 1.7538671106234844e-05, "loss": 0.2765, "loss_nan_ranks": 0, "loss_rank_avg": 0.22779546678066254, "step": 2345, "valid_targets_mean": 2993.1, "valid_targets_min": 1087 }, { "epoch": 4.108391608391608, "grad_norm": 0.5694494355739524, "learning_rate": 1.7452163779830594e-05, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.27797362208366394, "step": 2350, "valid_targets_mean": 3926.6, "valid_targets_min": 1238 }, { "epoch": 4.1171328671328675, "grad_norm": 0.692642453035784, "learning_rate": 1.7365704879811218e-05, "loss": 0.2881, "loss_nan_ranks": 0, "loss_rank_avg": 0.29587244987487793, "step": 2355, "valid_targets_mean": 3438.6, "valid_targets_min": 894 }, { "epoch": 4.125874125874126, "grad_norm": 0.5884637093456763, "learning_rate": 1.7279296049489534e-05, "loss": 0.287, "loss_nan_ranks": 0, "loss_rank_avg": 0.29776161909103394, "step": 2360, "valid_targets_mean": 3834.5, "valid_targets_min": 1711 }, { "epoch": 4.134615384615385, "grad_norm": 0.8095854580575237, "learning_rate": 1.7192938931226718e-05, "loss": 0.3166, "loss_nan_ranks": 0, "loss_rank_avg": 0.3704269826412201, "step": 2365, "valid_targets_mean": 4851.2, "valid_targets_min": 1429 }, { "epoch": 4.143356643356643, "grad_norm": 0.6470687556702546, "learning_rate": 1.7106635166401055e-05, "loss": 0.3019, "loss_nan_ranks": 0, "loss_rank_avg": 0.22572281956672668, "step": 2370, "valid_targets_mean": 2469.3, "valid_targets_min": 812 }, { "epoch": 4.1520979020979025, "grad_norm": 0.5299244250517481, "learning_rate": 1.7020386395376754e-05, "loss": 0.2931, "loss_nan_ranks": 0, "loss_rank_avg": 0.3037104904651642, "step": 2375, "valid_targets_mean": 4737.6, "valid_targets_min": 1518 }, { "epoch": 4.160839160839161, "grad_norm": 0.5734004469644143, "learning_rate": 1.6934194257472742e-05, "loss": 0.2802, "loss_nan_ranks": 0, "loss_rank_avg": 0.3412582576274872, "step": 2380, "valid_targets_mean": 4164.4, "valid_targets_min": 904 }, { "epoch": 4.16958041958042, "grad_norm": 0.522302186747358, "learning_rate": 1.6848060390931563e-05, "loss": 0.2963, "loss_nan_ranks": 0, "loss_rank_avg": 0.31243306398391724, "step": 2385, "valid_targets_mean": 5573.2, "valid_targets_min": 1552 }, { "epoch": 4.178321678321678, "grad_norm": 0.6004156669696765, "learning_rate": 1.6761986432888176e-05, "loss": 0.2997, "loss_nan_ranks": 0, "loss_rank_avg": 0.2502054274082184, "step": 2390, "valid_targets_mean": 3042.6, "valid_targets_min": 765 }, { "epoch": 4.187062937062937, "grad_norm": 0.5233158597298586, "learning_rate": 1.667597401933887e-05, "loss": 0.2746, "loss_nan_ranks": 0, "loss_rank_avg": 0.28923219442367554, "step": 2395, "valid_targets_mean": 4870.8, "valid_targets_min": 1237 }, { "epoch": 4.195804195804196, "grad_norm": 0.5483627771622933, "learning_rate": 1.6590024785110185e-05, "loss": 0.3103, "loss_nan_ranks": 0, "loss_rank_avg": 0.3161337971687317, "step": 2400, "valid_targets_mean": 5001.0, "valid_targets_min": 941 }, { "epoch": 4.204545454545454, "grad_norm": 0.5871866958014593, "learning_rate": 1.6504140363827806e-05, "loss": 0.302, "loss_nan_ranks": 0, "loss_rank_avg": 0.3478851020336151, "step": 2405, "valid_targets_mean": 3951.9, "valid_targets_min": 882 }, { "epoch": 4.213286713286713, "grad_norm": 0.6006732063938374, "learning_rate": 1.6418322387885516e-05, "loss": 0.3246, "loss_nan_ranks": 0, "loss_rank_avg": 0.29331815242767334, "step": 2410, "valid_targets_mean": 3227.8, "valid_targets_min": 1113 }, { "epoch": 4.222027972027972, "grad_norm": 0.5349202137195906, "learning_rate": 1.6332572488414217e-05, "loss": 0.3081, "loss_nan_ranks": 0, "loss_rank_avg": 0.34923678636550903, "step": 2415, "valid_targets_mean": 4982.9, "valid_targets_min": 852 }, { "epoch": 4.230769230769231, "grad_norm": 0.5312131062229603, "learning_rate": 1.624689229525085e-05, "loss": 0.3054, "loss_nan_ranks": 0, "loss_rank_avg": 0.3073064088821411, "step": 2420, "valid_targets_mean": 4661.3, "valid_targets_min": 1189 }, { "epoch": 4.239510489510489, "grad_norm": 0.5799290945851939, "learning_rate": 1.6161283436907466e-05, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.3483518362045288, "step": 2425, "valid_targets_mean": 4749.2, "valid_targets_min": 1558 }, { "epoch": 4.248251748251748, "grad_norm": 0.5006339545460906, "learning_rate": 1.6075747540540297e-05, "loss": 0.3054, "loss_nan_ranks": 0, "loss_rank_avg": 0.2663540840148926, "step": 2430, "valid_targets_mean": 4513.2, "valid_targets_min": 1177 }, { "epoch": 4.256993006993007, "grad_norm": 0.542580678933771, "learning_rate": 1.599028623191875e-05, "loss": 0.2768, "loss_nan_ranks": 0, "loss_rank_avg": 0.274956613779068, "step": 2435, "valid_targets_mean": 4109.2, "valid_targets_min": 1575 }, { "epoch": 4.265734265734266, "grad_norm": 0.5326860859143445, "learning_rate": 1.5904901135394585e-05, "loss": 0.2689, "loss_nan_ranks": 0, "loss_rank_avg": 0.2595234215259552, "step": 2440, "valid_targets_mean": 3658.4, "valid_targets_min": 703 }, { "epoch": 4.274475524475524, "grad_norm": 0.5394753907754853, "learning_rate": 1.5819593873871e-05, "loss": 0.3204, "loss_nan_ranks": 0, "loss_rank_avg": 0.2550932466983795, "step": 2445, "valid_targets_mean": 3616.3, "valid_targets_min": 1453 }, { "epoch": 4.283216783216783, "grad_norm": 0.5560535542529935, "learning_rate": 1.5734366068771784e-05, "loss": 0.2792, "loss_nan_ranks": 0, "loss_rank_avg": 0.27691853046417236, "step": 2450, "valid_targets_mean": 4063.1, "valid_targets_min": 1196 }, { "epoch": 4.291958041958042, "grad_norm": 0.6200097958741395, "learning_rate": 1.5649219340010526e-05, "loss": 0.3189, "loss_nan_ranks": 0, "loss_rank_avg": 0.326045423746109, "step": 2455, "valid_targets_mean": 3681.8, "valid_targets_min": 1163 }, { "epoch": 4.300699300699301, "grad_norm": 0.5628210227789493, "learning_rate": 1.5564155305959796e-05, "loss": 0.2985, "loss_nan_ranks": 0, "loss_rank_avg": 0.31680306792259216, "step": 2460, "valid_targets_mean": 3843.2, "valid_targets_min": 878 }, { "epoch": 4.309440559440559, "grad_norm": 0.5604933048616457, "learning_rate": 1.547917558342039e-05, "loss": 0.3369, "loss_nan_ranks": 0, "loss_rank_avg": 0.32571083307266235, "step": 2465, "valid_targets_mean": 4244.7, "valid_targets_min": 1078 }, { "epoch": 4.318181818181818, "grad_norm": 0.5778075405917112, "learning_rate": 1.5394281787590625e-05, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.2553318440914154, "step": 2470, "valid_targets_mean": 3426.7, "valid_targets_min": 1366 }, { "epoch": 4.326923076923077, "grad_norm": 0.5995882800981643, "learning_rate": 1.5309475532035602e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.3515400290489197, "step": 2475, "valid_targets_mean": 4027.1, "valid_targets_min": 986 }, { "epoch": 4.335664335664336, "grad_norm": 0.521959423096504, "learning_rate": 1.5224758428656565e-05, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.2591817378997803, "step": 2480, "valid_targets_mean": 4302.8, "valid_targets_min": 1045 }, { "epoch": 4.344405594405594, "grad_norm": 0.6208431532511489, "learning_rate": 1.5140132087660267e-05, "loss": 0.3251, "loss_nan_ranks": 0, "loss_rank_avg": 0.2892325520515442, "step": 2485, "valid_targets_mean": 3343.4, "valid_targets_min": 824 }, { "epoch": 4.353146853146853, "grad_norm": 0.6314479692815503, "learning_rate": 1.5055598117528327e-05, "loss": 0.293, "loss_nan_ranks": 0, "loss_rank_avg": 0.34228602051734924, "step": 2490, "valid_targets_mean": 4748.9, "valid_targets_min": 1244 }, { "epoch": 4.361888111888112, "grad_norm": 0.6147592728755509, "learning_rate": 1.497115812498669e-05, "loss": 0.3161, "loss_nan_ranks": 0, "loss_rank_avg": 0.26770299673080444, "step": 2495, "valid_targets_mean": 3033.6, "valid_targets_min": 1366 }, { "epoch": 4.370629370629371, "grad_norm": 0.6046397551554065, "learning_rate": 1.4886813714975098e-05, "loss": 0.2505, "loss_nan_ranks": 0, "loss_rank_avg": 0.2695387601852417, "step": 2500, "valid_targets_mean": 3264.9, "valid_targets_min": 1345 }, { "epoch": 4.379370629370629, "grad_norm": 0.500859303620456, "learning_rate": 1.480256649061655e-05, "loss": 0.3122, "loss_nan_ranks": 0, "loss_rank_avg": 0.3223142623901367, "step": 2505, "valid_targets_mean": 5378.9, "valid_targets_min": 1083 }, { "epoch": 4.388111888111888, "grad_norm": 0.6865694931163415, "learning_rate": 1.4718418053186854e-05, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.24780099093914032, "step": 2510, "valid_targets_mean": 2477.6, "valid_targets_min": 816 }, { "epoch": 4.396853146853147, "grad_norm": 0.5867839077278701, "learning_rate": 1.4634370002084205e-05, "loss": 0.2746, "loss_nan_ranks": 0, "loss_rank_avg": 0.31326526403427124, "step": 2515, "valid_targets_mean": 3771.1, "valid_targets_min": 838 }, { "epoch": 4.405594405594406, "grad_norm": 0.5978502595499985, "learning_rate": 1.4550423934798747e-05, "loss": 0.2771, "loss_nan_ranks": 0, "loss_rank_avg": 0.27199578285217285, "step": 2520, "valid_targets_mean": 3424.1, "valid_targets_min": 1490 }, { "epoch": 4.414335664335664, "grad_norm": 0.5735035291809039, "learning_rate": 1.4466581446882231e-05, "loss": 0.2983, "loss_nan_ranks": 0, "loss_rank_avg": 0.34619852900505066, "step": 2525, "valid_targets_mean": 4088.4, "valid_targets_min": 1412 }, { "epoch": 4.423076923076923, "grad_norm": 0.5692035115010636, "learning_rate": 1.438284413191771e-05, "loss": 0.2816, "loss_nan_ranks": 0, "loss_rank_avg": 0.2908937633037567, "step": 2530, "valid_targets_mean": 3680.6, "valid_targets_min": 835 }, { "epoch": 4.431818181818182, "grad_norm": 0.6108968071141647, "learning_rate": 1.4299213581489203e-05, "loss": 0.3469, "loss_nan_ranks": 0, "loss_rank_avg": 0.333668977022171, "step": 2535, "valid_targets_mean": 3268.6, "valid_targets_min": 389 }, { "epoch": 4.440559440559441, "grad_norm": 0.6778129262816379, "learning_rate": 1.421569138515149e-05, "loss": 0.2812, "loss_nan_ranks": 0, "loss_rank_avg": 0.2540547549724579, "step": 2540, "valid_targets_mean": 2597.3, "valid_targets_min": 1052 }, { "epoch": 4.449300699300699, "grad_norm": 0.4807213661570069, "learning_rate": 1.4132279130399866e-05, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.19758757948875427, "step": 2545, "valid_targets_mean": 3986.0, "valid_targets_min": 851 }, { "epoch": 4.458041958041958, "grad_norm": 0.6287083054789264, "learning_rate": 1.4048978402639995e-05, "loss": 0.2608, "loss_nan_ranks": 0, "loss_rank_avg": 0.2614743709564209, "step": 2550, "valid_targets_mean": 2846.9, "valid_targets_min": 396 }, { "epoch": 4.466783216783217, "grad_norm": 0.5079659942405071, "learning_rate": 1.3965790785157733e-05, "loss": 0.304, "loss_nan_ranks": 0, "loss_rank_avg": 0.2736564874649048, "step": 2555, "valid_targets_mean": 4273.1, "valid_targets_min": 1275 }, { "epoch": 4.475524475524476, "grad_norm": 0.623480452513458, "learning_rate": 1.388271785908911e-05, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.2957373559474945, "step": 2560, "valid_targets_mean": 3718.1, "valid_targets_min": 923 }, { "epoch": 4.484265734265734, "grad_norm": 0.6577985176467535, "learning_rate": 1.379976120339019e-05, "loss": 0.3132, "loss_nan_ranks": 0, "loss_rank_avg": 0.270229697227478, "step": 2565, "valid_targets_mean": 2898.3, "valid_targets_min": 969 }, { "epoch": 4.493006993006993, "grad_norm": 0.5465264693819658, "learning_rate": 1.3716922394807108e-05, "loss": 0.3135, "loss_nan_ranks": 0, "loss_rank_avg": 0.323173463344574, "step": 2570, "valid_targets_mean": 4383.8, "valid_targets_min": 1359 }, { "epoch": 4.501748251748252, "grad_norm": 0.5661164401178533, "learning_rate": 1.3634203007846123e-05, "loss": 0.3073, "loss_nan_ranks": 0, "loss_rank_avg": 0.3571394085884094, "step": 2575, "valid_targets_mean": 4352.5, "valid_targets_min": 1213 }, { "epoch": 4.510489510489511, "grad_norm": 0.6173442841080252, "learning_rate": 1.3551604614743638e-05, "loss": 0.2779, "loss_nan_ranks": 0, "loss_rank_avg": 0.2723095417022705, "step": 2580, "valid_targets_mean": 3077.6, "valid_targets_min": 1212 }, { "epoch": 4.519230769230769, "grad_norm": 0.5285171225530177, "learning_rate": 1.3469128785436336e-05, "loss": 0.3152, "loss_nan_ranks": 0, "loss_rank_avg": 0.39151817560195923, "step": 2585, "valid_targets_mean": 5290.2, "valid_targets_min": 1008 }, { "epoch": 4.527972027972028, "grad_norm": 0.6424931675333562, "learning_rate": 1.3386777087531378e-05, "loss": 0.2614, "loss_nan_ranks": 0, "loss_rank_avg": 0.2340153455734253, "step": 2590, "valid_targets_mean": 3059.4, "valid_targets_min": 787 }, { "epoch": 4.536713286713287, "grad_norm": 0.5536096774127396, "learning_rate": 1.3304551086276542e-05, "loss": 0.3235, "loss_nan_ranks": 0, "loss_rank_avg": 0.360897421836853, "step": 2595, "valid_targets_mean": 4667.6, "valid_targets_min": 904 }, { "epoch": 4.545454545454545, "grad_norm": 0.5522304667699259, "learning_rate": 1.3222452344530514e-05, "loss": 0.309, "loss_nan_ranks": 0, "loss_rank_avg": 0.3527144193649292, "step": 2600, "valid_targets_mean": 5043.0, "valid_targets_min": 769 }, { "epoch": 4.554195804195804, "grad_norm": 0.5930207853002226, "learning_rate": 1.3140482422733198e-05, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.21184858679771423, "step": 2605, "valid_targets_mean": 2679.9, "valid_targets_min": 360 }, { "epoch": 4.562937062937063, "grad_norm": 0.4523824968127589, "learning_rate": 1.3058642878876005e-05, "loss": 0.305, "loss_nan_ranks": 0, "loss_rank_avg": 0.400458425283432, "step": 2610, "valid_targets_mean": 6793.4, "valid_targets_min": 794 }, { "epoch": 4.571678321678322, "grad_norm": 0.6660598737030216, "learning_rate": 1.2976935268472282e-05, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.31761932373046875, "step": 2615, "valid_targets_mean": 2962.8, "valid_targets_min": 788 }, { "epoch": 4.58041958041958, "grad_norm": 0.570251827846613, "learning_rate": 1.289536114452775e-05, "loss": 0.3376, "loss_nan_ranks": 0, "loss_rank_avg": 0.3196180462837219, "step": 2620, "valid_targets_mean": 4478.8, "valid_targets_min": 1368 }, { "epoch": 4.589160839160839, "grad_norm": 0.7146176161503408, "learning_rate": 1.2813922057510941e-05, "loss": 0.3078, "loss_nan_ranks": 0, "loss_rank_avg": 0.35588014125823975, "step": 2625, "valid_targets_mean": 3962.6, "valid_targets_min": 1574 }, { "epoch": 4.597902097902098, "grad_norm": 0.5910225666256981, "learning_rate": 1.2732619555323771e-05, "loss": 0.2962, "loss_nan_ranks": 0, "loss_rank_avg": 0.3604264259338379, "step": 2630, "valid_targets_mean": 4157.6, "valid_targets_min": 836 }, { "epoch": 4.606643356643357, "grad_norm": 0.5876064972193442, "learning_rate": 1.2651455183272123e-05, "loss": 0.2977, "loss_nan_ranks": 0, "loss_rank_avg": 0.24652817845344543, "step": 2635, "valid_targets_mean": 3293.5, "valid_targets_min": 1311 }, { "epoch": 4.615384615384615, "grad_norm": 0.6316151890865688, "learning_rate": 1.2570430484036428e-05, "loss": 0.2873, "loss_nan_ranks": 0, "loss_rank_avg": 0.3414528965950012, "step": 2640, "valid_targets_mean": 3320.4, "valid_targets_min": 1186 }, { "epoch": 4.624125874125874, "grad_norm": 0.6231043964765773, "learning_rate": 1.2489546997642394e-05, "loss": 0.2988, "loss_nan_ranks": 0, "loss_rank_avg": 0.24330928921699524, "step": 2645, "valid_targets_mean": 3018.8, "valid_targets_min": 1173 }, { "epoch": 4.632867132867133, "grad_norm": 0.5459532756435473, "learning_rate": 1.2408806261431719e-05, "loss": 0.307, "loss_nan_ranks": 0, "loss_rank_avg": 0.2778834402561188, "step": 2650, "valid_targets_mean": 3856.0, "valid_targets_min": 841 }, { "epoch": 4.641608391608392, "grad_norm": 0.5138719298724235, "learning_rate": 1.2328209810032852e-05, "loss": 0.3059, "loss_nan_ranks": 0, "loss_rank_avg": 0.3052661418914795, "step": 2655, "valid_targets_mean": 4457.4, "valid_targets_min": 1094 }, { "epoch": 4.65034965034965, "grad_norm": 0.7468748014300275, "learning_rate": 1.2247759175331843e-05, "loss": 0.3214, "loss_nan_ranks": 0, "loss_rank_avg": 0.2765350639820099, "step": 2660, "valid_targets_mean": 3678.1, "valid_targets_min": 397 }, { "epoch": 4.659090909090909, "grad_norm": 0.568068341055875, "learning_rate": 1.2167455886443244e-05, "loss": 0.32, "loss_nan_ranks": 0, "loss_rank_avg": 0.33724042773246765, "step": 2665, "valid_targets_mean": 4406.8, "valid_targets_min": 274 }, { "epoch": 4.6678321678321675, "grad_norm": 0.5369284700537394, "learning_rate": 1.2087301469680992e-05, "loss": 0.312, "loss_nan_ranks": 0, "loss_rank_avg": 0.3213573098182678, "step": 2670, "valid_targets_mean": 5050.0, "valid_targets_min": 721 }, { "epoch": 4.676573426573427, "grad_norm": 0.5418193994362802, "learning_rate": 1.2007297448529451e-05, "loss": 0.3102, "loss_nan_ranks": 0, "loss_rank_avg": 0.35388627648353577, "step": 2675, "valid_targets_mean": 4565.1, "valid_targets_min": 315 }, { "epoch": 4.685314685314685, "grad_norm": 0.5017207500392754, "learning_rate": 1.1927445343614436e-05, "loss": 0.2663, "loss_nan_ranks": 0, "loss_rank_avg": 0.27704697847366333, "step": 2680, "valid_targets_mean": 4477.9, "valid_targets_min": 1565 }, { "epoch": 4.694055944055944, "grad_norm": 0.5363032891756204, "learning_rate": 1.1847746672674308e-05, "loss": 0.2716, "loss_nan_ranks": 0, "loss_rank_avg": 0.24790403246879578, "step": 2685, "valid_targets_mean": 3882.2, "valid_targets_min": 984 }, { "epoch": 4.7027972027972025, "grad_norm": 0.5760992816533218, "learning_rate": 1.1768202950531116e-05, "loss": 0.2885, "loss_nan_ranks": 0, "loss_rank_avg": 0.3482862114906311, "step": 2690, "valid_targets_mean": 3853.1, "valid_targets_min": 866 }, { "epoch": 4.711538461538462, "grad_norm": 0.5278073637246373, "learning_rate": 1.1688815689061845e-05, "loss": 0.3242, "loss_nan_ranks": 0, "loss_rank_avg": 0.3284091353416443, "step": 2695, "valid_targets_mean": 4456.2, "valid_targets_min": 711 }, { "epoch": 4.72027972027972, "grad_norm": 0.46225936004312645, "learning_rate": 1.160958639716963e-05, "loss": 0.3021, "loss_nan_ranks": 0, "loss_rank_avg": 0.3566405773162842, "step": 2700, "valid_targets_mean": 6233.1, "valid_targets_min": 1931 }, { "epoch": 4.729020979020979, "grad_norm": 0.6393556958936994, "learning_rate": 1.1530516580755094e-05, "loss": 0.2669, "loss_nan_ranks": 0, "loss_rank_avg": 0.23386213183403015, "step": 2705, "valid_targets_mean": 2735.7, "valid_targets_min": 1235 }, { "epoch": 4.7377622377622375, "grad_norm": 0.7313544858772298, "learning_rate": 1.145160774268776e-05, "loss": 0.2866, "loss_nan_ranks": 0, "loss_rank_avg": 0.2925187945365906, "step": 2710, "valid_targets_mean": 3208.3, "valid_targets_min": 760 }, { "epoch": 4.746503496503497, "grad_norm": 0.593415721475349, "learning_rate": 1.1372861382777436e-05, "loss": 0.3431, "loss_nan_ranks": 0, "loss_rank_avg": 0.27762988209724426, "step": 2715, "valid_targets_mean": 3455.1, "valid_targets_min": 894 }, { "epoch": 4.755244755244755, "grad_norm": 0.6896039425675504, "learning_rate": 1.1294278997745717e-05, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.27165350317955017, "step": 2720, "valid_targets_mean": 3064.6, "valid_targets_min": 1453 }, { "epoch": 4.763986013986014, "grad_norm": 0.653532801402401, "learning_rate": 1.1215862081197588e-05, "loss": 0.2444, "loss_nan_ranks": 0, "loss_rank_avg": 0.22621586918830872, "step": 2725, "valid_targets_mean": 2338.2, "valid_targets_min": 659 }, { "epoch": 4.7727272727272725, "grad_norm": 0.5579565197706448, "learning_rate": 1.1137612123592955e-05, "loss": 0.3407, "loss_nan_ranks": 0, "loss_rank_avg": 0.3474411964416504, "step": 2730, "valid_targets_mean": 4759.7, "valid_targets_min": 1250 }, { "epoch": 4.781468531468532, "grad_norm": 0.6008079310769544, "learning_rate": 1.1059530612218384e-05, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.24356213212013245, "step": 2735, "valid_targets_mean": 3257.1, "valid_targets_min": 1154 }, { "epoch": 4.79020979020979, "grad_norm": 0.5625591929943424, "learning_rate": 1.0981619031158805e-05, "loss": 0.3002, "loss_nan_ranks": 0, "loss_rank_avg": 0.25547558069229126, "step": 2740, "valid_targets_mean": 3769.6, "valid_targets_min": 1096 }, { "epoch": 4.798951048951049, "grad_norm": 0.5564650872223581, "learning_rate": 1.0903878861269283e-05, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.39255663752555847, "step": 2745, "valid_targets_mean": 4813.8, "valid_targets_min": 1190 }, { "epoch": 4.8076923076923075, "grad_norm": 0.5465111718947036, "learning_rate": 1.0826311580146926e-05, "loss": 0.2817, "loss_nan_ranks": 0, "loss_rank_avg": 0.31452226638793945, "step": 2750, "valid_targets_mean": 4456.3, "valid_targets_min": 1608 }, { "epoch": 4.816433566433567, "grad_norm": 0.6002285372123841, "learning_rate": 1.0748918662102738e-05, "loss": 0.2903, "loss_nan_ranks": 0, "loss_rank_avg": 0.24080748856067657, "step": 2755, "valid_targets_mean": 2933.1, "valid_targets_min": 776 }, { "epoch": 4.825174825174825, "grad_norm": 0.6031634744630441, "learning_rate": 1.0671701578133638e-05, "loss": 0.3093, "loss_nan_ranks": 0, "loss_rank_avg": 0.2960241734981537, "step": 2760, "valid_targets_mean": 3287.8, "valid_targets_min": 1340 }, { "epoch": 4.833916083916084, "grad_norm": 0.5648244176335662, "learning_rate": 1.0594661795894506e-05, "loss": 0.3288, "loss_nan_ranks": 0, "loss_rank_avg": 0.3948041498661041, "step": 2765, "valid_targets_mean": 4577.2, "valid_targets_min": 400 }, { "epoch": 4.8426573426573425, "grad_norm": 0.5897183525483226, "learning_rate": 1.0517800779670246e-05, "loss": 0.2831, "loss_nan_ranks": 0, "loss_rank_avg": 0.2534165680408478, "step": 2770, "valid_targets_mean": 2986.2, "valid_targets_min": 885 }, { "epoch": 4.851398601398602, "grad_norm": 0.599383167273539, "learning_rate": 1.044111999034799e-05, "loss": 0.2741, "loss_nan_ranks": 0, "loss_rank_avg": 0.31281739473342896, "step": 2775, "valid_targets_mean": 3864.4, "valid_targets_min": 599 }, { "epoch": 4.86013986013986, "grad_norm": 0.621675092661028, "learning_rate": 1.0364620885389332e-05, "loss": 0.2779, "loss_nan_ranks": 0, "loss_rank_avg": 0.2532220780849457, "step": 2780, "valid_targets_mean": 2882.8, "valid_targets_min": 1129 }, { "epoch": 4.868881118881119, "grad_norm": 0.5174219008544854, "learning_rate": 1.0288304918802601e-05, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.3275800347328186, "step": 2785, "valid_targets_mean": 5350.1, "valid_targets_min": 1528 }, { "epoch": 4.8776223776223775, "grad_norm": 0.5564725618436285, "learning_rate": 1.0212173541115238e-05, "loss": 0.3181, "loss_nan_ranks": 0, "loss_rank_avg": 0.3417879641056061, "step": 2790, "valid_targets_mean": 4438.7, "valid_targets_min": 1031 }, { "epoch": 4.886363636363637, "grad_norm": 0.5202279923981036, "learning_rate": 1.013622819934625e-05, "loss": 0.2873, "loss_nan_ranks": 0, "loss_rank_avg": 0.31056395173072815, "step": 2795, "valid_targets_mean": 5017.1, "valid_targets_min": 1366 }, { "epoch": 4.895104895104895, "grad_norm": 0.8272229183082167, "learning_rate": 1.0060470336978647e-05, "loss": 0.2918, "loss_nan_ranks": 0, "loss_rank_avg": 0.2937367260456085, "step": 2800, "valid_targets_mean": 3412.6, "valid_targets_min": 1314 }, { "epoch": 4.903846153846154, "grad_norm": 0.6023369863061019, "learning_rate": 9.984901393932079e-06, "loss": 0.3024, "loss_nan_ranks": 0, "loss_rank_avg": 0.3329635262489319, "step": 2805, "valid_targets_mean": 3690.2, "valid_targets_min": 1103 }, { "epoch": 4.9125874125874125, "grad_norm": 0.5347626155440187, "learning_rate": 9.909522806535419e-06, "loss": 0.3002, "loss_nan_ranks": 0, "loss_rank_avg": 0.34003421664237976, "step": 2810, "valid_targets_mean": 4804.3, "valid_targets_min": 1241 }, { "epoch": 4.921328671328672, "grad_norm": 0.5810834195037871, "learning_rate": 9.834336007499466e-06, "loss": 0.2925, "loss_nan_ranks": 0, "loss_rank_avg": 0.2992189824581146, "step": 2815, "valid_targets_mean": 3655.9, "valid_targets_min": 363 }, { "epoch": 4.93006993006993, "grad_norm": 0.7516655603694848, "learning_rate": 9.759342425889719e-06, "loss": 0.3299, "loss_nan_ranks": 0, "loss_rank_avg": 0.26004546880722046, "step": 2820, "valid_targets_mean": 2960.8, "valid_targets_min": 775 }, { "epoch": 4.938811188811189, "grad_norm": 0.5474762483923421, "learning_rate": 9.684543487099252e-06, "loss": 0.2925, "loss_nan_ranks": 0, "loss_rank_avg": 0.31097865104675293, "step": 2825, "valid_targets_mean": 4025.8, "valid_targets_min": 1372 }, { "epoch": 4.9475524475524475, "grad_norm": 0.603868266770557, "learning_rate": 9.609940612821553e-06, "loss": 0.2902, "loss_nan_ranks": 0, "loss_rank_avg": 0.21819128096103668, "step": 2830, "valid_targets_mean": 2892.9, "valid_targets_min": 843 }, { "epoch": 4.956293706293707, "grad_norm": 0.6179932621413688, "learning_rate": 9.535535221023547e-06, "loss": 0.2902, "loss_nan_ranks": 0, "loss_rank_avg": 0.2900503873825073, "step": 2835, "valid_targets_mean": 3740.0, "valid_targets_min": 1399 }, { "epoch": 4.965034965034965, "grad_norm": 0.5718727937808842, "learning_rate": 9.461328725918652e-06, "loss": 0.3472, "loss_nan_ranks": 0, "loss_rank_avg": 0.32516181468963623, "step": 2840, "valid_targets_mean": 3534.2, "valid_targets_min": 1482 }, { "epoch": 4.973776223776223, "grad_norm": 0.5820685648597708, "learning_rate": 9.387322537939867e-06, "loss": 0.2878, "loss_nan_ranks": 0, "loss_rank_avg": 0.23170748353004456, "step": 2845, "valid_targets_mean": 2971.9, "valid_targets_min": 1151 }, { "epoch": 4.9825174825174825, "grad_norm": 0.6160327533376939, "learning_rate": 9.313518063712977e-06, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.2837224304676056, "step": 2850, "valid_targets_mean": 4007.0, "valid_targets_min": 977 }, { "epoch": 4.991258741258742, "grad_norm": 0.6590612654521167, "learning_rate": 9.239916706029837e-06, "loss": 0.2644, "loss_nan_ranks": 0, "loss_rank_avg": 0.2656211256980896, "step": 2855, "valid_targets_mean": 2824.0, "valid_targets_min": 867 }, { "epoch": 5.0, "grad_norm": 0.487778840287654, "learning_rate": 9.166519863821682e-06, "loss": 0.2977, "loss_nan_ranks": 0, "loss_rank_avg": 0.3223125636577606, "step": 2860, "valid_targets_mean": 5592.4, "valid_targets_min": 1554 }, { "epoch": 5.008741258741258, "grad_norm": 0.5515870319188418, "learning_rate": 9.093328932132536e-06, "loss": 0.3178, "loss_nan_ranks": 0, "loss_rank_avg": 0.29514843225479126, "step": 2865, "valid_targets_mean": 3846.6, "valid_targets_min": 977 }, { "epoch": 5.0174825174825175, "grad_norm": 0.6027515247820308, "learning_rate": 9.02034530209274e-06, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.21801328659057617, "step": 2870, "valid_targets_mean": 3039.9, "valid_targets_min": 868 }, { "epoch": 5.026223776223776, "grad_norm": 0.6604761384788594, "learning_rate": 8.94757036089246e-06, "loss": 0.2915, "loss_nan_ranks": 0, "loss_rank_avg": 0.29287010431289673, "step": 2875, "valid_targets_mean": 3395.0, "valid_targets_min": 703 }, { "epoch": 5.034965034965035, "grad_norm": 0.5186334303195224, "learning_rate": 8.875005491755336e-06, "loss": 0.3228, "loss_nan_ranks": 0, "loss_rank_avg": 0.39983949065208435, "step": 2880, "valid_targets_mean": 5769.5, "valid_targets_min": 780 }, { "epoch": 5.043706293706293, "grad_norm": 0.6726806564828863, "learning_rate": 8.802652073912217e-06, "loss": 0.2941, "loss_nan_ranks": 0, "loss_rank_avg": 0.2766971290111542, "step": 2885, "valid_targets_mean": 2916.9, "valid_targets_min": 1247 }, { "epoch": 5.0524475524475525, "grad_norm": 0.6558280884607233, "learning_rate": 8.730511482574905e-06, "loss": 0.2988, "loss_nan_ranks": 0, "loss_rank_avg": 0.2496262788772583, "step": 2890, "valid_targets_mean": 2870.6, "valid_targets_min": 1260 }, { "epoch": 5.061188811188811, "grad_norm": 0.5997253722708635, "learning_rate": 8.658585088910034e-06, "loss": 0.2845, "loss_nan_ranks": 0, "loss_rank_avg": 0.30124104022979736, "step": 2895, "valid_targets_mean": 4088.7, "valid_targets_min": 771 }, { "epoch": 5.06993006993007, "grad_norm": 0.6511353534883123, "learning_rate": 8.586874260013043e-06, "loss": 0.2655, "loss_nan_ranks": 0, "loss_rank_avg": 0.24419128894805908, "step": 2900, "valid_targets_mean": 3125.4, "valid_targets_min": 882 }, { "epoch": 5.078671328671328, "grad_norm": 0.5500028690151533, "learning_rate": 8.515380358882125e-06, "loss": 0.2648, "loss_nan_ranks": 0, "loss_rank_avg": 0.1970711648464203, "step": 2905, "valid_targets_mean": 3520.8, "valid_targets_min": 844 }, { "epoch": 5.0874125874125875, "grad_norm": 1.1741959939280981, "learning_rate": 8.444104744392368e-06, "loss": 0.29, "loss_nan_ranks": 0, "loss_rank_avg": 0.3086763918399811, "step": 2910, "valid_targets_mean": 3857.3, "valid_targets_min": 1625 }, { "epoch": 5.096153846153846, "grad_norm": 0.6282809967830072, "learning_rate": 8.373048771269925e-06, "loss": 0.2705, "loss_nan_ranks": 0, "loss_rank_avg": 0.32048705220222473, "step": 2915, "valid_targets_mean": 3851.1, "valid_targets_min": 1160 }, { "epoch": 5.104895104895105, "grad_norm": 0.6350201505584189, "learning_rate": 8.30221379006624e-06, "loss": 0.2971, "loss_nan_ranks": 0, "loss_rank_avg": 0.2668588161468506, "step": 2920, "valid_targets_mean": 3230.1, "valid_targets_min": 1067 }, { "epoch": 5.113636363636363, "grad_norm": 0.537977318451259, "learning_rate": 8.231601147132395e-06, "loss": 0.3058, "loss_nan_ranks": 0, "loss_rank_avg": 0.31173622608184814, "step": 2925, "valid_targets_mean": 4844.6, "valid_targets_min": 833 }, { "epoch": 5.1223776223776225, "grad_norm": 0.6525436356749689, "learning_rate": 8.161212184593533e-06, "loss": 0.274, "loss_nan_ranks": 0, "loss_rank_avg": 0.2828228175640106, "step": 2930, "valid_targets_mean": 2888.5, "valid_targets_min": 1244 }, { "epoch": 5.131118881118881, "grad_norm": 0.7670147857668765, "learning_rate": 8.091048240323309e-06, "loss": 0.2898, "loss_nan_ranks": 0, "loss_rank_avg": 0.3218318223953247, "step": 2935, "valid_targets_mean": 4409.9, "valid_targets_min": 783 }, { "epoch": 5.13986013986014, "grad_norm": 0.5832403428104913, "learning_rate": 8.021110647918506e-06, "loss": 0.2927, "loss_nan_ranks": 0, "loss_rank_avg": 0.28175467252731323, "step": 2940, "valid_targets_mean": 4289.4, "valid_targets_min": 1588 }, { "epoch": 5.148601398601398, "grad_norm": 0.5913795547664308, "learning_rate": 7.951400736673666e-06, "loss": 0.2929, "loss_nan_ranks": 0, "loss_rank_avg": 0.2117207646369934, "step": 2945, "valid_targets_mean": 3373.2, "valid_targets_min": 1135 }, { "epoch": 5.1573426573426575, "grad_norm": 0.6195775292187421, "learning_rate": 7.881919831555812e-06, "loss": 0.2425, "loss_nan_ranks": 0, "loss_rank_avg": 0.19947922229766846, "step": 2950, "valid_targets_mean": 2951.7, "valid_targets_min": 1245 }, { "epoch": 5.166083916083916, "grad_norm": 0.5629505536805914, "learning_rate": 7.812669253179284e-06, "loss": 0.2957, "loss_nan_ranks": 0, "loss_rank_avg": 0.2782512903213501, "step": 2955, "valid_targets_mean": 4214.4, "valid_targets_min": 1349 }, { "epoch": 5.174825174825175, "grad_norm": 0.6510672774482675, "learning_rate": 7.74365031778064e-06, "loss": 0.2817, "loss_nan_ranks": 0, "loss_rank_avg": 0.2591198682785034, "step": 2960, "valid_targets_mean": 3180.0, "valid_targets_min": 1215 }, { "epoch": 5.183566433566433, "grad_norm": 0.5026506652919864, "learning_rate": 7.67486433719362e-06, "loss": 0.2555, "loss_nan_ranks": 0, "loss_rank_avg": 0.2523643374443054, "step": 2965, "valid_targets_mean": 4377.1, "valid_targets_min": 1551 }, { "epoch": 5.1923076923076925, "grad_norm": 0.5981654940081627, "learning_rate": 7.606312618824221e-06, "loss": 0.2983, "loss_nan_ranks": 0, "loss_rank_avg": 0.3656559884548187, "step": 2970, "valid_targets_mean": 4603.1, "valid_targets_min": 1128 }, { "epoch": 5.201048951048951, "grad_norm": 5.001470852750849, "learning_rate": 7.53799646562587e-06, "loss": 0.2451, "loss_nan_ranks": 0, "loss_rank_avg": 0.26559704542160034, "step": 2975, "valid_targets_mean": 3457.1, "valid_targets_min": 1008 }, { "epoch": 5.20979020979021, "grad_norm": 0.6154061160480875, "learning_rate": 7.469917176074615e-06, "loss": 0.2797, "loss_nan_ranks": 0, "loss_rank_avg": 0.284348726272583, "step": 2980, "valid_targets_mean": 3541.6, "valid_targets_min": 1072 }, { "epoch": 5.218531468531468, "grad_norm": 0.5767457725736881, "learning_rate": 7.402076044144468e-06, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.288425475358963, "step": 2985, "valid_targets_mean": 3888.5, "valid_targets_min": 754 }, { "epoch": 5.2272727272727275, "grad_norm": 0.9484072946363189, "learning_rate": 7.334474359282835e-06, "loss": 0.3025, "loss_nan_ranks": 0, "loss_rank_avg": 0.2538584768772125, "step": 2990, "valid_targets_mean": 3242.8, "valid_targets_min": 1171 }, { "epoch": 5.236013986013986, "grad_norm": 0.6182933263467078, "learning_rate": 7.267113406385957e-06, "loss": 0.2808, "loss_nan_ranks": 0, "loss_rank_avg": 0.30061790347099304, "step": 2995, "valid_targets_mean": 3523.0, "valid_targets_min": 700 }, { "epoch": 5.244755244755245, "grad_norm": 0.6353976287717851, "learning_rate": 7.199994465774525e-06, "loss": 0.2776, "loss_nan_ranks": 0, "loss_rank_avg": 0.2508491277694702, "step": 3000, "valid_targets_mean": 3439.9, "valid_targets_min": 948 }, { "epoch": 5.253496503496503, "grad_norm": 0.5482075343729362, "learning_rate": 7.133118813169333e-06, "loss": 0.2788, "loss_nan_ranks": 0, "loss_rank_avg": 0.2493390440940857, "step": 3005, "valid_targets_mean": 4017.3, "valid_targets_min": 281 }, { "epoch": 5.2622377622377625, "grad_norm": 0.6796942212521933, "learning_rate": 7.066487719667048e-06, "loss": 0.3051, "loss_nan_ranks": 0, "loss_rank_avg": 0.3333054184913635, "step": 3010, "valid_targets_mean": 3150.6, "valid_targets_min": 1401 }, { "epoch": 5.270979020979021, "grad_norm": 0.5316665562656377, "learning_rate": 7.000102451716002e-06, "loss": 0.254, "loss_nan_ranks": 0, "loss_rank_avg": 0.19675248861312866, "step": 3015, "valid_targets_mean": 4021.2, "valid_targets_min": 1108 }, { "epoch": 5.27972027972028, "grad_norm": 0.601665131189074, "learning_rate": 6.9339642710921865e-06, "loss": 0.249, "loss_nan_ranks": 0, "loss_rank_avg": 0.2753317058086395, "step": 3020, "valid_targets_mean": 3542.6, "valid_targets_min": 878 }, { "epoch": 5.288461538461538, "grad_norm": 0.6016387836746144, "learning_rate": 6.868074434875207e-06, "loss": 0.3308, "loss_nan_ranks": 0, "loss_rank_avg": 0.3341265916824341, "step": 3025, "valid_targets_mean": 4177.6, "valid_targets_min": 1125 }, { "epoch": 5.2972027972027975, "grad_norm": 0.6319032564526934, "learning_rate": 6.802434195424452e-06, "loss": 0.3055, "loss_nan_ranks": 0, "loss_rank_avg": 0.29447418451309204, "step": 3030, "valid_targets_mean": 3719.3, "valid_targets_min": 913 }, { "epoch": 5.305944055944056, "grad_norm": 0.5916637424592456, "learning_rate": 6.73704480035523e-06, "loss": 0.3015, "loss_nan_ranks": 0, "loss_rank_avg": 0.2799910306930542, "step": 3035, "valid_targets_mean": 3499.6, "valid_targets_min": 1323 }, { "epoch": 5.314685314685315, "grad_norm": 0.6561281929032633, "learning_rate": 6.6719074925150885e-06, "loss": 0.2858, "loss_nan_ranks": 0, "loss_rank_avg": 0.22917607426643372, "step": 3040, "valid_targets_mean": 3229.9, "valid_targets_min": 1366 }, { "epoch": 5.323426573426573, "grad_norm": 0.5631601957129813, "learning_rate": 6.607023509960207e-06, "loss": 0.2806, "loss_nan_ranks": 0, "loss_rank_avg": 0.30073410272598267, "step": 3045, "valid_targets_mean": 4102.4, "valid_targets_min": 902 }, { "epoch": 5.3321678321678325, "grad_norm": 0.5939420651573594, "learning_rate": 6.54239408593182e-06, "loss": 0.2826, "loss_nan_ranks": 0, "loss_rank_avg": 0.30191031098365784, "step": 3050, "valid_targets_mean": 4112.1, "valid_targets_min": 1112 }, { "epoch": 5.340909090909091, "grad_norm": 0.62297242809634, "learning_rate": 6.478020448832807e-06, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.26781389117240906, "step": 3055, "valid_targets_mean": 3714.4, "valid_targets_min": 1393 }, { "epoch": 5.34965034965035, "grad_norm": 0.5551628821680462, "learning_rate": 6.41390382220436e-06, "loss": 0.3012, "loss_nan_ranks": 0, "loss_rank_avg": 0.3098997473716736, "step": 3060, "valid_targets_mean": 4681.3, "valid_targets_min": 699 }, { "epoch": 5.358391608391608, "grad_norm": 0.5574581153427564, "learning_rate": 6.350045424702678e-06, "loss": 0.3141, "loss_nan_ranks": 0, "loss_rank_avg": 0.34914591908454895, "step": 3065, "valid_targets_mean": 5659.1, "valid_targets_min": 1391 }, { "epoch": 5.3671328671328675, "grad_norm": 0.5862085004980788, "learning_rate": 6.286446470075844e-06, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.24797584116458893, "step": 3070, "valid_targets_mean": 3695.2, "valid_targets_min": 1317 }, { "epoch": 5.375874125874126, "grad_norm": 0.5191297805074992, "learning_rate": 6.223108167140754e-06, "loss": 0.292, "loss_nan_ranks": 0, "loss_rank_avg": 0.2748684585094452, "step": 3075, "valid_targets_mean": 4941.7, "valid_targets_min": 1381 }, { "epoch": 5.384615384615385, "grad_norm": 0.5045700473089122, "learning_rate": 6.1600317197601315e-06, "loss": 0.3003, "loss_nan_ranks": 0, "loss_rank_avg": 0.3563288748264313, "step": 3080, "valid_targets_mean": 5475.4, "valid_targets_min": 1462 }, { "epoch": 5.393356643356643, "grad_norm": 0.5378903669303158, "learning_rate": 6.0972183268196226e-06, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.2671928405761719, "step": 3085, "valid_targets_mean": 4020.6, "valid_targets_min": 984 }, { "epoch": 5.402097902097902, "grad_norm": 0.5843880944609243, "learning_rate": 6.034669182205069e-06, "loss": 0.2687, "loss_nan_ranks": 0, "loss_rank_avg": 0.27627307176589966, "step": 3090, "valid_targets_mean": 3800.9, "valid_targets_min": 1235 }, { "epoch": 5.410839160839161, "grad_norm": 0.6602300244309561, "learning_rate": 5.972385474779749e-06, "loss": 0.2679, "loss_nan_ranks": 0, "loss_rank_avg": 0.2647150754928589, "step": 3095, "valid_targets_mean": 2855.0, "valid_targets_min": 843 }, { "epoch": 5.41958041958042, "grad_norm": 0.6462995998231272, "learning_rate": 5.910368388361818e-06, "loss": 0.2926, "loss_nan_ranks": 0, "loss_rank_avg": 0.26018214225769043, "step": 3100, "valid_targets_mean": 3224.8, "valid_targets_min": 1357 }, { "epoch": 5.428321678321678, "grad_norm": 0.4891544819132749, "learning_rate": 5.84861910170182e-06, "loss": 0.315, "loss_nan_ranks": 0, "loss_rank_avg": 0.2529061734676361, "step": 3105, "valid_targets_mean": 5225.0, "valid_targets_min": 1269 }, { "epoch": 5.437062937062937, "grad_norm": 0.5575392553853251, "learning_rate": 5.787138788460243e-06, "loss": 0.2638, "loss_nan_ranks": 0, "loss_rank_avg": 0.27974453568458557, "step": 3110, "valid_targets_mean": 4549.4, "valid_targets_min": 1333 }, { "epoch": 5.445804195804196, "grad_norm": 0.9169550213827106, "learning_rate": 5.725928617185232e-06, "loss": 0.3004, "loss_nan_ranks": 0, "loss_rank_avg": 0.36411306262016296, "step": 3115, "valid_targets_mean": 4993.6, "valid_targets_min": 465 }, { "epoch": 5.454545454545454, "grad_norm": 0.6333429716490787, "learning_rate": 5.664989751290404e-06, "loss": 0.2704, "loss_nan_ranks": 0, "loss_rank_avg": 0.2409021258354187, "step": 3120, "valid_targets_mean": 2938.7, "valid_targets_min": 1156 }, { "epoch": 5.463286713286713, "grad_norm": 0.6164781154770047, "learning_rate": 5.604323349032688e-06, "loss": 0.2872, "loss_nan_ranks": 0, "loss_rank_avg": 0.3192230761051178, "step": 3125, "valid_targets_mean": 3691.0, "valid_targets_min": 1022 }, { "epoch": 5.472027972027972, "grad_norm": 0.673990836348822, "learning_rate": 5.543930563490329e-06, "loss": 0.3229, "loss_nan_ranks": 0, "loss_rank_avg": 0.2710210084915161, "step": 3130, "valid_targets_mean": 2789.3, "valid_targets_min": 1063 }, { "epoch": 5.480769230769231, "grad_norm": 0.6255943702870599, "learning_rate": 5.483812542541005e-06, "loss": 0.2877, "loss_nan_ranks": 0, "loss_rank_avg": 0.26079046726226807, "step": 3135, "valid_targets_mean": 4804.1, "valid_targets_min": 1268 }, { "epoch": 5.489510489510489, "grad_norm": 0.6091977606764691, "learning_rate": 5.423970428839944e-06, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.27790728211402893, "step": 3140, "valid_targets_mean": 3833.6, "valid_targets_min": 1655 }, { "epoch": 5.498251748251748, "grad_norm": 0.6667888999428736, "learning_rate": 5.364405359798273e-06, "loss": 0.2559, "loss_nan_ranks": 0, "loss_rank_avg": 0.25091731548309326, "step": 3145, "valid_targets_mean": 2849.9, "valid_targets_min": 1083 }, { "epoch": 5.506993006993007, "grad_norm": 0.7128463727312214, "learning_rate": 5.305118467561337e-06, "loss": 0.2655, "loss_nan_ranks": 0, "loss_rank_avg": 0.24288232624530792, "step": 3150, "valid_targets_mean": 2881.0, "valid_targets_min": 841 }, { "epoch": 5.515734265734266, "grad_norm": 0.5707716004157022, "learning_rate": 5.246110878987243e-06, "loss": 0.2725, "loss_nan_ranks": 0, "loss_rank_avg": 0.26704850792884827, "step": 3155, "valid_targets_mean": 4202.4, "valid_targets_min": 1416 }, { "epoch": 5.524475524475524, "grad_norm": 0.5654249158794692, "learning_rate": 5.187383715625382e-06, "loss": 0.2795, "loss_nan_ranks": 0, "loss_rank_avg": 0.24396446347236633, "step": 3160, "valid_targets_mean": 3794.2, "valid_targets_min": 970 }, { "epoch": 5.533216783216783, "grad_norm": 0.5007607833940395, "learning_rate": 5.128938093695166e-06, "loss": 0.2723, "loss_nan_ranks": 0, "loss_rank_avg": 0.3158084750175476, "step": 3165, "valid_targets_mean": 5185.2, "valid_targets_min": 1196 }, { "epoch": 5.541958041958042, "grad_norm": 0.6987253561806125, "learning_rate": 5.0707751240647665e-06, "loss": 0.2632, "loss_nan_ranks": 0, "loss_rank_avg": 0.2553308308124542, "step": 3170, "valid_targets_mean": 2831.2, "valid_targets_min": 1078 }, { "epoch": 5.550699300699301, "grad_norm": 0.6693739024014761, "learning_rate": 5.012895912230021e-06, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.2554604411125183, "step": 3175, "valid_targets_mean": 3050.4, "valid_targets_min": 437 }, { "epoch": 5.559440559440559, "grad_norm": 0.5729662992883009, "learning_rate": 4.955301558293439e-06, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.237440288066864, "step": 3180, "valid_targets_mean": 3831.5, "valid_targets_min": 1266 }, { "epoch": 5.568181818181818, "grad_norm": 0.6086761990951153, "learning_rate": 4.897993156943257e-06, "loss": 0.2772, "loss_nan_ranks": 0, "loss_rank_avg": 0.26315420866012573, "step": 3185, "valid_targets_mean": 3630.5, "valid_targets_min": 1483 }, { "epoch": 5.576923076923077, "grad_norm": 0.6680147625247186, "learning_rate": 4.840971797432643e-06, "loss": 0.2636, "loss_nan_ranks": 0, "loss_rank_avg": 0.2638908922672272, "step": 3190, "valid_targets_mean": 3079.1, "valid_targets_min": 769 }, { "epoch": 5.585664335664336, "grad_norm": 0.6033920894084822, "learning_rate": 4.784238563559025e-06, "loss": 0.2754, "loss_nan_ranks": 0, "loss_rank_avg": 0.3316216468811035, "step": 3195, "valid_targets_mean": 4097.1, "valid_targets_min": 1321 }, { "epoch": 5.594405594405594, "grad_norm": 0.6247334828081322, "learning_rate": 4.727794533643442e-06, "loss": 0.2731, "loss_nan_ranks": 0, "loss_rank_avg": 0.2612161636352539, "step": 3200, "valid_targets_mean": 3408.8, "valid_targets_min": 805 }, { "epoch": 5.603146853146853, "grad_norm": 0.5988968477062824, "learning_rate": 4.671640780510069e-06, "loss": 0.2707, "loss_nan_ranks": 0, "loss_rank_avg": 0.2181917130947113, "step": 3205, "valid_targets_mean": 2906.1, "valid_targets_min": 1078 }, { "epoch": 5.611888111888112, "grad_norm": 0.46415277622783324, "learning_rate": 4.615778371465856e-06, "loss": 0.2921, "loss_nan_ranks": 0, "loss_rank_avg": 0.3689541816711426, "step": 3210, "valid_targets_mean": 6330.0, "valid_targets_min": 402 }, { "epoch": 5.620629370629371, "grad_norm": 0.5613877412055053, "learning_rate": 4.560208368280183e-06, "loss": 0.3161, "loss_nan_ranks": 0, "loss_rank_avg": 0.3414204716682434, "step": 3215, "valid_targets_mean": 4572.8, "valid_targets_min": 1159 }, { "epoch": 5.629370629370629, "grad_norm": 0.5560487965185203, "learning_rate": 4.5049318271647295e-06, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.2097901999950409, "step": 3220, "valid_targets_mean": 3893.2, "valid_targets_min": 915 }, { "epoch": 5.638111888111888, "grad_norm": 0.7296638177669432, "learning_rate": 4.4499497987533816e-06, "loss": 0.3103, "loss_nan_ranks": 0, "loss_rank_avg": 0.229948490858078, "step": 3225, "valid_targets_mean": 2531.2, "valid_targets_min": 807 }, { "epoch": 5.646853146853147, "grad_norm": 0.6166550888524173, "learning_rate": 4.395263328082251e-06, "loss": 0.2568, "loss_nan_ranks": 0, "loss_rank_avg": 0.29370614886283875, "step": 3230, "valid_targets_mean": 3795.5, "valid_targets_min": 917 }, { "epoch": 5.655594405594406, "grad_norm": 0.5808842651980372, "learning_rate": 4.340873454569821e-06, "loss": 0.2863, "loss_nan_ranks": 0, "loss_rank_avg": 0.3381272554397583, "step": 3235, "valid_targets_mean": 4567.4, "valid_targets_min": 1063 }, { "epoch": 5.664335664335664, "grad_norm": 0.548523750131149, "learning_rate": 4.286781211997208e-06, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.2726270854473114, "step": 3240, "valid_targets_mean": 4212.8, "valid_targets_min": 1200 }, { "epoch": 5.673076923076923, "grad_norm": 0.6767114674832129, "learning_rate": 4.232987628488483e-06, "loss": 0.269, "loss_nan_ranks": 0, "loss_rank_avg": 0.20798838138580322, "step": 3245, "valid_targets_mean": 2656.3, "valid_targets_min": 1177 }, { "epoch": 5.681818181818182, "grad_norm": 0.6061394916537475, "learning_rate": 4.179493726491144e-06, "loss": 0.297, "loss_nan_ranks": 0, "loss_rank_avg": 0.28469932079315186, "step": 3250, "valid_targets_mean": 3790.7, "valid_targets_min": 1247 }, { "epoch": 5.690559440559441, "grad_norm": 0.5514714164196605, "learning_rate": 4.126300522756692e-06, "loss": 0.2945, "loss_nan_ranks": 0, "loss_rank_avg": 0.2420085370540619, "step": 3255, "valid_targets_mean": 4023.1, "valid_targets_min": 1003 }, { "epoch": 5.699300699300699, "grad_norm": 0.7165447495050303, "learning_rate": 4.073409028321289e-06, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.2511775493621826, "step": 3260, "valid_targets_mean": 2425.6, "valid_targets_min": 836 }, { "epoch": 5.708041958041958, "grad_norm": 0.5309431458422739, "learning_rate": 4.020820248486544e-06, "loss": 0.2863, "loss_nan_ranks": 0, "loss_rank_avg": 0.312569260597229, "step": 3265, "valid_targets_mean": 4707.6, "valid_targets_min": 1005 }, { "epoch": 5.716783216783217, "grad_norm": 0.6205803951689329, "learning_rate": 3.968535182800423e-06, "loss": 0.3001, "loss_nan_ranks": 0, "loss_rank_avg": 0.283012330532074, "step": 3270, "valid_targets_mean": 3780.8, "valid_targets_min": 840 }, { "epoch": 5.725524475524476, "grad_norm": 0.5702696584364179, "learning_rate": 3.916554825038221e-06, "loss": 0.2865, "loss_nan_ranks": 0, "loss_rank_avg": 0.29808011651039124, "step": 3275, "valid_targets_mean": 3887.8, "valid_targets_min": 1299 }, { "epoch": 5.734265734265734, "grad_norm": 0.6299800822954458, "learning_rate": 3.864880163183709e-06, "loss": 0.2915, "loss_nan_ranks": 0, "loss_rank_avg": 0.17876118421554565, "step": 3280, "valid_targets_mean": 2609.9, "valid_targets_min": 1104 }, { "epoch": 5.743006993006993, "grad_norm": 0.5991337075244536, "learning_rate": 3.813512179410317e-06, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.28599756956100464, "step": 3285, "valid_targets_mean": 3688.8, "valid_targets_min": 1165 }, { "epoch": 5.751748251748252, "grad_norm": 0.5243673827463061, "learning_rate": 3.762451850062501e-06, "loss": 0.2918, "loss_nan_ranks": 0, "loss_rank_avg": 0.2722562551498413, "step": 3290, "valid_targets_mean": 4477.4, "valid_targets_min": 1031 }, { "epoch": 5.760489510489511, "grad_norm": 0.6658579790305317, "learning_rate": 3.711700145637156e-06, "loss": 0.3113, "loss_nan_ranks": 0, "loss_rank_avg": 0.33141064643859863, "step": 3295, "valid_targets_mean": 3457.7, "valid_targets_min": 1188 }, { "epoch": 5.769230769230769, "grad_norm": 0.5388723983560816, "learning_rate": 3.6612580307652024e-06, "loss": 0.293, "loss_nan_ranks": 0, "loss_rank_avg": 0.309293270111084, "step": 3300, "valid_targets_mean": 5008.1, "valid_targets_min": 350 }, { "epoch": 5.777972027972028, "grad_norm": 0.5300494283794329, "learning_rate": 3.611126464193211e-06, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.3127099871635437, "step": 3305, "valid_targets_mean": 5129.1, "valid_targets_min": 1776 }, { "epoch": 5.786713286713287, "grad_norm": 0.5734939334413017, "learning_rate": 3.561306398765225e-06, "loss": 0.2787, "loss_nan_ranks": 0, "loss_rank_avg": 0.2457369565963745, "step": 3310, "valid_targets_mean": 3891.1, "valid_targets_min": 1186 }, { "epoch": 5.795454545454545, "grad_norm": 0.5898212051083919, "learning_rate": 3.5117987814046074e-06, "loss": 0.2943, "loss_nan_ranks": 0, "loss_rank_avg": 0.22512537240982056, "step": 3315, "valid_targets_mean": 3410.9, "valid_targets_min": 1094 }, { "epoch": 5.804195804195804, "grad_norm": 0.6207274470955104, "learning_rate": 3.4626045530960696e-06, "loss": 0.2832, "loss_nan_ranks": 0, "loss_rank_avg": 0.30430057644844055, "step": 3320, "valid_targets_mean": 4685.4, "valid_targets_min": 1113 }, { "epoch": 5.812937062937063, "grad_norm": 0.608742829096707, "learning_rate": 3.4137246488677866e-06, "loss": 0.2673, "loss_nan_ranks": 0, "loss_rank_avg": 0.3098594546318054, "step": 3325, "valid_targets_mean": 3769.6, "valid_targets_min": 1045 }, { "epoch": 5.821678321678322, "grad_norm": 0.5846165269760552, "learning_rate": 3.365159997773606e-06, "loss": 0.2942, "loss_nan_ranks": 0, "loss_rank_avg": 0.22525198757648468, "step": 3330, "valid_targets_mean": 3777.8, "valid_targets_min": 1666 }, { "epoch": 5.83041958041958, "grad_norm": 0.6111370595067496, "learning_rate": 3.3169115228754014e-06, "loss": 0.309, "loss_nan_ranks": 0, "loss_rank_avg": 0.36875244975090027, "step": 3335, "valid_targets_mean": 4112.8, "valid_targets_min": 753 }, { "epoch": 5.839160839160839, "grad_norm": 0.5387375942451661, "learning_rate": 3.268980141225537e-06, "loss": 0.3289, "loss_nan_ranks": 0, "loss_rank_avg": 0.31299394369125366, "step": 3340, "valid_targets_mean": 5053.8, "valid_targets_min": 1449 }, { "epoch": 5.847902097902098, "grad_norm": 0.6240330539437785, "learning_rate": 3.221366763849423e-06, "loss": 0.2531, "loss_nan_ranks": 0, "loss_rank_avg": 0.26625147461891174, "step": 3345, "valid_targets_mean": 3334.1, "valid_targets_min": 1340 }, { "epoch": 5.856643356643357, "grad_norm": 0.7043735642239611, "learning_rate": 3.1740722957281923e-06, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.3169170618057251, "step": 3350, "valid_targets_mean": 3898.0, "valid_targets_min": 974 }, { "epoch": 5.865384615384615, "grad_norm": 0.4821674121878327, "learning_rate": 3.127097635781533e-06, "loss": 0.2709, "loss_nan_ranks": 0, "loss_rank_avg": 0.2442520707845688, "step": 3355, "valid_targets_mean": 5463.6, "valid_targets_min": 1323 }, { "epoch": 5.874125874125874, "grad_norm": 0.59032654806126, "learning_rate": 3.080443676850575e-06, "loss": 0.3114, "loss_nan_ranks": 0, "loss_rank_avg": 0.3039432168006897, "step": 3360, "valid_targets_mean": 4510.3, "valid_targets_min": 1476 }, { "epoch": 5.882867132867133, "grad_norm": 0.5711335653285038, "learning_rate": 3.0341113056809113e-06, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.3196086883544922, "step": 3365, "valid_targets_mean": 4369.4, "valid_targets_min": 1253 }, { "epoch": 5.891608391608392, "grad_norm": 0.6147801856977855, "learning_rate": 2.9881014029057853e-06, "loss": 0.2907, "loss_nan_ranks": 0, "loss_rank_avg": 0.34057629108428955, "step": 3370, "valid_targets_mean": 4283.4, "valid_targets_min": 1334 }, { "epoch": 5.90034965034965, "grad_norm": 0.5972285440857505, "learning_rate": 2.942414843029302e-06, "loss": 0.2705, "loss_nan_ranks": 0, "loss_rank_avg": 0.2990839183330536, "step": 3375, "valid_targets_mean": 4576.2, "valid_targets_min": 885 }, { "epoch": 5.909090909090909, "grad_norm": 0.5952021910403875, "learning_rate": 2.89705249440984e-06, "loss": 0.2577, "loss_nan_ranks": 0, "loss_rank_avg": 0.27879855036735535, "step": 3380, "valid_targets_mean": 3924.9, "valid_targets_min": 758 }, { "epoch": 5.9178321678321675, "grad_norm": 0.6227318532091863, "learning_rate": 2.8520152192435468e-06, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.22561070322990417, "step": 3385, "valid_targets_mean": 3241.6, "valid_targets_min": 835 }, { "epoch": 5.926573426573427, "grad_norm": 0.6036831338415529, "learning_rate": 2.807303873547931e-06, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.269223153591156, "step": 3390, "valid_targets_mean": 3960.1, "valid_targets_min": 1308 }, { "epoch": 5.935314685314685, "grad_norm": 0.6198564976381323, "learning_rate": 2.7629193071455974e-06, "loss": 0.2978, "loss_nan_ranks": 0, "loss_rank_avg": 0.2761087417602539, "step": 3395, "valid_targets_mean": 3745.8, "valid_targets_min": 1250 }, { "epoch": 5.944055944055944, "grad_norm": 0.5769269392848372, "learning_rate": 2.718862363648118e-06, "loss": 0.2963, "loss_nan_ranks": 0, "loss_rank_avg": 0.28240329027175903, "step": 3400, "valid_targets_mean": 4084.9, "valid_targets_min": 838 }, { "epoch": 5.9527972027972025, "grad_norm": 0.5159296065059323, "learning_rate": 2.6751338804399685e-06, "loss": 0.3087, "loss_nan_ranks": 0, "loss_rank_avg": 0.33804747462272644, "step": 3405, "valid_targets_mean": 6029.0, "valid_targets_min": 1526 }, { "epoch": 5.961538461538462, "grad_norm": 0.5627855303755237, "learning_rate": 2.6317346886626192e-06, "loss": 0.299, "loss_nan_ranks": 0, "loss_rank_avg": 0.29597389698028564, "step": 3410, "valid_targets_mean": 4527.5, "valid_targets_min": 1235 }, { "epoch": 5.97027972027972, "grad_norm": 0.5297648101917568, "learning_rate": 2.5886656131987575e-06, "loss": 0.2732, "loss_nan_ranks": 0, "loss_rank_avg": 0.2557566165924072, "step": 3415, "valid_targets_mean": 4257.1, "valid_targets_min": 851 }, { "epoch": 5.979020979020979, "grad_norm": 0.6191215344301044, "learning_rate": 2.5459274726565752e-06, "loss": 0.2773, "loss_nan_ranks": 0, "loss_rank_avg": 0.23104539513587952, "step": 3420, "valid_targets_mean": 2965.7, "valid_targets_min": 1289 }, { "epoch": 5.9877622377622375, "grad_norm": 0.7122036934147264, "learning_rate": 2.5035210793542387e-06, "loss": 0.3233, "loss_nan_ranks": 0, "loss_rank_avg": 0.31105631589889526, "step": 3425, "valid_targets_mean": 4595.3, "valid_targets_min": 923 }, { "epoch": 5.996503496503497, "grad_norm": 0.6248335921345303, "learning_rate": 2.461447239304444e-06, "loss": 0.2838, "loss_nan_ranks": 0, "loss_rank_avg": 0.31339454650878906, "step": 3430, "valid_targets_mean": 3528.1, "valid_targets_min": 839 }, { "epoch": 6.005244755244755, "grad_norm": 0.6546736256801129, "learning_rate": 2.41970675219908e-06, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.1906014084815979, "step": 3435, "valid_targets_mean": 2545.0, "valid_targets_min": 915 }, { "epoch": 6.013986013986014, "grad_norm": 0.546331877599847, "learning_rate": 2.378300411394041e-06, "loss": 0.2693, "loss_nan_ranks": 0, "loss_rank_avg": 0.21837225556373596, "step": 3440, "valid_targets_mean": 3521.7, "valid_targets_min": 844 }, { "epoch": 6.0227272727272725, "grad_norm": 0.5676929839026588, "learning_rate": 2.337229003894157e-06, "loss": 0.3256, "loss_nan_ranks": 0, "loss_rank_avg": 0.36682766675949097, "step": 3445, "valid_targets_mean": 4742.9, "valid_targets_min": 1237 }, { "epoch": 6.031468531468532, "grad_norm": 0.5669674632220835, "learning_rate": 2.2964933103382148e-06, "loss": 0.2658, "loss_nan_ranks": 0, "loss_rank_avg": 0.28727206587791443, "step": 3450, "valid_targets_mean": 4004.6, "valid_targets_min": 1310 }, { "epoch": 6.04020979020979, "grad_norm": 0.6309898614135956, "learning_rate": 2.2560941049841346e-06, "loss": 0.2761, "loss_nan_ranks": 0, "loss_rank_avg": 0.20886394381523132, "step": 3455, "valid_targets_mean": 2680.5, "valid_targets_min": 1059 }, { "epoch": 6.048951048951049, "grad_norm": 0.60928327793459, "learning_rate": 2.2160321556942544e-06, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.30445602536201477, "step": 3460, "valid_targets_mean": 4046.9, "valid_targets_min": 915 }, { "epoch": 6.0576923076923075, "grad_norm": 0.7833054139185534, "learning_rate": 2.1763082239207266e-06, "loss": 0.253, "loss_nan_ranks": 0, "loss_rank_avg": 0.21612828969955444, "step": 3465, "valid_targets_mean": 2976.7, "valid_targets_min": 1566 }, { "epoch": 6.066433566433567, "grad_norm": 0.6497425853670982, "learning_rate": 2.136923064691041e-06, "loss": 0.2543, "loss_nan_ranks": 0, "loss_rank_avg": 0.15709246695041656, "step": 3470, "valid_targets_mean": 2333.2, "valid_targets_min": 858 }, { "epoch": 6.075174825174825, "grad_norm": 0.6725133904006579, "learning_rate": 2.097877426593704e-06, "loss": 0.2637, "loss_nan_ranks": 0, "loss_rank_avg": 0.20932920277118683, "step": 3475, "valid_targets_mean": 2497.1, "valid_targets_min": 815 }, { "epoch": 6.083916083916084, "grad_norm": 0.6290252855540327, "learning_rate": 2.0591720517639713e-06, "loss": 0.3105, "loss_nan_ranks": 0, "loss_rank_avg": 0.2524038553237915, "step": 3480, "valid_targets_mean": 3004.4, "valid_targets_min": 823 }, { "epoch": 6.0926573426573425, "grad_norm": 0.6862544212215417, "learning_rate": 2.020807675869758e-06, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.2957307696342468, "step": 3485, "valid_targets_mean": 4532.2, "valid_targets_min": 361 }, { "epoch": 6.101398601398602, "grad_norm": 0.6485079485932239, "learning_rate": 1.9827850280976733e-06, "loss": 0.2767, "loss_nan_ranks": 0, "loss_rank_avg": 0.32891833782196045, "step": 3490, "valid_targets_mean": 4233.2, "valid_targets_min": 278 }, { "epoch": 6.11013986013986, "grad_norm": 0.6921512870006977, "learning_rate": 1.9451048311391375e-06, "loss": 0.2905, "loss_nan_ranks": 0, "loss_rank_avg": 0.26255372166633606, "step": 3495, "valid_targets_mean": 3512.6, "valid_targets_min": 894 }, { "epoch": 6.118881118881119, "grad_norm": 0.6208115294079365, "learning_rate": 1.9077678011766455e-06, "loss": 0.3224, "loss_nan_ranks": 0, "loss_rank_avg": 0.29941844940185547, "step": 3500, "valid_targets_mean": 3561.2, "valid_targets_min": 1191 }, { "epoch": 6.1276223776223775, "grad_norm": 0.5916073069732769, "learning_rate": 1.8707746478701794e-06, "loss": 0.3104, "loss_nan_ranks": 0, "loss_rank_avg": 0.296660840511322, "step": 3505, "valid_targets_mean": 3865.4, "valid_targets_min": 1120 }, { "epoch": 6.136363636363637, "grad_norm": 0.5576227926843184, "learning_rate": 1.8341260743436873e-06, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.2193690687417984, "step": 3510, "valid_targets_mean": 3824.8, "valid_targets_min": 865 }, { "epoch": 6.145104895104895, "grad_norm": 0.5853811367031623, "learning_rate": 1.7978227771717405e-06, "loss": 0.2832, "loss_nan_ranks": 0, "loss_rank_avg": 0.3498114347457886, "step": 3515, "valid_targets_mean": 4405.4, "valid_targets_min": 1504 }, { "epoch": 6.153846153846154, "grad_norm": 0.6053214238879862, "learning_rate": 1.7618654463662954e-06, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.28211668133735657, "step": 3520, "valid_targets_mean": 3949.8, "valid_targets_min": 1235 }, { "epoch": 6.1625874125874125, "grad_norm": 0.566264654468671, "learning_rate": 1.7262547653635641e-06, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.2645253539085388, "step": 3525, "valid_targets_mean": 3999.5, "valid_targets_min": 968 }, { "epoch": 6.171328671328672, "grad_norm": 0.6113838491407106, "learning_rate": 1.6909914110110293e-06, "loss": 0.2567, "loss_nan_ranks": 0, "loss_rank_avg": 0.24374493956565857, "step": 3530, "valid_targets_mean": 3655.2, "valid_targets_min": 1315 }, { "epoch": 6.18006993006993, "grad_norm": 0.5494925652722575, "learning_rate": 1.656076053554594e-06, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.2420923113822937, "step": 3535, "valid_targets_mean": 4067.6, "valid_targets_min": 801 }, { "epoch": 6.188811188811189, "grad_norm": 0.6071906510133728, "learning_rate": 1.621509356625819e-06, "loss": 0.2674, "loss_nan_ranks": 0, "loss_rank_avg": 0.26888033747673035, "step": 3540, "valid_targets_mean": 4184.9, "valid_targets_min": 1107 }, { "epoch": 6.1975524475524475, "grad_norm": 0.6406113556865684, "learning_rate": 1.5872919772293215e-06, "loss": 0.2574, "loss_nan_ranks": 0, "loss_rank_avg": 0.24279576539993286, "step": 3545, "valid_targets_mean": 3324.6, "valid_targets_min": 1078 }, { "epoch": 6.206293706293707, "grad_norm": 0.6003844929874508, "learning_rate": 1.5534245657302994e-06, "loss": 0.2954, "loss_nan_ranks": 0, "loss_rank_avg": 0.28774210810661316, "step": 3550, "valid_targets_mean": 4073.2, "valid_targets_min": 1522 }, { "epoch": 6.215034965034965, "grad_norm": 0.6802616494670375, "learning_rate": 1.5199077658421368e-06, "loss": 0.2862, "loss_nan_ranks": 0, "loss_rank_avg": 0.24521152675151825, "step": 3555, "valid_targets_mean": 2741.4, "valid_targets_min": 897 }, { "epoch": 6.223776223776224, "grad_norm": 0.5311261915809192, "learning_rate": 1.486742214614205e-06, "loss": 0.296, "loss_nan_ranks": 0, "loss_rank_avg": 0.29008519649505615, "step": 3560, "valid_targets_mean": 4434.4, "valid_targets_min": 1423 }, { "epoch": 6.2325174825174825, "grad_norm": 0.574513939046325, "learning_rate": 1.4539285424197401e-06, "loss": 0.2807, "loss_nan_ranks": 0, "loss_rank_avg": 0.32967033982276917, "step": 3565, "valid_targets_mean": 4577.4, "valid_targets_min": 1109 }, { "epoch": 6.241258741258742, "grad_norm": 0.49392742782010396, "learning_rate": 1.42146737294385e-06, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.3063806891441345, "step": 3570, "valid_targets_mean": 5692.9, "valid_targets_min": 1531 }, { "epoch": 6.25, "grad_norm": 0.5578568105254652, "learning_rate": 1.3893593231716685e-06, "loss": 0.2481, "loss_nan_ranks": 0, "loss_rank_avg": 0.2709795832633972, "step": 3575, "valid_targets_mean": 4448.0, "valid_targets_min": 1255 }, { "epoch": 6.258741258741258, "grad_norm": 0.6101064186593799, "learning_rate": 1.3576050033766431e-06, "loss": 0.2661, "loss_nan_ranks": 0, "loss_rank_avg": 0.3113132119178772, "step": 3580, "valid_targets_mean": 3706.6, "valid_targets_min": 1213 }, { "epoch": 6.2674825174825175, "grad_norm": 0.6295757030791121, "learning_rate": 1.3262050171089125e-06, "loss": 0.2887, "loss_nan_ranks": 0, "loss_rank_avg": 0.2644977271556854, "step": 3585, "valid_targets_mean": 3470.4, "valid_targets_min": 315 }, { "epoch": 6.276223776223776, "grad_norm": 0.5663034758396543, "learning_rate": 1.2951599611838494e-06, "loss": 0.2756, "loss_nan_ranks": 0, "loss_rank_avg": 0.26824554800987244, "step": 3590, "valid_targets_mean": 3999.2, "valid_targets_min": 838 }, { "epoch": 6.284965034965035, "grad_norm": 0.6036200941709391, "learning_rate": 1.264470425670712e-06, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.3287750482559204, "step": 3595, "valid_targets_mean": 5751.5, "valid_targets_min": 1197 }, { "epoch": 6.293706293706293, "grad_norm": 0.5810804752661107, "learning_rate": 1.234136993881423e-06, "loss": 0.2526, "loss_nan_ranks": 0, "loss_rank_avg": 0.2942957282066345, "step": 3600, "valid_targets_mean": 4172.7, "valid_targets_min": 912 }, { "epoch": 6.3024475524475525, "grad_norm": 0.657214863100275, "learning_rate": 1.2041602423595e-06, "loss": 0.2634, "loss_nan_ranks": 0, "loss_rank_avg": 0.18747061491012573, "step": 3605, "valid_targets_mean": 2734.8, "valid_targets_min": 985 }, { "epoch": 6.311188811188811, "grad_norm": 0.6501996468721265, "learning_rate": 1.174540740869079e-06, "loss": 0.2772, "loss_nan_ranks": 0, "loss_rank_avg": 0.32021254301071167, "step": 3610, "valid_targets_mean": 3323.9, "valid_targets_min": 749 }, { "epoch": 6.31993006993007, "grad_norm": 0.5803676942137402, "learning_rate": 1.1452790523840895e-06, "loss": 0.2754, "loss_nan_ranks": 0, "loss_rank_avg": 0.281261146068573, "step": 3615, "valid_targets_mean": 4163.1, "valid_targets_min": 771 }, { "epoch": 6.328671328671328, "grad_norm": 0.7055138161863601, "learning_rate": 1.1163757330775683e-06, "loss": 0.3053, "loss_nan_ranks": 0, "loss_rank_avg": 0.18472999334335327, "step": 3620, "valid_targets_mean": 2490.1, "valid_targets_min": 1264 }, { "epoch": 6.3374125874125875, "grad_norm": 0.6313383239462723, "learning_rate": 1.0878313323110624e-06, "loss": 0.3055, "loss_nan_ranks": 0, "loss_rank_avg": 0.2720009684562683, "step": 3625, "valid_targets_mean": 3518.5, "valid_targets_min": 828 }, { "epoch": 6.346153846153846, "grad_norm": 0.6561844097817968, "learning_rate": 1.0596463926242117e-06, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.23926571011543274, "step": 3630, "valid_targets_mean": 2988.6, "valid_targets_min": 897 }, { "epoch": 6.354895104895105, "grad_norm": 0.5665310024576693, "learning_rate": 1.0318214497244194e-06, "loss": 0.3238, "loss_nan_ranks": 0, "loss_rank_avg": 0.3651200830936432, "step": 3635, "valid_targets_mean": 5215.1, "valid_targets_min": 1625 }, { "epoch": 6.363636363636363, "grad_norm": 0.6554284589319097, "learning_rate": 1.0043570324766905e-06, "loss": 0.2894, "loss_nan_ranks": 0, "loss_rank_avg": 0.24973063170909882, "step": 3640, "valid_targets_mean": 2915.8, "valid_targets_min": 777 }, { "epoch": 6.3723776223776225, "grad_norm": 0.7008129809196576, "learning_rate": 9.772536628935492e-07, "loss": 0.283, "loss_nan_ranks": 0, "loss_rank_avg": 0.24499808251857758, "step": 3645, "valid_targets_mean": 2670.0, "valid_targets_min": 1221 }, { "epoch": 6.381118881118881, "grad_norm": 0.7024012851039138, "learning_rate": 9.505118561251514e-07, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.2695966362953186, "step": 3650, "valid_targets_mean": 2731.5, "valid_targets_min": 866 }, { "epoch": 6.38986013986014, "grad_norm": 0.5845704369992565, "learning_rate": 9.241321204494658e-07, "loss": 0.2456, "loss_nan_ranks": 0, "loss_rank_avg": 0.25256311893463135, "step": 3655, "valid_targets_mean": 4473.8, "valid_targets_min": 1264 }, { "epoch": 6.398601398601398, "grad_norm": 0.5813539539242096, "learning_rate": 8.981149572626214e-07, "loss": 0.2553, "loss_nan_ranks": 0, "loss_rank_avg": 0.152411550283432, "step": 3660, "valid_targets_mean": 2954.5, "valid_targets_min": 840 }, { "epoch": 6.4073426573426575, "grad_norm": 0.8400642322428409, "learning_rate": 8.724608610693952e-07, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.2882179915904999, "step": 3665, "valid_targets_mean": 3022.2, "valid_targets_min": 1200 }, { "epoch": 6.416083916083916, "grad_norm": 0.7360779762095463, "learning_rate": 8.471703194737846e-07, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.2204851359128952, "step": 3670, "valid_targets_mean": 2568.9, "valid_targets_min": 1137 }, { "epoch": 6.424825174825175, "grad_norm": 0.5801639551802711, "learning_rate": 8.222438131697541e-07, "loss": 0.2705, "loss_nan_ranks": 0, "loss_rank_avg": 0.25313958525657654, "step": 3675, "valid_targets_mean": 3821.8, "valid_targets_min": 938 }, { "epoch": 6.433566433566433, "grad_norm": 0.6509857982198833, "learning_rate": 7.976818159321031e-07, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.24882566928863525, "step": 3680, "valid_targets_mean": 3058.3, "valid_targets_min": 867 }, { "epoch": 6.4423076923076925, "grad_norm": 0.5859694732821341, "learning_rate": 7.734847946074531e-07, "loss": 0.2945, "loss_nan_ranks": 0, "loss_rank_avg": 0.23909510672092438, "step": 3685, "valid_targets_mean": 3752.7, "valid_targets_min": 1217 }, { "epoch": 6.451048951048951, "grad_norm": 0.4932257801456551, "learning_rate": 7.496532091053765e-07, "loss": 0.2555, "loss_nan_ranks": 0, "loss_rank_avg": 0.3305898904800415, "step": 3690, "valid_targets_mean": 5985.6, "valid_targets_min": 1330 }, { "epoch": 6.45979020979021, "grad_norm": 0.6428645373849343, "learning_rate": 7.261875123896533e-07, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.33091801404953003, "step": 3695, "valid_targets_mean": 4158.1, "valid_targets_min": 836 }, { "epoch": 6.468531468531468, "grad_norm": 0.6419446507900263, "learning_rate": 7.030881504696708e-07, "loss": 0.2879, "loss_nan_ranks": 0, "loss_rank_avg": 0.28880882263183594, "step": 3700, "valid_targets_mean": 4430.9, "valid_targets_min": 1343 }, { "epoch": 6.4772727272727275, "grad_norm": 0.6349223749579598, "learning_rate": 6.803555623919322e-07, "loss": 0.2867, "loss_nan_ranks": 0, "loss_rank_avg": 0.22542111575603485, "step": 3705, "valid_targets_mean": 3429.0, "valid_targets_min": 1425 }, { "epoch": 6.486013986013986, "grad_norm": 0.5586249125018691, "learning_rate": 6.579901802317223e-07, "loss": 0.326, "loss_nan_ranks": 0, "loss_rank_avg": 0.3446670174598694, "step": 3710, "valid_targets_mean": 5845.7, "valid_targets_min": 1794 }, { "epoch": 6.494755244755245, "grad_norm": 0.5654988182171874, "learning_rate": 6.359924290848929e-07, "loss": 0.309, "loss_nan_ranks": 0, "loss_rank_avg": 0.37433212995529175, "step": 3715, "valid_targets_mean": 4621.6, "valid_targets_min": 1213 }, { "epoch": 6.503496503496503, "grad_norm": 0.5671227364089624, "learning_rate": 6.143627270597785e-07, "loss": 0.2255, "loss_nan_ranks": 0, "loss_rank_avg": 0.17292237281799316, "step": 3720, "valid_targets_mean": 3233.8, "valid_targets_min": 1087 }, { "epoch": 6.5122377622377625, "grad_norm": 0.6425112452389675, "learning_rate": 5.931014852692541e-07, "loss": 0.2728, "loss_nan_ranks": 0, "loss_rank_avg": 0.26524510979652405, "step": 3725, "valid_targets_mean": 3356.4, "valid_targets_min": 882 }, { "epoch": 6.520979020979021, "grad_norm": 0.5756543070733119, "learning_rate": 5.72209107822923e-07, "loss": 0.274, "loss_nan_ranks": 0, "loss_rank_avg": 0.29785022139549255, "step": 3730, "valid_targets_mean": 4071.3, "valid_targets_min": 1156 }, { "epoch": 6.52972027972028, "grad_norm": 0.6271284223823304, "learning_rate": 5.516859918194262e-07, "loss": 0.307, "loss_nan_ranks": 0, "loss_rank_avg": 0.29389727115631104, "step": 3735, "valid_targets_mean": 3572.2, "valid_targets_min": 968 }, { "epoch": 6.538461538461538, "grad_norm": 0.5863542188132574, "learning_rate": 5.315325273389094e-07, "loss": 0.2827, "loss_nan_ranks": 0, "loss_rank_avg": 0.26336008310317993, "step": 3740, "valid_targets_mean": 4096.9, "valid_targets_min": 347 }, { "epoch": 6.5472027972027975, "grad_norm": 0.6259632998483117, "learning_rate": 5.117490974355943e-07, "loss": 0.3089, "loss_nan_ranks": 0, "loss_rank_avg": 0.30066174268722534, "step": 3745, "valid_targets_mean": 3837.0, "valid_targets_min": 1444 }, { "epoch": 6.555944055944056, "grad_norm": 0.5762913607782765, "learning_rate": 4.923360781305087e-07, "loss": 0.2835, "loss_nan_ranks": 0, "loss_rank_avg": 0.30665403604507446, "step": 3750, "valid_targets_mean": 4425.5, "valid_targets_min": 400 }, { "epoch": 6.564685314685315, "grad_norm": 0.604842563995092, "learning_rate": 4.7329383840433395e-07, "loss": 0.2822, "loss_nan_ranks": 0, "loss_rank_avg": 0.24494880437850952, "step": 3755, "valid_targets_mean": 3657.3, "valid_targets_min": 1207 }, { "epoch": 6.573426573426573, "grad_norm": 0.6627025272241348, "learning_rate": 4.546227401903913e-07, "loss": 0.3036, "loss_nan_ranks": 0, "loss_rank_avg": 0.3197290599346161, "step": 3760, "valid_targets_mean": 3325.8, "valid_targets_min": 779 }, { "epoch": 6.5821678321678325, "grad_norm": 0.539869528159097, "learning_rate": 4.363231383677691e-07, "loss": 0.2681, "loss_nan_ranks": 0, "loss_rank_avg": 0.2869723439216614, "step": 3765, "valid_targets_mean": 5366.8, "valid_targets_min": 1013 }, { "epoch": 6.590909090909091, "grad_norm": 0.5724917365681328, "learning_rate": 4.1839538075456597e-07, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.2898808717727661, "step": 3770, "valid_targets_mean": 4081.4, "valid_targets_min": 1344 }, { "epoch": 6.59965034965035, "grad_norm": 0.6592760685566884, "learning_rate": 4.0083980810129876e-07, "loss": 0.3064, "loss_nan_ranks": 0, "loss_rank_avg": 0.2967371940612793, "step": 3775, "valid_targets_mean": 3181.4, "valid_targets_min": 872 }, { "epoch": 6.608391608391608, "grad_norm": 0.606456437191496, "learning_rate": 3.8365675408439827e-07, "loss": 0.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.24623604118824005, "step": 3780, "valid_targets_mean": 3611.8, "valid_targets_min": 1044 }, { "epoch": 6.617132867132867, "grad_norm": 0.5829659808615845, "learning_rate": 3.6684654529989704e-07, "loss": 0.2572, "loss_nan_ranks": 0, "loss_rank_avg": 0.2534424066543579, "step": 3785, "valid_targets_mean": 3794.0, "valid_targets_min": 665 }, { "epoch": 6.625874125874126, "grad_norm": 0.586621741689212, "learning_rate": 3.504095012572006e-07, "loss": 0.2773, "loss_nan_ranks": 0, "loss_rank_avg": 0.2955080270767212, "step": 3790, "valid_targets_mean": 4248.8, "valid_targets_min": 1314 }, { "epoch": 6.634615384615385, "grad_norm": 0.6326737534702042, "learning_rate": 3.3434593437302155e-07, "loss": 0.315, "loss_nan_ranks": 0, "loss_rank_avg": 0.3392415940761566, "step": 3795, "valid_targets_mean": 3692.1, "valid_targets_min": 1609 }, { "epoch": 6.643356643356643, "grad_norm": 0.561790153450764, "learning_rate": 3.1865614996544834e-07, "loss": 0.2749, "loss_nan_ranks": 0, "loss_rank_avg": 0.322073757648468, "step": 3800, "valid_targets_mean": 4551.2, "valid_targets_min": 785 }, { "epoch": 6.652097902097902, "grad_norm": 0.5628076005463111, "learning_rate": 3.0334044624812596e-07, "loss": 0.2849, "loss_nan_ranks": 0, "loss_rank_avg": 0.2843906581401825, "step": 3805, "valid_targets_mean": 4424.9, "valid_targets_min": 1046 }, { "epoch": 6.660839160839161, "grad_norm": 0.5160597220001579, "learning_rate": 2.883991143246023e-07, "loss": 0.251, "loss_nan_ranks": 0, "loss_rank_avg": 0.2697199583053589, "step": 3810, "valid_targets_mean": 4928.8, "valid_targets_min": 1110 }, { "epoch": 6.66958041958042, "grad_norm": 0.5931743945808303, "learning_rate": 2.73832438182795e-07, "loss": 0.2617, "loss_nan_ranks": 0, "loss_rank_avg": 0.2316768765449524, "step": 3815, "valid_targets_mean": 3766.6, "valid_targets_min": 1408 }, { "epoch": 6.678321678321678, "grad_norm": 0.5442096900994562, "learning_rate": 2.59640694689578e-07, "loss": 0.3055, "loss_nan_ranks": 0, "loss_rank_avg": 0.2675340175628662, "step": 3820, "valid_targets_mean": 4535.4, "valid_targets_min": 994 }, { "epoch": 6.687062937062937, "grad_norm": 1.8394774855479727, "learning_rate": 2.458241535855388e-07, "loss": 0.269, "loss_nan_ranks": 0, "loss_rank_avg": 0.26005691289901733, "step": 3825, "valid_targets_mean": 3036.9, "valid_targets_min": 1137 }, { "epoch": 6.695804195804196, "grad_norm": 0.6113943146191173, "learning_rate": 2.32383077479843e-07, "loss": 0.3076, "loss_nan_ranks": 0, "loss_rank_avg": 0.33162689208984375, "step": 3830, "valid_targets_mean": 4674.4, "valid_targets_min": 906 }, { "epoch": 6.704545454545455, "grad_norm": 0.6602273502952561, "learning_rate": 2.1931772184523358e-07, "loss": 0.2879, "loss_nan_ranks": 0, "loss_rank_avg": 0.309783935546875, "step": 3835, "valid_targets_mean": 3429.7, "valid_targets_min": 1079 }, { "epoch": 6.713286713286713, "grad_norm": 0.5736876331423237, "learning_rate": 2.0662833501319702e-07, "loss": 0.2892, "loss_nan_ranks": 0, "loss_rank_avg": 0.32325828075408936, "step": 3840, "valid_targets_mean": 4180.1, "valid_targets_min": 1209 }, { "epoch": 6.722027972027972, "grad_norm": 0.6126276173990889, "learning_rate": 1.9431515816922042e-07, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.2594378888607025, "step": 3845, "valid_targets_mean": 3517.1, "valid_targets_min": 1114 }, { "epoch": 6.730769230769231, "grad_norm": 0.58394492206243, "learning_rate": 1.8237842534822636e-07, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.2913021743297577, "step": 3850, "valid_targets_mean": 4055.2, "valid_targets_min": 1327 }, { "epoch": 6.739510489510489, "grad_norm": 0.7192431832478173, "learning_rate": 1.7081836343010748e-07, "loss": 0.2643, "loss_nan_ranks": 0, "loss_rank_avg": 0.22975113987922668, "step": 3855, "valid_targets_mean": 2542.4, "valid_targets_min": 1030 }, { "epoch": 6.748251748251748, "grad_norm": 0.5767349334206501, "learning_rate": 1.5963519213542555e-07, "loss": 0.302, "loss_nan_ranks": 0, "loss_rank_avg": 0.30083373188972473, "step": 3860, "valid_targets_mean": 4077.9, "valid_targets_min": 1071 }, { "epoch": 6.756993006993007, "grad_norm": 0.6081230019210105, "learning_rate": 1.4882912402123696e-07, "loss": 0.2919, "loss_nan_ranks": 0, "loss_rank_avg": 0.3036191463470459, "step": 3865, "valid_targets_mean": 3846.3, "valid_targets_min": 1381 }, { "epoch": 6.765734265734266, "grad_norm": 0.5891570706997271, "learning_rate": 1.3840036447704042e-07, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.20486155152320862, "step": 3870, "valid_targets_mean": 3797.2, "valid_targets_min": 363 }, { "epoch": 6.774475524475524, "grad_norm": 0.6322766168986574, "learning_rate": 1.2834911172088683e-07, "loss": 0.2843, "loss_nan_ranks": 0, "loss_rank_avg": 0.31095296144485474, "step": 3875, "valid_targets_mean": 3419.8, "valid_targets_min": 788 }, { "epoch": 6.783216783216783, "grad_norm": 0.6409732017990925, "learning_rate": 1.1867555679560217e-07, "loss": 0.2421, "loss_nan_ranks": 0, "loss_rank_avg": 0.2345668077468872, "step": 3880, "valid_targets_mean": 3109.5, "valid_targets_min": 792 }, { "epoch": 6.791958041958042, "grad_norm": 0.6299652829670256, "learning_rate": 1.093798835651616e-07, "loss": 0.3018, "loss_nan_ranks": 0, "loss_rank_avg": 0.20473377406597137, "step": 3885, "valid_targets_mean": 3211.1, "valid_targets_min": 1014 }, { "epoch": 6.800699300699301, "grad_norm": 0.6490254006725523, "learning_rate": 1.0046226871119002e-07, "loss": 0.2729, "loss_nan_ranks": 0, "loss_rank_avg": 0.28175103664398193, "step": 3890, "valid_targets_mean": 3185.8, "valid_targets_min": 915 }, { "epoch": 6.809440559440559, "grad_norm": 0.623847951653859, "learning_rate": 9.192288172961139e-08, "loss": 0.2862, "loss_nan_ranks": 0, "loss_rank_avg": 0.24998612701892853, "step": 3895, "valid_targets_mean": 3280.8, "valid_targets_min": 1436 }, { "epoch": 6.818181818181818, "grad_norm": 0.5647723189271752, "learning_rate": 8.376188492742021e-08, "loss": 0.2383, "loss_nan_ranks": 0, "loss_rank_avg": 0.28807640075683594, "step": 3900, "valid_targets_mean": 4534.2, "valid_targets_min": 875 }, { "epoch": 6.826923076923077, "grad_norm": 0.5941267825959952, "learning_rate": 7.597943341959957e-08, "loss": 0.2683, "loss_nan_ranks": 0, "loss_rank_avg": 0.2007588893175125, "step": 3905, "valid_targets_mean": 3297.1, "valid_targets_min": 1462 }, { "epoch": 6.835664335664336, "grad_norm": 0.6353613704744627, "learning_rate": 6.857567512617236e-08, "loss": 0.2994, "loss_nan_ranks": 0, "loss_rank_avg": 0.26361724734306335, "step": 3910, "valid_targets_mean": 3440.0, "valid_targets_min": 1558 }, { "epoch": 6.844405594405594, "grad_norm": 0.5656132531908707, "learning_rate": 6.155075076939244e-08, "loss": 0.2823, "loss_nan_ranks": 0, "loss_rank_avg": 0.30361640453338623, "step": 3915, "valid_targets_mean": 4592.8, "valid_targets_min": 1209 }, { "epoch": 6.853146853146853, "grad_norm": 0.6310367427887863, "learning_rate": 5.490479387106007e-08, "loss": 0.2793, "loss_nan_ranks": 0, "loss_rank_avg": 0.2142931967973709, "step": 3920, "valid_targets_mean": 3075.1, "valid_targets_min": 304 }, { "epoch": 6.861888111888112, "grad_norm": 0.6165604607896683, "learning_rate": 4.863793074999512e-08, "loss": 0.2996, "loss_nan_ranks": 0, "loss_rank_avg": 0.24841853976249695, "step": 3925, "valid_targets_mean": 3701.6, "valid_targets_min": 819 }, { "epoch": 6.870629370629371, "grad_norm": 0.5061668762750048, "learning_rate": 4.275028051963892e-08, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.24676506221294403, "step": 3930, "valid_targets_mean": 4298.7, "valid_targets_min": 754 }, { "epoch": 6.879370629370629, "grad_norm": 0.6960871564818618, "learning_rate": 3.7241955085773884e-08, "loss": 0.2763, "loss_nan_ranks": 0, "loss_rank_avg": 0.22061927616596222, "step": 3935, "valid_targets_mean": 2478.1, "valid_targets_min": 1043 }, { "epoch": 6.888111888111888, "grad_norm": 0.6033700639408716, "learning_rate": 3.211305914441187e-08, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.2619025707244873, "step": 3940, "valid_targets_mean": 3731.0, "valid_targets_min": 777 }, { "epoch": 6.896853146853147, "grad_norm": 0.5730719084236546, "learning_rate": 2.736369017979579e-08, "loss": 0.2622, "loss_nan_ranks": 0, "loss_rank_avg": 0.25423169136047363, "step": 3945, "valid_targets_mean": 3761.8, "valid_targets_min": 1318 }, { "epoch": 6.905594405594406, "grad_norm": 0.5714109307509674, "learning_rate": 2.2993938462554377e-08, "loss": 0.2683, "loss_nan_ranks": 0, "loss_rank_avg": 0.31169724464416504, "step": 3950, "valid_targets_mean": 4320.3, "valid_targets_min": 1288 }, { "epoch": 6.914335664335664, "grad_norm": 0.7039855872325952, "learning_rate": 1.9003887047972515e-08, "loss": 0.2542, "loss_nan_ranks": 0, "loss_rank_avg": 0.2564855217933655, "step": 3955, "valid_targets_mean": 2501.0, "valid_targets_min": 258 }, { "epoch": 6.923076923076923, "grad_norm": 0.5977123819404943, "learning_rate": 1.5393611774434657e-08, "loss": 0.2882, "loss_nan_ranks": 0, "loss_rank_avg": 0.28014615178108215, "step": 3960, "valid_targets_mean": 3639.7, "valid_targets_min": 1208 }, { "epoch": 6.931818181818182, "grad_norm": 0.8262715036574306, "learning_rate": 1.2163181261959368e-08, "loss": 0.2998, "loss_nan_ranks": 0, "loss_rank_avg": 0.3190450668334961, "step": 3965, "valid_targets_mean": 4795.8, "valid_targets_min": 1200 }, { "epoch": 6.940559440559441, "grad_norm": 0.6693168848678276, "learning_rate": 9.312656910911432e-09, "loss": 0.2707, "loss_nan_ranks": 0, "loss_rank_avg": 0.28227052092552185, "step": 3970, "valid_targets_mean": 3110.6, "valid_targets_min": 860 }, { "epoch": 6.949300699300699, "grad_norm": 0.7086238255439974, "learning_rate": 6.8420929008317094e-09, "loss": 0.2721, "loss_nan_ranks": 0, "loss_rank_avg": 0.23945844173431396, "step": 3975, "valid_targets_mean": 2615.2, "valid_targets_min": 1022 }, { "epoch": 6.958041958041958, "grad_norm": 0.6720432782965369, "learning_rate": 4.751536189397943e-09, "loss": 0.2495, "loss_nan_ranks": 0, "loss_rank_avg": 0.1829328089952469, "step": 3980, "valid_targets_mean": 2545.9, "valid_targets_min": 1284 }, { "epoch": 6.966783216783217, "grad_norm": 0.6533371659227324, "learning_rate": 3.041026511545475e-09, "loss": 0.2582, "loss_nan_ranks": 0, "loss_rank_avg": 0.17008773982524872, "step": 3985, "valid_targets_mean": 2636.8, "valid_targets_min": 1230 }, { "epoch": 6.975524475524476, "grad_norm": 0.5251441298018588, "learning_rate": 1.7105963787078517e-09, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.33975541591644287, "step": 3990, "valid_targets_mean": 5142.2, "valid_targets_min": 1149 }, { "epoch": 6.984265734265734, "grad_norm": 0.6173950688495906, "learning_rate": 7.602710781884348e-10, "loss": 0.2756, "loss_nan_ranks": 0, "loss_rank_avg": 0.27754876017570496, "step": 3995, "valid_targets_mean": 3394.9, "valid_targets_min": 1074 }, { "epoch": 6.993006993006993, "grad_norm": 0.6366022888173039, "learning_rate": 1.9006867270077168e-10, "loss": 0.243, "loss_nan_ranks": 0, "loss_rank_avg": 0.24022555351257324, "step": 4000, "valid_targets_mean": 3167.0, "valid_targets_min": 1252 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.23146472871303558, "step": 4004, "total_flos": 735767221108736.0, "train_loss": 0.3356110471766907, "train_runtime": 16919.046, "train_samples_per_second": 3.782, "train_steps_per_second": 0.237, "valid_targets_mean": 3788.2, "valid_targets_min": 1011 } ], "logging_steps": 5, "max_steps": 4004, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 1500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 735767221108736.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }