{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 5026, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.006963788300835654, "grad_norm": 16.70025919180339, "learning_rate": 3.180914512922465e-07, "loss": 0.6604, "loss_nan_ranks": 0, "loss_rank_avg": 0.31003373861312866, "step": 5, "valid_targets_mean": 7389.0, "valid_targets_min": 5627 }, { "epoch": 0.013927576601671309, "grad_norm": 15.950547440699722, "learning_rate": 7.157057654075547e-07, "loss": 0.6983, "loss_nan_ranks": 0, "loss_rank_avg": 0.23548319935798645, "step": 10, "valid_targets_mean": 1294.8, "valid_targets_min": 422 }, { "epoch": 0.020891364902506964, "grad_norm": 13.622952098366161, "learning_rate": 1.113320079522863e-06, "loss": 0.6693, "loss_nan_ranks": 0, "loss_rank_avg": 0.31765997409820557, "step": 15, "valid_targets_mean": 8539.9, "valid_targets_min": 6761 }, { "epoch": 0.027855153203342618, "grad_norm": 9.836072650243178, "learning_rate": 1.5109343936381709e-06, "loss": 0.5881, "loss_nan_ranks": 0, "loss_rank_avg": 0.27282822132110596, "step": 20, "valid_targets_mean": 7579.0, "valid_targets_min": 6174 }, { "epoch": 0.034818941504178275, "grad_norm": 6.354639801298961, "learning_rate": 1.9085487077534792e-06, "loss": 0.5734, "loss_nan_ranks": 0, "loss_rank_avg": 0.2713155746459961, "step": 25, "valid_targets_mean": 7328.2, "valid_targets_min": 4839 }, { "epoch": 0.04178272980501393, "grad_norm": 5.430407653710302, "learning_rate": 2.3061630218687873e-06, "loss": 0.559, "loss_nan_ranks": 0, "loss_rank_avg": 0.29282844066619873, "step": 30, "valid_targets_mean": 6838.2, "valid_targets_min": 5034 }, { "epoch": 0.04874651810584958, "grad_norm": 4.877388127505224, "learning_rate": 2.703777335984096e-06, "loss": 0.5283, "loss_nan_ranks": 0, "loss_rank_avg": 0.25860846042633057, "step": 35, "valid_targets_mean": 7248.2, "valid_targets_min": 5567 }, { "epoch": 0.055710306406685235, "grad_norm": 2.846484730228359, "learning_rate": 3.101391650099404e-06, "loss": 0.4665, "loss_nan_ranks": 0, "loss_rank_avg": 0.21636009216308594, "step": 40, "valid_targets_mean": 6234.0, "valid_targets_min": 5603 }, { "epoch": 0.06267409470752089, "grad_norm": 2.963648252530947, "learning_rate": 3.499005964214712e-06, "loss": 0.4547, "loss_nan_ranks": 0, "loss_rank_avg": 0.10212111473083496, "step": 45, "valid_targets_mean": 602.0, "valid_targets_min": 152 }, { "epoch": 0.06963788300835655, "grad_norm": 1.0973687974221902, "learning_rate": 3.89662027833002e-06, "loss": 0.4081, "loss_nan_ranks": 0, "loss_rank_avg": 0.20101504027843475, "step": 50, "valid_targets_mean": 7299.9, "valid_targets_min": 6158 }, { "epoch": 0.0766016713091922, "grad_norm": 0.8984488229396836, "learning_rate": 4.294234592445328e-06, "loss": 0.4052, "loss_nan_ranks": 0, "loss_rank_avg": 0.1902889907360077, "step": 55, "valid_targets_mean": 6140.0, "valid_targets_min": 4648 }, { "epoch": 0.08356545961002786, "grad_norm": 0.78646128561226, "learning_rate": 4.6918489065606366e-06, "loss": 0.3897, "loss_nan_ranks": 0, "loss_rank_avg": 0.1944657266139984, "step": 60, "valid_targets_mean": 6603.0, "valid_targets_min": 4882 }, { "epoch": 0.0905292479108635, "grad_norm": 0.6308887930432894, "learning_rate": 5.089463220675944e-06, "loss": 0.371, "loss_nan_ranks": 0, "loss_rank_avg": 0.1896740198135376, "step": 65, "valid_targets_mean": 8015.0, "valid_targets_min": 6344 }, { "epoch": 0.09749303621169916, "grad_norm": 0.7528753110445529, "learning_rate": 5.487077534791253e-06, "loss": 0.3587, "loss_nan_ranks": 0, "loss_rank_avg": 0.17312809824943542, "step": 70, "valid_targets_mean": 6305.2, "valid_targets_min": 4622 }, { "epoch": 0.10445682451253482, "grad_norm": 0.5487849390115586, "learning_rate": 5.8846918489065606e-06, "loss": 0.3612, "loss_nan_ranks": 0, "loss_rank_avg": 0.18349185585975647, "step": 75, "valid_targets_mean": 7890.8, "valid_targets_min": 5485 }, { "epoch": 0.11142061281337047, "grad_norm": 0.5189028061387841, "learning_rate": 6.28230616302187e-06, "loss": 0.3552, "loss_nan_ranks": 0, "loss_rank_avg": 0.1606183648109436, "step": 80, "valid_targets_mean": 7016.6, "valid_targets_min": 4960 }, { "epoch": 0.11838440111420613, "grad_norm": 0.5214627334126402, "learning_rate": 6.679920477137178e-06, "loss": 0.3415, "loss_nan_ranks": 0, "loss_rank_avg": 0.160720095038414, "step": 85, "valid_targets_mean": 6527.1, "valid_targets_min": 5399 }, { "epoch": 0.12534818941504178, "grad_norm": 0.6006447673375296, "learning_rate": 7.077534791252486e-06, "loss": 0.3419, "loss_nan_ranks": 0, "loss_rank_avg": 0.17021866142749786, "step": 90, "valid_targets_mean": 4995.0, "valid_targets_min": 618 }, { "epoch": 0.13231197771587744, "grad_norm": 0.49819624129860873, "learning_rate": 7.475149105367794e-06, "loss": 0.3511, "loss_nan_ranks": 0, "loss_rank_avg": 0.1750391721725464, "step": 95, "valid_targets_mean": 7219.4, "valid_targets_min": 5764 }, { "epoch": 0.1392757660167131, "grad_norm": 0.49092772422498776, "learning_rate": 7.872763419483102e-06, "loss": 0.3305, "loss_nan_ranks": 0, "loss_rank_avg": 0.17389681935310364, "step": 100, "valid_targets_mean": 7998.5, "valid_targets_min": 5902 }, { "epoch": 0.14623955431754876, "grad_norm": 0.5105786705340714, "learning_rate": 8.27037773359841e-06, "loss": 0.3031, "loss_nan_ranks": 0, "loss_rank_avg": 0.13476799428462982, "step": 105, "valid_targets_mean": 7377.4, "valid_targets_min": 5015 }, { "epoch": 0.1532033426183844, "grad_norm": 0.4395069780745515, "learning_rate": 8.667992047713719e-06, "loss": 0.3071, "loss_nan_ranks": 0, "loss_rank_avg": 0.134280264377594, "step": 110, "valid_targets_mean": 6794.0, "valid_targets_min": 5283 }, { "epoch": 0.16016713091922005, "grad_norm": 0.5344731312163281, "learning_rate": 9.065606361829027e-06, "loss": 0.3196, "loss_nan_ranks": 0, "loss_rank_avg": 0.17999088764190674, "step": 115, "valid_targets_mean": 6656.4, "valid_targets_min": 4364 }, { "epoch": 0.1671309192200557, "grad_norm": 0.46349547442614725, "learning_rate": 9.463220675944334e-06, "loss": 0.3083, "loss_nan_ranks": 0, "loss_rank_avg": 0.1460513472557068, "step": 120, "valid_targets_mean": 7178.4, "valid_targets_min": 4448 }, { "epoch": 0.17409470752089137, "grad_norm": 0.49695390233410575, "learning_rate": 9.860834990059643e-06, "loss": 0.304, "loss_nan_ranks": 0, "loss_rank_avg": 0.17316694557666779, "step": 125, "valid_targets_mean": 7619.8, "valid_targets_min": 5737 }, { "epoch": 0.181058495821727, "grad_norm": 0.4131284400571314, "learning_rate": 1.0258449304174951e-05, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.13033336400985718, "step": 130, "valid_targets_mean": 8754.4, "valid_targets_min": 5752 }, { "epoch": 0.18802228412256267, "grad_norm": 0.46954213145258955, "learning_rate": 1.065606361829026e-05, "loss": 0.267, "loss_nan_ranks": 0, "loss_rank_avg": 0.14443400502204895, "step": 135, "valid_targets_mean": 6341.0, "valid_targets_min": 4543 }, { "epoch": 0.19498607242339833, "grad_norm": 0.5305150388984193, "learning_rate": 1.1053677932405567e-05, "loss": 0.2569, "loss_nan_ranks": 0, "loss_rank_avg": 0.14701451361179352, "step": 140, "valid_targets_mean": 7181.9, "valid_targets_min": 4563 }, { "epoch": 0.201949860724234, "grad_norm": 1.1100672340753313, "learning_rate": 1.1451292246520875e-05, "loss": 0.3149, "loss_nan_ranks": 0, "loss_rank_avg": 0.11581391841173172, "step": 145, "valid_targets_mean": 1104.4, "valid_targets_min": 161 }, { "epoch": 0.20891364902506965, "grad_norm": 0.42654296534182173, "learning_rate": 1.1848906560636184e-05, "loss": 0.2978, "loss_nan_ranks": 0, "loss_rank_avg": 0.13008113205432892, "step": 150, "valid_targets_mean": 7018.2, "valid_targets_min": 5424 }, { "epoch": 0.21587743732590528, "grad_norm": 0.4847320156022274, "learning_rate": 1.2246520874751492e-05, "loss": 0.3005, "loss_nan_ranks": 0, "loss_rank_avg": 0.15399551391601562, "step": 155, "valid_targets_mean": 7738.4, "valid_targets_min": 5329 }, { "epoch": 0.22284122562674094, "grad_norm": 0.5316398632314259, "learning_rate": 1.26441351888668e-05, "loss": 0.3071, "loss_nan_ranks": 0, "loss_rank_avg": 0.14879417419433594, "step": 160, "valid_targets_mean": 6426.6, "valid_targets_min": 5560 }, { "epoch": 0.2298050139275766, "grad_norm": 0.64130569981037, "learning_rate": 1.3041749502982108e-05, "loss": 0.2979, "loss_nan_ranks": 0, "loss_rank_avg": 0.15116575360298157, "step": 165, "valid_targets_mean": 6169.9, "valid_targets_min": 3446 }, { "epoch": 0.23676880222841226, "grad_norm": 0.4742255633480007, "learning_rate": 1.3439363817097418e-05, "loss": 0.284, "loss_nan_ranks": 0, "loss_rank_avg": 0.14647752046585083, "step": 170, "valid_targets_mean": 7204.6, "valid_targets_min": 5381 }, { "epoch": 0.24373259052924792, "grad_norm": 0.47419429273153524, "learning_rate": 1.3836978131212723e-05, "loss": 0.2885, "loss_nan_ranks": 0, "loss_rank_avg": 0.14805693924427032, "step": 175, "valid_targets_mean": 7600.4, "valid_targets_min": 5241 }, { "epoch": 0.25069637883008355, "grad_norm": 0.4888837565186023, "learning_rate": 1.4234592445328033e-05, "loss": 0.2797, "loss_nan_ranks": 0, "loss_rank_avg": 0.15302909910678864, "step": 180, "valid_targets_mean": 7098.5, "valid_targets_min": 5607 }, { "epoch": 0.2576601671309192, "grad_norm": 0.5085230199199996, "learning_rate": 1.4632206759443342e-05, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.14871110022068024, "step": 185, "valid_targets_mean": 6955.1, "valid_targets_min": 5530 }, { "epoch": 0.2646239554317549, "grad_norm": 0.47969863426103976, "learning_rate": 1.502982107355865e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.14307832717895508, "step": 190, "valid_targets_mean": 6748.1, "valid_targets_min": 5364 }, { "epoch": 0.27158774373259054, "grad_norm": 0.5300381897608597, "learning_rate": 1.5427435387673956e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.13810153305530548, "step": 195, "valid_targets_mean": 6273.9, "valid_targets_min": 5438 }, { "epoch": 0.2785515320334262, "grad_norm": 0.4680707912423161, "learning_rate": 1.5825049701789266e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.13786497712135315, "step": 200, "valid_targets_mean": 6419.5, "valid_targets_min": 4879 }, { "epoch": 0.28551532033426186, "grad_norm": 0.4720452212866539, "learning_rate": 1.6222664015904573e-05, "loss": 0.2793, "loss_nan_ranks": 0, "loss_rank_avg": 0.13714374601840973, "step": 205, "valid_targets_mean": 6483.4, "valid_targets_min": 4309 }, { "epoch": 0.2924791086350975, "grad_norm": 0.5255652733594837, "learning_rate": 1.662027833001988e-05, "loss": 0.2755, "loss_nan_ranks": 0, "loss_rank_avg": 0.1564159393310547, "step": 210, "valid_targets_mean": 6825.0, "valid_targets_min": 5205 }, { "epoch": 0.2994428969359331, "grad_norm": 0.49603459688272655, "learning_rate": 1.701789264413519e-05, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.12593704462051392, "step": 215, "valid_targets_mean": 6729.4, "valid_targets_min": 5200 }, { "epoch": 0.3064066852367688, "grad_norm": 0.509332149215568, "learning_rate": 1.74155069582505e-05, "loss": 0.2696, "loss_nan_ranks": 0, "loss_rank_avg": 0.13264459371566772, "step": 220, "valid_targets_mean": 6094.0, "valid_targets_min": 5302 }, { "epoch": 0.31337047353760444, "grad_norm": 0.5608083132142618, "learning_rate": 1.7813121272365807e-05, "loss": 0.2732, "loss_nan_ranks": 0, "loss_rank_avg": 0.14229202270507812, "step": 225, "valid_targets_mean": 7140.0, "valid_targets_min": 5270 }, { "epoch": 0.3203342618384401, "grad_norm": 0.4518894667306929, "learning_rate": 1.8210735586481114e-05, "loss": 0.2633, "loss_nan_ranks": 0, "loss_rank_avg": 0.12612324953079224, "step": 230, "valid_targets_mean": 7425.0, "valid_targets_min": 5281 }, { "epoch": 0.32729805013927576, "grad_norm": 0.5269894067130169, "learning_rate": 1.8608349900596424e-05, "loss": 0.2705, "loss_nan_ranks": 0, "loss_rank_avg": 0.16548216342926025, "step": 235, "valid_targets_mean": 7063.4, "valid_targets_min": 5386 }, { "epoch": 0.3342618384401114, "grad_norm": 0.5088318301963545, "learning_rate": 1.900596421471173e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.1421387791633606, "step": 240, "valid_targets_mean": 6827.0, "valid_targets_min": 4547 }, { "epoch": 0.3412256267409471, "grad_norm": 0.8073008646600404, "learning_rate": 1.9403578528827038e-05, "loss": 0.2496, "loss_nan_ranks": 0, "loss_rank_avg": 0.08542703092098236, "step": 245, "valid_targets_mean": 2047.0, "valid_targets_min": 165 }, { "epoch": 0.34818941504178275, "grad_norm": 0.4927784128489709, "learning_rate": 1.9801192842942348e-05, "loss": 0.2596, "loss_nan_ranks": 0, "loss_rank_avg": 0.13067278265953064, "step": 250, "valid_targets_mean": 6754.1, "valid_targets_min": 5196 }, { "epoch": 0.3551532033426184, "grad_norm": 0.5689943591952936, "learning_rate": 2.0198807157057655e-05, "loss": 0.2606, "loss_nan_ranks": 0, "loss_rank_avg": 0.13194392621517181, "step": 255, "valid_targets_mean": 5985.6, "valid_targets_min": 5028 }, { "epoch": 0.362116991643454, "grad_norm": 0.6584472361090068, "learning_rate": 2.0596421471172965e-05, "loss": 0.2658, "loss_nan_ranks": 0, "loss_rank_avg": 0.12018608301877975, "step": 260, "valid_targets_mean": 5963.9, "valid_targets_min": 5237 }, { "epoch": 0.36908077994428967, "grad_norm": 0.507426793822691, "learning_rate": 2.0994035785288272e-05, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.1359572857618332, "step": 265, "valid_targets_mean": 6319.0, "valid_targets_min": 5412 }, { "epoch": 0.37604456824512533, "grad_norm": 0.4533447276132855, "learning_rate": 2.139165009940358e-05, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.10632900148630142, "step": 270, "valid_targets_mean": 7125.8, "valid_targets_min": 5080 }, { "epoch": 0.383008356545961, "grad_norm": 0.5072627844159278, "learning_rate": 2.1789264413518886e-05, "loss": 0.2607, "loss_nan_ranks": 0, "loss_rank_avg": 0.12942767143249512, "step": 275, "valid_targets_mean": 6123.5, "valid_targets_min": 4521 }, { "epoch": 0.38997214484679665, "grad_norm": 2.3716958270807, "learning_rate": 2.2186878727634196e-05, "loss": 0.3214, "loss_nan_ranks": 0, "loss_rank_avg": 0.23617935180664062, "step": 280, "valid_targets_mean": 1886.0, "valid_targets_min": 1111 }, { "epoch": 0.3969359331476323, "grad_norm": 1.5308735634592507, "learning_rate": 2.2584493041749503e-05, "loss": 0.3968, "loss_nan_ranks": 0, "loss_rank_avg": 0.19828379154205322, "step": 285, "valid_targets_mean": 1497.6, "valid_targets_min": 893 }, { "epoch": 0.403899721448468, "grad_norm": 1.1543013502299828, "learning_rate": 2.2982107355864813e-05, "loss": 0.3449, "loss_nan_ranks": 0, "loss_rank_avg": 0.1195836067199707, "step": 290, "valid_targets_mean": 1356.0, "valid_targets_min": 914 }, { "epoch": 0.41086350974930363, "grad_norm": 1.094348041750749, "learning_rate": 2.3379721669980124e-05, "loss": 0.3274, "loss_nan_ranks": 0, "loss_rank_avg": 0.13568729162216187, "step": 295, "valid_targets_mean": 1324.5, "valid_targets_min": 680 }, { "epoch": 0.4178272980501393, "grad_norm": 0.9321428551455399, "learning_rate": 2.377733598409543e-05, "loss": 0.3174, "loss_nan_ranks": 0, "loss_rank_avg": 0.14562851190567017, "step": 300, "valid_targets_mean": 1931.8, "valid_targets_min": 876 }, { "epoch": 0.42479108635097496, "grad_norm": 1.2058603525575806, "learning_rate": 2.4174950298210734e-05, "loss": 0.3023, "loss_nan_ranks": 0, "loss_rank_avg": 0.1342366337776184, "step": 305, "valid_targets_mean": 1292.2, "valid_targets_min": 734 }, { "epoch": 0.43175487465181056, "grad_norm": 1.2425037495378959, "learning_rate": 2.4572564612326044e-05, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.1206846684217453, "step": 310, "valid_targets_mean": 1469.6, "valid_targets_min": 655 }, { "epoch": 0.4387186629526462, "grad_norm": 0.970667265555978, "learning_rate": 2.4970178926441354e-05, "loss": 0.2771, "loss_nan_ranks": 0, "loss_rank_avg": 0.1465504765510559, "step": 315, "valid_targets_mean": 1548.4, "valid_targets_min": 737 }, { "epoch": 0.4456824512534819, "grad_norm": 1.0165307573128308, "learning_rate": 2.536779324055666e-05, "loss": 0.2969, "loss_nan_ranks": 0, "loss_rank_avg": 0.1261579394340515, "step": 320, "valid_targets_mean": 1316.5, "valid_targets_min": 759 }, { "epoch": 0.45264623955431754, "grad_norm": 0.9803325403945289, "learning_rate": 2.576540755467197e-05, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.10474079847335815, "step": 325, "valid_targets_mean": 1249.6, "valid_targets_min": 753 }, { "epoch": 0.4596100278551532, "grad_norm": 0.9660896867872805, "learning_rate": 2.616302186878728e-05, "loss": 0.2763, "loss_nan_ranks": 0, "loss_rank_avg": 0.17885830998420715, "step": 330, "valid_targets_mean": 1833.0, "valid_targets_min": 927 }, { "epoch": 0.46657381615598886, "grad_norm": 0.9889163176342366, "learning_rate": 2.656063618290259e-05, "loss": 0.2858, "loss_nan_ranks": 0, "loss_rank_avg": 0.1363910287618637, "step": 335, "valid_targets_mean": 1338.4, "valid_targets_min": 679 }, { "epoch": 0.4735376044568245, "grad_norm": 1.061457665973345, "learning_rate": 2.6958250497017892e-05, "loss": 0.2733, "loss_nan_ranks": 0, "loss_rank_avg": 0.12158133089542389, "step": 340, "valid_targets_mean": 1244.6, "valid_targets_min": 771 }, { "epoch": 0.4805013927576602, "grad_norm": 1.0563598410355024, "learning_rate": 2.7355864811133202e-05, "loss": 0.2559, "loss_nan_ranks": 0, "loss_rank_avg": 0.12138071656227112, "step": 345, "valid_targets_mean": 1732.5, "valid_targets_min": 986 }, { "epoch": 0.48746518105849584, "grad_norm": 1.1235998467468378, "learning_rate": 2.775347912524851e-05, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.11856169253587723, "step": 350, "valid_targets_mean": 1389.9, "valid_targets_min": 1103 }, { "epoch": 0.49442896935933145, "grad_norm": 0.942754195687271, "learning_rate": 2.815109343936382e-05, "loss": 0.2673, "loss_nan_ranks": 0, "loss_rank_avg": 0.14676061272621155, "step": 355, "valid_targets_mean": 1593.2, "valid_targets_min": 675 }, { "epoch": 0.5013927576601671, "grad_norm": 0.927084600615998, "learning_rate": 2.8548707753479126e-05, "loss": 0.2662, "loss_nan_ranks": 0, "loss_rank_avg": 0.16312474012374878, "step": 360, "valid_targets_mean": 1926.6, "valid_targets_min": 974 }, { "epoch": 0.5083565459610028, "grad_norm": 1.0089719119822702, "learning_rate": 2.8946322067594437e-05, "loss": 0.2719, "loss_nan_ranks": 0, "loss_rank_avg": 0.16004151105880737, "step": 365, "valid_targets_mean": 1953.1, "valid_targets_min": 869 }, { "epoch": 0.5153203342618384, "grad_norm": 1.0547290812174692, "learning_rate": 2.9343936381709747e-05, "loss": 0.2683, "loss_nan_ranks": 0, "loss_rank_avg": 0.11815130710601807, "step": 370, "valid_targets_mean": 1327.2, "valid_targets_min": 1023 }, { "epoch": 0.5222841225626741, "grad_norm": 1.091197129252169, "learning_rate": 2.974155069582505e-05, "loss": 0.271, "loss_nan_ranks": 0, "loss_rank_avg": 0.14482921361923218, "step": 375, "valid_targets_mean": 1717.9, "valid_targets_min": 709 }, { "epoch": 0.5292479108635098, "grad_norm": 1.041832550945947, "learning_rate": 3.0139165009940357e-05, "loss": 0.2561, "loss_nan_ranks": 0, "loss_rank_avg": 0.111148402094841, "step": 380, "valid_targets_mean": 1139.9, "valid_targets_min": 658 }, { "epoch": 0.5362116991643454, "grad_norm": 1.0373743215959594, "learning_rate": 3.053677932405567e-05, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.12807971239089966, "step": 385, "valid_targets_mean": 1444.8, "valid_targets_min": 662 }, { "epoch": 0.5431754874651811, "grad_norm": 0.9362737502243705, "learning_rate": 3.0934393638170974e-05, "loss": 0.2708, "loss_nan_ranks": 0, "loss_rank_avg": 0.0938352644443512, "step": 390, "valid_targets_mean": 1242.2, "valid_targets_min": 859 }, { "epoch": 0.5501392757660167, "grad_norm": 0.9658781825606017, "learning_rate": 3.133200795228629e-05, "loss": 0.2447, "loss_nan_ranks": 0, "loss_rank_avg": 0.149136483669281, "step": 395, "valid_targets_mean": 1569.2, "valid_targets_min": 950 }, { "epoch": 0.5571030640668524, "grad_norm": 1.1094086785951527, "learning_rate": 3.1729622266401595e-05, "loss": 0.2579, "loss_nan_ranks": 0, "loss_rank_avg": 0.12185294181108475, "step": 400, "valid_targets_mean": 1539.8, "valid_targets_min": 686 }, { "epoch": 0.564066852367688, "grad_norm": 0.8987556090799284, "learning_rate": 3.21272365805169e-05, "loss": 0.2507, "loss_nan_ranks": 0, "loss_rank_avg": 0.13875404000282288, "step": 405, "valid_targets_mean": 1610.6, "valid_targets_min": 702 }, { "epoch": 0.5710306406685237, "grad_norm": 0.9570507306238789, "learning_rate": 3.252485089463221e-05, "loss": 0.2456, "loss_nan_ranks": 0, "loss_rank_avg": 0.09257258474826813, "step": 410, "valid_targets_mean": 1190.4, "valid_targets_min": 779 }, { "epoch": 0.5779944289693594, "grad_norm": 1.041172830465715, "learning_rate": 3.2922465208747515e-05, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.13315311074256897, "step": 415, "valid_targets_mean": 1467.1, "valid_targets_min": 822 }, { "epoch": 0.584958217270195, "grad_norm": 0.986140542035632, "learning_rate": 3.332007952286282e-05, "loss": 0.2411, "loss_nan_ranks": 0, "loss_rank_avg": 0.10449384897947311, "step": 420, "valid_targets_mean": 1350.5, "valid_targets_min": 868 }, { "epoch": 0.5919220055710307, "grad_norm": 1.065472844147368, "learning_rate": 3.3717693836978136e-05, "loss": 0.2507, "loss_nan_ranks": 0, "loss_rank_avg": 0.10323739796876907, "step": 425, "valid_targets_mean": 1283.5, "valid_targets_min": 781 }, { "epoch": 0.5988857938718662, "grad_norm": 0.9665463285582397, "learning_rate": 3.411530815109344e-05, "loss": 0.251, "loss_nan_ranks": 0, "loss_rank_avg": 0.10586751997470856, "step": 430, "valid_targets_mean": 1303.2, "valid_targets_min": 793 }, { "epoch": 0.6058495821727019, "grad_norm": 1.2852362210237431, "learning_rate": 3.451292246520875e-05, "loss": 0.2494, "loss_nan_ranks": 0, "loss_rank_avg": 0.10657232999801636, "step": 435, "valid_targets_mean": 1309.1, "valid_targets_min": 806 }, { "epoch": 0.6128133704735376, "grad_norm": 0.8736026107192932, "learning_rate": 3.491053677932406e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.1021880954504013, "step": 440, "valid_targets_mean": 1397.6, "valid_targets_min": 803 }, { "epoch": 0.6197771587743732, "grad_norm": 1.0411104476153328, "learning_rate": 3.530815109343936e-05, "loss": 0.2446, "loss_nan_ranks": 0, "loss_rank_avg": 0.0923558846116066, "step": 445, "valid_targets_mean": 1187.8, "valid_targets_min": 660 }, { "epoch": 0.6267409470752089, "grad_norm": 0.9460837866342159, "learning_rate": 3.570576540755467e-05, "loss": 0.229, "loss_nan_ranks": 0, "loss_rank_avg": 0.10013886541128159, "step": 450, "valid_targets_mean": 1547.0, "valid_targets_min": 853 }, { "epoch": 0.6337047353760445, "grad_norm": 0.9098298102835145, "learning_rate": 3.6103379721669984e-05, "loss": 0.2482, "loss_nan_ranks": 0, "loss_rank_avg": 0.1290132701396942, "step": 455, "valid_targets_mean": 1704.2, "valid_targets_min": 719 }, { "epoch": 0.6406685236768802, "grad_norm": 0.9535602596956675, "learning_rate": 3.650099403578529e-05, "loss": 0.2486, "loss_nan_ranks": 0, "loss_rank_avg": 0.08892850577831268, "step": 460, "valid_targets_mean": 1255.0, "valid_targets_min": 765 }, { "epoch": 0.6476323119777159, "grad_norm": 0.9327456495578426, "learning_rate": 3.68986083499006e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.11986593157052994, "step": 465, "valid_targets_mean": 1550.8, "valid_targets_min": 875 }, { "epoch": 0.6545961002785515, "grad_norm": 1.0928873361476414, "learning_rate": 3.729622266401591e-05, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.12141738831996918, "step": 470, "valid_targets_mean": 1362.0, "valid_targets_min": 739 }, { "epoch": 0.6615598885793872, "grad_norm": 0.9405266158146244, "learning_rate": 3.769383697813122e-05, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.13972696661949158, "step": 475, "valid_targets_mean": 1666.8, "valid_targets_min": 760 }, { "epoch": 0.6685236768802229, "grad_norm": 0.9803157445663641, "learning_rate": 3.8091451292246525e-05, "loss": 0.2348, "loss_nan_ranks": 0, "loss_rank_avg": 0.10272186994552612, "step": 480, "valid_targets_mean": 1319.6, "valid_targets_min": 1046 }, { "epoch": 0.6754874651810585, "grad_norm": 0.8300161576779523, "learning_rate": 3.848906560636183e-05, "loss": 0.254, "loss_nan_ranks": 0, "loss_rank_avg": 0.13779720664024353, "step": 485, "valid_targets_mean": 1727.9, "valid_targets_min": 851 }, { "epoch": 0.6824512534818942, "grad_norm": 0.958305960647266, "learning_rate": 3.888667992047714e-05, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.129207044839859, "step": 490, "valid_targets_mean": 1643.2, "valid_targets_min": 907 }, { "epoch": 0.6894150417827298, "grad_norm": 0.9358380856267636, "learning_rate": 3.9284294234592445e-05, "loss": 0.2581, "loss_nan_ranks": 0, "loss_rank_avg": 0.11121398210525513, "step": 495, "valid_targets_mean": 1478.5, "valid_targets_min": 764 }, { "epoch": 0.6963788300835655, "grad_norm": 0.8280865710705787, "learning_rate": 3.968190854870776e-05, "loss": 0.2378, "loss_nan_ranks": 0, "loss_rank_avg": 0.1098678931593895, "step": 500, "valid_targets_mean": 1522.6, "valid_targets_min": 822 }, { "epoch": 0.7033426183844012, "grad_norm": 0.8854144055119295, "learning_rate": 3.999999517556397e-05, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.11844191700220108, "step": 505, "valid_targets_mean": 1589.0, "valid_targets_min": 982 }, { "epoch": 0.7103064066852368, "grad_norm": 0.889147230178005, "learning_rate": 3.9999826320547226e-05, "loss": 0.2489, "loss_nan_ranks": 0, "loss_rank_avg": 0.12125623971223831, "step": 510, "valid_targets_mean": 1574.8, "valid_targets_min": 816 }, { "epoch": 0.7172701949860725, "grad_norm": 1.0297104353022954, "learning_rate": 3.999941624605637e-05, "loss": 0.238, "loss_nan_ranks": 0, "loss_rank_avg": 0.12160146236419678, "step": 515, "valid_targets_mean": 1422.0, "valid_targets_min": 721 }, { "epoch": 0.724233983286908, "grad_norm": 0.9715916674508144, "learning_rate": 3.999876495703734e-05, "loss": 0.2319, "loss_nan_ranks": 0, "loss_rank_avg": 0.08852733671665192, "step": 520, "valid_targets_mean": 1150.6, "valid_targets_min": 741 }, { "epoch": 0.7311977715877437, "grad_norm": 0.9348675328466968, "learning_rate": 3.999787246134539e-05, "loss": 0.24, "loss_nan_ranks": 0, "loss_rank_avg": 0.1302892565727234, "step": 525, "valid_targets_mean": 1684.2, "valid_targets_min": 734 }, { "epoch": 0.7381615598885793, "grad_norm": 0.9829460553497974, "learning_rate": 3.999673876974498e-05, "loss": 0.2424, "loss_nan_ranks": 0, "loss_rank_avg": 0.14294780790805817, "step": 530, "valid_targets_mean": 1937.1, "valid_targets_min": 744 }, { "epoch": 0.745125348189415, "grad_norm": 1.00886311547871, "learning_rate": 3.9995363895909654e-05, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.1358570158481598, "step": 535, "valid_targets_mean": 1842.2, "valid_targets_min": 620 }, { "epoch": 0.7520891364902507, "grad_norm": 0.9029995225438505, "learning_rate": 3.9993747856421865e-05, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.13714322447776794, "step": 540, "valid_targets_mean": 1637.6, "valid_targets_min": 785 }, { "epoch": 0.7590529247910863, "grad_norm": 0.8367188043813011, "learning_rate": 3.99918906707728e-05, "loss": 0.2376, "loss_nan_ranks": 0, "loss_rank_avg": 0.11780621111392975, "step": 545, "valid_targets_mean": 1969.9, "valid_targets_min": 740 }, { "epoch": 0.766016713091922, "grad_norm": 0.9884389058338642, "learning_rate": 3.9989792361362124e-05, "loss": 0.2344, "loss_nan_ranks": 0, "loss_rank_avg": 0.1071939691901207, "step": 550, "valid_targets_mean": 1432.1, "valid_targets_min": 711 }, { "epoch": 0.7729805013927576, "grad_norm": 0.9502178485105263, "learning_rate": 3.99874529534977e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.12912839651107788, "step": 555, "valid_targets_mean": 1695.6, "valid_targets_min": 1122 }, { "epoch": 0.7799442896935933, "grad_norm": 0.9668592085821732, "learning_rate": 3.9984872475395325e-05, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.12528224289417267, "step": 560, "valid_targets_mean": 1524.5, "valid_targets_min": 722 }, { "epoch": 0.786908077994429, "grad_norm": 0.8799325389323717, "learning_rate": 3.998205095817833e-05, "loss": 0.2207, "loss_nan_ranks": 0, "loss_rank_avg": 0.10128602385520935, "step": 565, "valid_targets_mean": 1289.2, "valid_targets_min": 661 }, { "epoch": 0.7938718662952646, "grad_norm": 0.9446705425289179, "learning_rate": 3.997898843587727e-05, "loss": 0.225, "loss_nan_ranks": 0, "loss_rank_avg": 0.1078827977180481, "step": 570, "valid_targets_mean": 1519.5, "valid_targets_min": 1011 }, { "epoch": 0.8008356545961003, "grad_norm": 0.8325950401643598, "learning_rate": 3.997568494542946e-05, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.12279678881168365, "step": 575, "valid_targets_mean": 1731.4, "valid_targets_min": 1277 }, { "epoch": 0.807799442896936, "grad_norm": 0.898136637442764, "learning_rate": 3.997214052667856e-05, "loss": 0.2232, "loss_nan_ranks": 0, "loss_rank_avg": 0.11773974448442459, "step": 580, "valid_targets_mean": 1486.1, "valid_targets_min": 807 }, { "epoch": 0.8147632311977716, "grad_norm": 0.8718990576135462, "learning_rate": 3.996835522237408e-05, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.13190338015556335, "step": 585, "valid_targets_mean": 1549.9, "valid_targets_min": 679 }, { "epoch": 0.8217270194986073, "grad_norm": 0.9293519703318798, "learning_rate": 3.9964329078170874e-05, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.11136806011199951, "step": 590, "valid_targets_mean": 1656.0, "valid_targets_min": 1294 }, { "epoch": 0.8286908077994429, "grad_norm": 0.9027962521886033, "learning_rate": 3.996006214262858e-05, "loss": 0.2327, "loss_nan_ranks": 0, "loss_rank_avg": 0.10627582669258118, "step": 595, "valid_targets_mean": 1368.8, "valid_targets_min": 790 }, { "epoch": 0.8356545961002786, "grad_norm": 0.9202444501195384, "learning_rate": 3.995555446721104e-05, "loss": 0.2293, "loss_nan_ranks": 0, "loss_rank_avg": 0.12929676473140717, "step": 600, "valid_targets_mean": 1765.8, "valid_targets_min": 592 }, { "epoch": 0.8426183844011143, "grad_norm": 0.8667866984685644, "learning_rate": 3.9950806106285694e-05, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.12393373250961304, "step": 605, "valid_targets_mean": 1586.8, "valid_targets_min": 662 }, { "epoch": 0.8495821727019499, "grad_norm": 0.9721183405017587, "learning_rate": 3.9945817117122884e-05, "loss": 0.2379, "loss_nan_ranks": 0, "loss_rank_avg": 0.1137949600815773, "step": 610, "valid_targets_mean": 1336.9, "valid_targets_min": 622 }, { "epoch": 0.8565459610027855, "grad_norm": 0.9071022828100963, "learning_rate": 3.994058755989521e-05, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.07271943986415863, "step": 615, "valid_targets_mean": 1097.1, "valid_targets_min": 625 }, { "epoch": 0.8635097493036211, "grad_norm": 0.9327235573302172, "learning_rate": 3.993511749767676e-05, "loss": 0.2465, "loss_nan_ranks": 0, "loss_rank_avg": 0.09269745647907257, "step": 620, "valid_targets_mean": 1484.9, "valid_targets_min": 888 }, { "epoch": 0.8704735376044568, "grad_norm": 0.8523136084427271, "learning_rate": 3.992940699644238e-05, "loss": 0.2387, "loss_nan_ranks": 0, "loss_rank_avg": 0.12552563846111298, "step": 625, "valid_targets_mean": 1757.0, "valid_targets_min": 635 }, { "epoch": 0.8774373259052924, "grad_norm": 0.9675785553764196, "learning_rate": 3.9923456125066886e-05, "loss": 0.2412, "loss_nan_ranks": 0, "loss_rank_avg": 0.1370333880186081, "step": 630, "valid_targets_mean": 1476.1, "valid_targets_min": 522 }, { "epoch": 0.8844011142061281, "grad_norm": 0.9240372392580922, "learning_rate": 3.9917264955324205e-05, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.10322962701320648, "step": 635, "valid_targets_mean": 1230.9, "valid_targets_min": 697 }, { "epoch": 0.8913649025069638, "grad_norm": 0.8039407980641069, "learning_rate": 3.991083356188651e-05, "loss": 0.2261, "loss_nan_ranks": 0, "loss_rank_avg": 0.12441124022006989, "step": 640, "valid_targets_mean": 1671.0, "valid_targets_min": 1010 }, { "epoch": 0.8983286908077994, "grad_norm": 0.901298627076697, "learning_rate": 3.9904162022323356e-05, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.11574780941009521, "step": 645, "valid_targets_mean": 1411.0, "valid_targets_min": 769 }, { "epoch": 0.9052924791086351, "grad_norm": 0.8076274204627811, "learning_rate": 3.9897250417100685e-05, "loss": 0.2334, "loss_nan_ranks": 0, "loss_rank_avg": 0.097521111369133, "step": 650, "valid_targets_mean": 1298.6, "valid_targets_min": 745 }, { "epoch": 0.9122562674094707, "grad_norm": 0.8790050634268944, "learning_rate": 3.9890098829579936e-05, "loss": 0.2284, "loss_nan_ranks": 0, "loss_rank_avg": 0.09707553684711456, "step": 655, "valid_targets_mean": 1118.9, "valid_targets_min": 680 }, { "epoch": 0.9192200557103064, "grad_norm": 0.8222830712195175, "learning_rate": 3.988270734601694e-05, "loss": 0.222, "loss_nan_ranks": 0, "loss_rank_avg": 0.13638588786125183, "step": 660, "valid_targets_mean": 1905.9, "valid_targets_min": 1347 }, { "epoch": 0.9261838440111421, "grad_norm": 0.9010068300752175, "learning_rate": 3.987507605556098e-05, "loss": 0.2376, "loss_nan_ranks": 0, "loss_rank_avg": 0.16486553847789764, "step": 665, "valid_targets_mean": 1636.0, "valid_targets_min": 851 }, { "epoch": 0.9331476323119777, "grad_norm": 0.8103801455626374, "learning_rate": 3.9867205050253635e-05, "loss": 0.224, "loss_nan_ranks": 0, "loss_rank_avg": 0.09920711815357208, "step": 670, "valid_targets_mean": 1457.2, "valid_targets_min": 903 }, { "epoch": 0.9401114206128134, "grad_norm": 0.8043472181124449, "learning_rate": 3.9859094425027726e-05, "loss": 0.2217, "loss_nan_ranks": 0, "loss_rank_avg": 0.12532712519168854, "step": 675, "valid_targets_mean": 1674.4, "valid_targets_min": 1240 }, { "epoch": 0.947075208913649, "grad_norm": 0.8118897965994559, "learning_rate": 3.985074427770614e-05, "loss": 0.2201, "loss_nan_ranks": 0, "loss_rank_avg": 0.09223470091819763, "step": 680, "valid_targets_mean": 1697.1, "valid_targets_min": 917 }, { "epoch": 0.9540389972144847, "grad_norm": 0.9472041237654983, "learning_rate": 3.9842154709000665e-05, "loss": 0.2071, "loss_nan_ranks": 0, "loss_rank_avg": 0.09532526135444641, "step": 685, "valid_targets_mean": 1580.9, "valid_targets_min": 930 }, { "epoch": 0.9610027855153204, "grad_norm": 0.8083428002058612, "learning_rate": 3.983332582251074e-05, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.11902359873056412, "step": 690, "valid_targets_mean": 1655.1, "valid_targets_min": 1227 }, { "epoch": 0.967966573816156, "grad_norm": 0.8148921698054701, "learning_rate": 3.982425772472228e-05, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.11095002293586731, "step": 695, "valid_targets_mean": 1565.8, "valid_targets_min": 870 }, { "epoch": 0.9749303621169917, "grad_norm": 2.1396789291672396, "learning_rate": 3.9814950525006315e-05, "loss": 0.2271, "loss_nan_ranks": 0, "loss_rank_avg": 0.10898259282112122, "step": 700, "valid_targets_mean": 1564.6, "valid_targets_min": 822 }, { "epoch": 0.9818941504178273, "grad_norm": 0.8780065601127116, "learning_rate": 3.980540433561771e-05, "loss": 0.2318, "loss_nan_ranks": 0, "loss_rank_avg": 0.10233960300683975, "step": 705, "valid_targets_mean": 1540.5, "valid_targets_min": 1214 }, { "epoch": 0.9888579387186629, "grad_norm": 0.8908774625256577, "learning_rate": 3.979561927169381e-05, "loss": 0.2206, "loss_nan_ranks": 0, "loss_rank_avg": 0.10410676151514053, "step": 710, "valid_targets_mean": 1268.6, "valid_targets_min": 591 }, { "epoch": 0.9958217270194986, "grad_norm": 0.8377782810822102, "learning_rate": 3.978559545125303e-05, "loss": 0.2351, "loss_nan_ranks": 0, "loss_rank_avg": 0.08468751609325409, "step": 715, "valid_targets_mean": 1232.5, "valid_targets_min": 646 }, { "epoch": 1.0027855153203342, "grad_norm": 0.5045448459523831, "learning_rate": 3.977533299519347e-05, "loss": 0.2503, "loss_nan_ranks": 0, "loss_rank_avg": 0.12714359164237976, "step": 720, "valid_targets_mean": 8514.0, "valid_targets_min": 6788 }, { "epoch": 1.00974930362117, "grad_norm": 0.5387200781137093, "learning_rate": 3.97648320272914e-05, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.13830497860908508, "step": 725, "valid_targets_mean": 6668.0, "valid_targets_min": 5933 }, { "epoch": 1.0167130919220055, "grad_norm": 0.6200314371011584, "learning_rate": 3.9754092674199816e-05, "loss": 0.2725, "loss_nan_ranks": 0, "loss_rank_avg": 0.12560366094112396, "step": 730, "valid_targets_mean": 4107.0, "valid_targets_min": 161 }, { "epoch": 1.0236768802228413, "grad_norm": 0.41903186731709363, "learning_rate": 3.974311506544692e-05, "loss": 0.2614, "loss_nan_ranks": 0, "loss_rank_avg": 0.11801932752132416, "step": 735, "valid_targets_mean": 7946.0, "valid_targets_min": 5596 }, { "epoch": 1.0306406685236769, "grad_norm": 0.43595924603479874, "learning_rate": 3.973189933343449e-05, "loss": 0.248, "loss_nan_ranks": 0, "loss_rank_avg": 0.13217604160308838, "step": 740, "valid_targets_mean": 7392.8, "valid_targets_min": 5629 }, { "epoch": 1.0376044568245126, "grad_norm": 0.5245267930858062, "learning_rate": 3.972044561343636e-05, "loss": 0.2511, "loss_nan_ranks": 0, "loss_rank_avg": 0.12668457627296448, "step": 745, "valid_targets_mean": 6879.6, "valid_targets_min": 5113 }, { "epoch": 1.0445682451253482, "grad_norm": 0.4794835613989842, "learning_rate": 3.970875404359675e-05, "loss": 0.27, "loss_nan_ranks": 0, "loss_rank_avg": 0.1310746967792511, "step": 750, "valid_targets_mean": 6919.5, "valid_targets_min": 5080 }, { "epoch": 1.051532033426184, "grad_norm": 0.47039907099593237, "learning_rate": 3.969682476492858e-05, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.1175151839852333, "step": 755, "valid_targets_mean": 6377.0, "valid_targets_min": 3939 }, { "epoch": 1.0584958217270195, "grad_norm": 0.4472868406904229, "learning_rate": 3.968465792131184e-05, "loss": 0.2482, "loss_nan_ranks": 0, "loss_rank_avg": 0.12472754716873169, "step": 760, "valid_targets_mean": 6392.2, "valid_targets_min": 4355 }, { "epoch": 1.065459610027855, "grad_norm": 0.5109948443641175, "learning_rate": 3.9672253659491776e-05, "loss": 0.2449, "loss_nan_ranks": 0, "loss_rank_avg": 0.14166294038295746, "step": 765, "valid_targets_mean": 5196.5, "valid_targets_min": 137 }, { "epoch": 1.0724233983286908, "grad_norm": 0.3950884119973961, "learning_rate": 3.965961212907716e-05, "loss": 0.2446, "loss_nan_ranks": 0, "loss_rank_avg": 0.10841463506221771, "step": 770, "valid_targets_mean": 7344.4, "valid_targets_min": 5244 }, { "epoch": 1.0793871866295264, "grad_norm": 0.39325931847169565, "learning_rate": 3.9646733482538486e-05, "loss": 0.2358, "loss_nan_ranks": 0, "loss_rank_avg": 0.10372970998287201, "step": 775, "valid_targets_mean": 7921.0, "valid_targets_min": 5311 }, { "epoch": 1.0863509749303621, "grad_norm": 0.39685130314701833, "learning_rate": 3.963361787520612e-05, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.12329264730215073, "step": 780, "valid_targets_mean": 7931.2, "valid_targets_min": 6015 }, { "epoch": 1.0933147632311977, "grad_norm": 0.36954967114170856, "learning_rate": 3.9620265465268423e-05, "loss": 0.2338, "loss_nan_ranks": 0, "loss_rank_avg": 0.11054964363574982, "step": 785, "valid_targets_mean": 7640.8, "valid_targets_min": 5248 }, { "epoch": 1.1002785515320335, "grad_norm": 0.39689900322648536, "learning_rate": 3.960667641376987e-05, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.11496052145957947, "step": 790, "valid_targets_mean": 7249.6, "valid_targets_min": 5217 }, { "epoch": 1.107242339832869, "grad_norm": 0.433531433289986, "learning_rate": 3.959285088460908e-05, "loss": 0.2396, "loss_nan_ranks": 0, "loss_rank_avg": 0.13216888904571533, "step": 795, "valid_targets_mean": 7619.9, "valid_targets_min": 5094 }, { "epoch": 1.1142061281337048, "grad_norm": 0.39505484410680386, "learning_rate": 3.957878904453683e-05, "loss": 0.2324, "loss_nan_ranks": 0, "loss_rank_avg": 0.11113603413105011, "step": 800, "valid_targets_mean": 7732.8, "valid_targets_min": 5842 }, { "epoch": 1.1211699164345403, "grad_norm": 0.4052047229981209, "learning_rate": 3.9564491063154084e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.12098728865385056, "step": 805, "valid_targets_mean": 7952.9, "valid_targets_min": 5494 }, { "epoch": 1.128133704735376, "grad_norm": 0.417279220495771, "learning_rate": 3.9549957112909914e-05, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.12448830902576447, "step": 810, "valid_targets_mean": 8001.0, "valid_targets_min": 5454 }, { "epoch": 1.1350974930362117, "grad_norm": 0.5319248244035725, "learning_rate": 3.9535187369099437e-05, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.09340626001358032, "step": 815, "valid_targets_mean": 2985.1, "valid_targets_min": 1896 }, { "epoch": 1.1420612813370474, "grad_norm": 0.39891658368515515, "learning_rate": 3.952018200986169e-05, "loss": 0.2183, "loss_nan_ranks": 0, "loss_rank_avg": 0.10278548300266266, "step": 820, "valid_targets_mean": 6714.6, "valid_targets_min": 4917 }, { "epoch": 1.149025069637883, "grad_norm": 0.4249036845709375, "learning_rate": 3.950494121617749e-05, "loss": 0.2296, "loss_nan_ranks": 0, "loss_rank_avg": 0.1260872483253479, "step": 825, "valid_targets_mean": 7595.2, "valid_targets_min": 5488 }, { "epoch": 1.1559888579387188, "grad_norm": 0.45070868901900607, "learning_rate": 3.9489465171867254e-05, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.1257646679878235, "step": 830, "valid_targets_mean": 7046.1, "valid_targets_min": 5579 }, { "epoch": 1.1629526462395543, "grad_norm": 0.4439435807963078, "learning_rate": 3.947375406358874e-05, "loss": 0.2402, "loss_nan_ranks": 0, "loss_rank_avg": 0.1169155091047287, "step": 835, "valid_targets_mean": 7108.0, "valid_targets_min": 4963 }, { "epoch": 1.16991643454039, "grad_norm": 0.44221583815751264, "learning_rate": 3.9457808080834884e-05, "loss": 0.2344, "loss_nan_ranks": 0, "loss_rank_avg": 0.11854035407304764, "step": 840, "valid_targets_mean": 6810.1, "valid_targets_min": 5666 }, { "epoch": 1.1768802228412256, "grad_norm": 0.4316908401901056, "learning_rate": 3.944162741593142e-05, "loss": 0.225, "loss_nan_ranks": 0, "loss_rank_avg": 0.11046448349952698, "step": 845, "valid_targets_mean": 8068.5, "valid_targets_min": 5524 }, { "epoch": 1.1838440111420612, "grad_norm": 0.4180604360052473, "learning_rate": 3.9425212264034626e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.09698522835969925, "step": 850, "valid_targets_mean": 6553.8, "valid_targets_min": 3621 }, { "epoch": 1.190807799442897, "grad_norm": 0.4189841877717661, "learning_rate": 3.940856282312893e-05, "loss": 0.2085, "loss_nan_ranks": 0, "loss_rank_avg": 0.10995703935623169, "step": 855, "valid_targets_mean": 6762.5, "valid_targets_min": 4968 }, { "epoch": 1.1977715877437327, "grad_norm": 0.45595104424848715, "learning_rate": 3.9391679294024543e-05, "loss": 0.2224, "loss_nan_ranks": 0, "loss_rank_avg": 0.11162762343883514, "step": 860, "valid_targets_mean": 6143.9, "valid_targets_min": 4917 }, { "epoch": 1.2047353760445683, "grad_norm": 0.5851346783403598, "learning_rate": 3.937456188035504e-05, "loss": 0.2377, "loss_nan_ranks": 0, "loss_rank_avg": 0.16354359686374664, "step": 865, "valid_targets_mean": 4583.8, "valid_targets_min": 215 }, { "epoch": 1.2116991643454038, "grad_norm": 0.4055676263805544, "learning_rate": 3.935721078857489e-05, "loss": 0.2371, "loss_nan_ranks": 0, "loss_rank_avg": 0.11995077133178711, "step": 870, "valid_targets_mean": 7317.1, "valid_targets_min": 4948 }, { "epoch": 1.2186629526462396, "grad_norm": 0.42172517542326765, "learning_rate": 3.9339626227956966e-05, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.12088988721370697, "step": 875, "valid_targets_mean": 6437.6, "valid_targets_min": 4510 }, { "epoch": 1.2256267409470751, "grad_norm": 0.4535203146647295, "learning_rate": 3.932180841059004e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.13094569742679596, "step": 880, "valid_targets_mean": 7707.9, "valid_targets_min": 5796 }, { "epoch": 1.232590529247911, "grad_norm": 0.418577272093497, "learning_rate": 3.93037575513762e-05, "loss": 0.2305, "loss_nan_ranks": 0, "loss_rank_avg": 0.11241194605827332, "step": 885, "valid_targets_mean": 7900.9, "valid_targets_min": 5643 }, { "epoch": 1.2395543175487465, "grad_norm": 0.4344807498847784, "learning_rate": 3.9285473868028287e-05, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.12634864449501038, "step": 890, "valid_targets_mean": 7627.2, "valid_targets_min": 5742 }, { "epoch": 1.2465181058495822, "grad_norm": 0.40801176738421346, "learning_rate": 3.9266957581067215e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.13307298719882965, "step": 895, "valid_targets_mean": 8725.6, "valid_targets_min": 5141 }, { "epoch": 1.2534818941504178, "grad_norm": 0.4451588968606175, "learning_rate": 3.924820891381939e-05, "loss": 0.2309, "loss_nan_ranks": 0, "loss_rank_avg": 0.12867535650730133, "step": 900, "valid_targets_mean": 6967.8, "valid_targets_min": 6088 }, { "epoch": 1.2604456824512535, "grad_norm": 0.4207887725907819, "learning_rate": 3.922922809241397e-05, "loss": 0.2333, "loss_nan_ranks": 0, "loss_rank_avg": 0.10731957852840424, "step": 905, "valid_targets_mean": 7140.1, "valid_targets_min": 4834 }, { "epoch": 1.267409470752089, "grad_norm": 0.43935252315939416, "learning_rate": 3.92100153457801e-05, "loss": 0.2313, "loss_nan_ranks": 0, "loss_rank_avg": 0.10727177560329437, "step": 910, "valid_targets_mean": 6706.9, "valid_targets_min": 5108 }, { "epoch": 1.2743732590529249, "grad_norm": 0.4987156443279082, "learning_rate": 3.9190570905644254e-05, "loss": 0.236, "loss_nan_ranks": 0, "loss_rank_avg": 0.11678919196128845, "step": 915, "valid_targets_mean": 5931.4, "valid_targets_min": 4708 }, { "epoch": 1.2813370473537604, "grad_norm": 0.4407354572740225, "learning_rate": 3.917089500652733e-05, "loss": 0.2273, "loss_nan_ranks": 0, "loss_rank_avg": 0.10812367498874664, "step": 920, "valid_targets_mean": 7145.6, "valid_targets_min": 5280 }, { "epoch": 1.2883008356545962, "grad_norm": 0.7644739613411758, "learning_rate": 3.915098788574191e-05, "loss": 0.2231, "loss_nan_ranks": 0, "loss_rank_avg": 0.0803007185459137, "step": 925, "valid_targets_mean": 1554.9, "valid_targets_min": 592 }, { "epoch": 1.2952646239554317, "grad_norm": 0.45530435313643286, "learning_rate": 3.913084978338931e-05, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.12958484888076782, "step": 930, "valid_targets_mean": 7069.5, "valid_targets_min": 4765 }, { "epoch": 1.3022284122562673, "grad_norm": 0.4187104102266161, "learning_rate": 3.911048094235679e-05, "loss": 0.2262, "loss_nan_ranks": 0, "loss_rank_avg": 0.11318781226873398, "step": 935, "valid_targets_mean": 6193.4, "valid_targets_min": 5587 }, { "epoch": 1.309192200557103, "grad_norm": 0.4642694802664071, "learning_rate": 3.9089881608314534e-05, "loss": 0.2268, "loss_nan_ranks": 0, "loss_rank_avg": 0.11810522526502609, "step": 940, "valid_targets_mean": 6612.2, "valid_targets_min": 4894 }, { "epoch": 1.3161559888579388, "grad_norm": 0.40454438050769786, "learning_rate": 3.9069052029712713e-05, "loss": 0.2201, "loss_nan_ranks": 0, "loss_rank_avg": 0.10395780950784683, "step": 945, "valid_targets_mean": 6605.9, "valid_targets_min": 3795 }, { "epoch": 1.3231197771587744, "grad_norm": 0.4215605431440107, "learning_rate": 3.9047992457778524e-05, "loss": 0.2247, "loss_nan_ranks": 0, "loss_rank_avg": 0.11420217156410217, "step": 950, "valid_targets_mean": 7186.8, "valid_targets_min": 4890 }, { "epoch": 1.33008356545961, "grad_norm": 0.620429539040831, "learning_rate": 3.90267031465131e-05, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.1147976964712143, "step": 955, "valid_targets_mean": 6544.4, "valid_targets_min": 4615 }, { "epoch": 1.3370473537604457, "grad_norm": 0.47863602052631893, "learning_rate": 3.9005184352688514e-05, "loss": 0.2318, "loss_nan_ranks": 0, "loss_rank_avg": 0.1220189705491066, "step": 960, "valid_targets_mean": 6339.2, "valid_targets_min": 4798 }, { "epoch": 1.3440111420612815, "grad_norm": 0.6133989682966983, "learning_rate": 3.89834363358446e-05, "loss": 0.1994, "loss_nan_ranks": 0, "loss_rank_avg": 0.1313786804676056, "step": 965, "valid_targets_mean": 4558.8, "valid_targets_min": 148 }, { "epoch": 1.350974930362117, "grad_norm": 0.45702297334659797, "learning_rate": 3.896145935828592e-05, "loss": 0.2258, "loss_nan_ranks": 0, "loss_rank_avg": 0.124158576130867, "step": 970, "valid_targets_mean": 6807.9, "valid_targets_min": 5164 }, { "epoch": 1.3579387186629526, "grad_norm": 0.4313724233091901, "learning_rate": 3.893925368507852e-05, "loss": 0.2178, "loss_nan_ranks": 0, "loss_rank_avg": 0.11191289126873016, "step": 975, "valid_targets_mean": 7011.8, "valid_targets_min": 4974 }, { "epoch": 1.3649025069637883, "grad_norm": 0.46720364315569657, "learning_rate": 3.891681958404675e-05, "loss": 0.2258, "loss_nan_ranks": 0, "loss_rank_avg": 0.10171587765216827, "step": 980, "valid_targets_mean": 5794.2, "valid_targets_min": 4809 }, { "epoch": 1.371866295264624, "grad_norm": 0.43110533517562993, "learning_rate": 3.8894157325770085e-05, "loss": 0.2137, "loss_nan_ranks": 0, "loss_rank_avg": 0.10188580304384232, "step": 985, "valid_targets_mean": 6401.8, "valid_targets_min": 4842 }, { "epoch": 1.3788300835654597, "grad_norm": 0.44932522936305014, "learning_rate": 3.887126718357978e-05, "loss": 0.2193, "loss_nan_ranks": 0, "loss_rank_avg": 0.1125284880399704, "step": 990, "valid_targets_mean": 6182.1, "valid_targets_min": 5116 }, { "epoch": 1.3857938718662952, "grad_norm": 0.42140650517718253, "learning_rate": 3.884814943355565e-05, "loss": 0.2192, "loss_nan_ranks": 0, "loss_rank_avg": 0.10108678042888641, "step": 995, "valid_targets_mean": 6165.1, "valid_targets_min": 5764 }, { "epoch": 1.392757660167131, "grad_norm": 0.9460709949341402, "learning_rate": 3.882480435452268e-05, "loss": 0.2509, "loss_nan_ranks": 0, "loss_rank_avg": 0.09195755422115326, "step": 1000, "valid_targets_mean": 1428.2, "valid_targets_min": 1062 }, { "epoch": 1.3997214484679665, "grad_norm": 1.0910007125977519, "learning_rate": 3.88012322280477e-05, "loss": 0.2267, "loss_nan_ranks": 0, "loss_rank_avg": 0.10902673006057739, "step": 1005, "valid_targets_mean": 1663.0, "valid_targets_min": 960 }, { "epoch": 1.4066852367688023, "grad_norm": 0.8694966611159818, "learning_rate": 3.877743333843599e-05, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.10752002894878387, "step": 1010, "valid_targets_mean": 1476.5, "valid_targets_min": 933 }, { "epoch": 1.4136490250696379, "grad_norm": 0.8363762394596167, "learning_rate": 3.875340797272781e-05, "loss": 0.2181, "loss_nan_ranks": 0, "loss_rank_avg": 0.10708215087652206, "step": 1015, "valid_targets_mean": 1478.1, "valid_targets_min": 881 }, { "epoch": 1.4206128133704734, "grad_norm": 0.9058452941123465, "learning_rate": 3.872915642069499e-05, "loss": 0.2195, "loss_nan_ranks": 0, "loss_rank_avg": 0.1283268928527832, "step": 1020, "valid_targets_mean": 1640.6, "valid_targets_min": 869 }, { "epoch": 1.4275766016713092, "grad_norm": 1.1890706352537899, "learning_rate": 3.87046789748374e-05, "loss": 0.2227, "loss_nan_ranks": 0, "loss_rank_avg": 0.11645996570587158, "step": 1025, "valid_targets_mean": 1709.0, "valid_targets_min": 1090 }, { "epoch": 1.434540389972145, "grad_norm": 0.8343148724615661, "learning_rate": 3.867997593037943e-05, "loss": 0.2117, "loss_nan_ranks": 0, "loss_rank_avg": 0.08550204336643219, "step": 1030, "valid_targets_mean": 1157.9, "valid_targets_min": 761 }, { "epoch": 1.4415041782729805, "grad_norm": 0.7596563407523057, "learning_rate": 3.865504758526644e-05, "loss": 0.2283, "loss_nan_ranks": 0, "loss_rank_avg": 0.1036420613527298, "step": 1035, "valid_targets_mean": 1553.6, "valid_targets_min": 1241 }, { "epoch": 1.448467966573816, "grad_norm": 0.8589106034441814, "learning_rate": 3.8629894240161153e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.09890624135732651, "step": 1040, "valid_targets_mean": 1538.1, "valid_targets_min": 733 }, { "epoch": 1.4554317548746518, "grad_norm": 0.7911151876930106, "learning_rate": 3.8604516198440036e-05, "loss": 0.217, "loss_nan_ranks": 0, "loss_rank_avg": 0.06528353691101074, "step": 1045, "valid_targets_mean": 1250.6, "valid_targets_min": 835 }, { "epoch": 1.4623955431754876, "grad_norm": 0.787767064205962, "learning_rate": 3.857891376618965e-05, "loss": 0.2079, "loss_nan_ranks": 0, "loss_rank_avg": 0.12352828681468964, "step": 1050, "valid_targets_mean": 1596.2, "valid_targets_min": 1046 }, { "epoch": 1.4693593314763231, "grad_norm": 0.8571652833546958, "learning_rate": 3.855308725220293e-05, "loss": 0.2211, "loss_nan_ranks": 0, "loss_rank_avg": 0.10267695039510727, "step": 1055, "valid_targets_mean": 1646.5, "valid_targets_min": 797 }, { "epoch": 1.4763231197771587, "grad_norm": 0.9386572516522071, "learning_rate": 3.85270369679755e-05, "loss": 0.2091, "loss_nan_ranks": 0, "loss_rank_avg": 0.1088155061006546, "step": 1060, "valid_targets_mean": 1448.9, "valid_targets_min": 570 }, { "epoch": 1.4832869080779945, "grad_norm": 0.8090527333348528, "learning_rate": 3.850076322770186e-05, "loss": 0.2018, "loss_nan_ranks": 0, "loss_rank_avg": 0.07706055045127869, "step": 1065, "valid_targets_mean": 1164.1, "valid_targets_min": 548 }, { "epoch": 1.49025069637883, "grad_norm": 0.888098593113638, "learning_rate": 3.847426634827167e-05, "loss": 0.2002, "loss_nan_ranks": 0, "loss_rank_avg": 0.1056225374341011, "step": 1070, "valid_targets_mean": 1338.0, "valid_targets_min": 682 }, { "epoch": 1.4972144846796658, "grad_norm": 0.7475892854829238, "learning_rate": 3.844754664926586e-05, "loss": 0.2168, "loss_nan_ranks": 0, "loss_rank_avg": 0.10795626044273376, "step": 1075, "valid_targets_mean": 1632.8, "valid_targets_min": 896 }, { "epoch": 1.5041782729805013, "grad_norm": 0.7767225037367806, "learning_rate": 3.842060445295283e-05, "loss": 0.2178, "loss_nan_ranks": 0, "loss_rank_avg": 0.13912582397460938, "step": 1080, "valid_targets_mean": 1806.5, "valid_targets_min": 597 }, { "epoch": 1.511142061281337, "grad_norm": 0.8482626365324997, "learning_rate": 3.839344008428451e-05, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.09307943284511566, "step": 1085, "valid_targets_mean": 1289.9, "valid_targets_min": 706 }, { "epoch": 1.5181058495821727, "grad_norm": 0.7497328533096577, "learning_rate": 3.836605387089248e-05, "loss": 0.2125, "loss_nan_ranks": 0, "loss_rank_avg": 0.06710005551576614, "step": 1090, "valid_targets_mean": 1354.1, "valid_targets_min": 754 }, { "epoch": 1.5250696378830084, "grad_norm": 0.7897926297952617, "learning_rate": 3.8338446143084015e-05, "loss": 0.2073, "loss_nan_ranks": 0, "loss_rank_avg": 0.0963955968618393, "step": 1095, "valid_targets_mean": 1461.9, "valid_targets_min": 819 }, { "epoch": 1.532033426183844, "grad_norm": 0.8054353338785877, "learning_rate": 3.8310617233838094e-05, "loss": 0.2164, "loss_nan_ranks": 0, "loss_rank_avg": 0.08029267191886902, "step": 1100, "valid_targets_mean": 1225.5, "valid_targets_min": 684 }, { "epoch": 1.5389972144846795, "grad_norm": 0.9118859088683984, "learning_rate": 3.828256747880137e-05, "loss": 0.2219, "loss_nan_ranks": 0, "loss_rank_avg": 0.10978655517101288, "step": 1105, "valid_targets_mean": 1282.2, "valid_targets_min": 711 }, { "epoch": 1.5459610027855153, "grad_norm": 0.7673580373354333, "learning_rate": 3.825429721628411e-05, "loss": 0.2065, "loss_nan_ranks": 0, "loss_rank_avg": 0.11380324512720108, "step": 1110, "valid_targets_mean": 1634.8, "valid_targets_min": 1190 }, { "epoch": 1.552924791086351, "grad_norm": 0.8522675201936903, "learning_rate": 3.822580678725621e-05, "loss": 0.2015, "loss_nan_ranks": 0, "loss_rank_avg": 0.10675722360610962, "step": 1115, "valid_targets_mean": 1615.9, "valid_targets_min": 774 }, { "epoch": 1.5598885793871866, "grad_norm": 0.7180000643578018, "learning_rate": 3.819709653534295e-05, "loss": 0.2055, "loss_nan_ranks": 0, "loss_rank_avg": 0.10761082917451859, "step": 1120, "valid_targets_mean": 1848.4, "valid_targets_min": 734 }, { "epoch": 1.5668523676880222, "grad_norm": 0.8256061679097826, "learning_rate": 3.8168166806820924e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.10491684079170227, "step": 1125, "valid_targets_mean": 1570.6, "valid_targets_min": 1011 }, { "epoch": 1.573816155988858, "grad_norm": 0.800219846734056, "learning_rate": 3.813901795061387e-05, "loss": 0.2072, "loss_nan_ranks": 0, "loss_rank_avg": 0.1188449040055275, "step": 1130, "valid_targets_mean": 1697.0, "valid_targets_min": 803 }, { "epoch": 1.5807799442896937, "grad_norm": 0.7849874656744029, "learning_rate": 3.810965031828843e-05, "loss": 0.2079, "loss_nan_ranks": 0, "loss_rank_avg": 0.08988340198993683, "step": 1135, "valid_targets_mean": 1307.1, "valid_targets_min": 782 }, { "epoch": 1.5877437325905293, "grad_norm": 0.7519337668408274, "learning_rate": 3.808006426404991e-05, "loss": 0.2009, "loss_nan_ranks": 0, "loss_rank_avg": 0.10832203924655914, "step": 1140, "valid_targets_mean": 1596.6, "valid_targets_min": 646 }, { "epoch": 1.5947075208913648, "grad_norm": 0.7913090801912336, "learning_rate": 3.805026014473803e-05, "loss": 0.2113, "loss_nan_ranks": 0, "loss_rank_avg": 0.14530369639396667, "step": 1145, "valid_targets_mean": 1817.5, "valid_targets_min": 922 }, { "epoch": 1.6016713091922006, "grad_norm": 0.8006210281974334, "learning_rate": 3.802023831982262e-05, "loss": 0.2089, "loss_nan_ranks": 0, "loss_rank_avg": 0.11583166569471359, "step": 1150, "valid_targets_mean": 1822.2, "valid_targets_min": 796 }, { "epoch": 1.6086350974930363, "grad_norm": 0.8429365694331502, "learning_rate": 3.798999915139926e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.10505574196577072, "step": 1155, "valid_targets_mean": 1542.4, "valid_targets_min": 903 }, { "epoch": 1.615598885793872, "grad_norm": 0.9071692515157804, "learning_rate": 3.795954300418494e-05, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.11454838514328003, "step": 1160, "valid_targets_mean": 1459.5, "valid_targets_min": 780 }, { "epoch": 1.6225626740947074, "grad_norm": 0.7700813936036295, "learning_rate": 3.792887024551363e-05, "loss": 0.1972, "loss_nan_ranks": 0, "loss_rank_avg": 0.10751248896121979, "step": 1165, "valid_targets_mean": 1581.1, "valid_targets_min": 783 }, { "epoch": 1.6295264623955432, "grad_norm": 0.7587182482455052, "learning_rate": 3.7897981245331895e-05, "loss": 0.1996, "loss_nan_ranks": 0, "loss_rank_avg": 0.07905155420303345, "step": 1170, "valid_targets_mean": 1342.1, "valid_targets_min": 662 }, { "epoch": 1.636490250696379, "grad_norm": 0.8016804160384552, "learning_rate": 3.786687637619437e-05, "loss": 0.2016, "loss_nan_ranks": 0, "loss_rank_avg": 0.08902774751186371, "step": 1175, "valid_targets_mean": 1269.1, "valid_targets_min": 724 }, { "epoch": 1.6434540389972145, "grad_norm": 0.8762625648078411, "learning_rate": 3.783555601325933e-05, "loss": 0.1977, "loss_nan_ranks": 0, "loss_rank_avg": 0.11289331316947937, "step": 1180, "valid_targets_mean": 1510.1, "valid_targets_min": 966 }, { "epoch": 1.65041782729805, "grad_norm": 0.8362696841731547, "learning_rate": 3.7804020534284125e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.08795975148677826, "step": 1185, "valid_targets_mean": 1327.8, "valid_targets_min": 773 }, { "epoch": 1.6573816155988856, "grad_norm": 0.8217589431615828, "learning_rate": 3.7772270319620655e-05, "loss": 0.2014, "loss_nan_ranks": 0, "loss_rank_avg": 0.08339729905128479, "step": 1190, "valid_targets_mean": 1353.2, "valid_targets_min": 807 }, { "epoch": 1.6643454038997214, "grad_norm": 0.8481129752613321, "learning_rate": 3.774030575221073e-05, "loss": 0.2051, "loss_nan_ranks": 0, "loss_rank_avg": 0.07550103962421417, "step": 1195, "valid_targets_mean": 1142.5, "valid_targets_min": 782 }, { "epoch": 1.6713091922005572, "grad_norm": 0.7883067686921773, "learning_rate": 3.770812721758151e-05, "loss": 0.1964, "loss_nan_ranks": 0, "loss_rank_avg": 0.112126424908638, "step": 1200, "valid_targets_mean": 1849.9, "valid_targets_min": 634 }, { "epoch": 1.6782729805013927, "grad_norm": 0.7411457071163579, "learning_rate": 3.7675735103840844e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.10241081565618515, "step": 1205, "valid_targets_mean": 1599.6, "valid_targets_min": 573 }, { "epoch": 1.6852367688022283, "grad_norm": 0.7086572852054175, "learning_rate": 3.7643129801672535e-05, "loss": 0.2029, "loss_nan_ranks": 0, "loss_rank_avg": 0.11208580434322357, "step": 1210, "valid_targets_mean": 1994.9, "valid_targets_min": 1102 }, { "epoch": 1.692200557103064, "grad_norm": 0.8779677269614039, "learning_rate": 3.76103117043317e-05, "loss": 0.2095, "loss_nan_ranks": 0, "loss_rank_avg": 0.07884174585342407, "step": 1215, "valid_targets_mean": 1239.2, "valid_targets_min": 841 }, { "epoch": 1.6991643454038998, "grad_norm": 0.7715841944120366, "learning_rate": 3.757728120763998e-05, "loss": 0.1967, "loss_nan_ranks": 0, "loss_rank_avg": 0.09706147015094757, "step": 1220, "valid_targets_mean": 1467.5, "valid_targets_min": 956 }, { "epoch": 1.7061281337047354, "grad_norm": 0.8840496408494232, "learning_rate": 3.754403870998079e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.10566884279251099, "step": 1225, "valid_targets_mean": 1300.9, "valid_targets_min": 857 }, { "epoch": 1.713091922005571, "grad_norm": 0.9178621719926586, "learning_rate": 3.7510584612294506e-05, "loss": 0.2045, "loss_nan_ranks": 0, "loss_rank_avg": 0.10823386162519455, "step": 1230, "valid_targets_mean": 1389.8, "valid_targets_min": 808 }, { "epoch": 1.7200557103064067, "grad_norm": 0.938154160967897, "learning_rate": 3.747691931807362e-05, "loss": 0.1897, "loss_nan_ranks": 0, "loss_rank_avg": 0.08545945584774017, "step": 1235, "valid_targets_mean": 1303.8, "valid_targets_min": 677 }, { "epoch": 1.7270194986072425, "grad_norm": 0.8217723401413547, "learning_rate": 3.744304323335787e-05, "loss": 0.1962, "loss_nan_ranks": 0, "loss_rank_avg": 0.0866972804069519, "step": 1240, "valid_targets_mean": 1220.1, "valid_targets_min": 727 }, { "epoch": 1.733983286908078, "grad_norm": 0.7965558518328687, "learning_rate": 3.7408956766729406e-05, "loss": 0.1997, "loss_nan_ranks": 0, "loss_rank_avg": 0.0839056596159935, "step": 1245, "valid_targets_mean": 1262.0, "valid_targets_min": 726 }, { "epoch": 1.7409470752089136, "grad_norm": 0.7985361430147639, "learning_rate": 3.737466032930775e-05, "loss": 0.2069, "loss_nan_ranks": 0, "loss_rank_avg": 0.11801943182945251, "step": 1250, "valid_targets_mean": 1615.0, "valid_targets_min": 669 }, { "epoch": 1.7479108635097493, "grad_norm": 0.7163362819024491, "learning_rate": 3.7340154334744933e-05, "loss": 0.1998, "loss_nan_ranks": 0, "loss_rank_avg": 0.11403729021549225, "step": 1255, "valid_targets_mean": 1806.5, "valid_targets_min": 792 }, { "epoch": 1.754874651810585, "grad_norm": 0.76114767590763, "learning_rate": 3.7305439199220466e-05, "loss": 0.197, "loss_nan_ranks": 0, "loss_rank_avg": 0.09969079494476318, "step": 1260, "valid_targets_mean": 1627.6, "valid_targets_min": 736 }, { "epoch": 1.7618384401114207, "grad_norm": 0.7967512334914618, "learning_rate": 3.727051534143631e-05, "loss": 0.2039, "loss_nan_ranks": 0, "loss_rank_avg": 0.14327603578567505, "step": 1265, "valid_targets_mean": 1822.9, "valid_targets_min": 694 }, { "epoch": 1.7688022284122562, "grad_norm": 0.7047699568272487, "learning_rate": 3.723538318261186e-05, "loss": 0.1954, "loss_nan_ranks": 0, "loss_rank_avg": 0.1259545087814331, "step": 1270, "valid_targets_mean": 1848.9, "valid_targets_min": 1437 }, { "epoch": 1.775766016713092, "grad_norm": 0.7684434862741877, "learning_rate": 3.720004314647884e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.12424354255199432, "step": 1275, "valid_targets_mean": 1852.4, "valid_targets_min": 809 }, { "epoch": 1.7827298050139275, "grad_norm": 0.7865791196195834, "learning_rate": 3.7164495659276195e-05, "loss": 0.1946, "loss_nan_ranks": 0, "loss_rank_avg": 0.09065093100070953, "step": 1280, "valid_targets_mean": 1375.5, "valid_targets_min": 790 }, { "epoch": 1.7896935933147633, "grad_norm": 0.8290020685682563, "learning_rate": 3.712874114974496e-05, "loss": 0.1854, "loss_nan_ranks": 0, "loss_rank_avg": 0.0918719470500946, "step": 1285, "valid_targets_mean": 1338.8, "valid_targets_min": 750 }, { "epoch": 1.7966573816155988, "grad_norm": 0.7994498344708911, "learning_rate": 3.7092780049123076e-05, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.12238575518131256, "step": 1290, "valid_targets_mean": 1778.8, "valid_targets_min": 826 }, { "epoch": 1.8036211699164344, "grad_norm": 0.7645358833299734, "learning_rate": 3.7056612791140204e-05, "loss": 0.1938, "loss_nan_ranks": 0, "loss_rank_avg": 0.08983242511749268, "step": 1295, "valid_targets_mean": 1600.8, "valid_targets_min": 907 }, { "epoch": 1.8105849582172702, "grad_norm": 0.7839077663753583, "learning_rate": 3.7020239812012473e-05, "loss": 0.1917, "loss_nan_ranks": 0, "loss_rank_avg": 0.1056416928768158, "step": 1300, "valid_targets_mean": 1474.5, "valid_targets_min": 1093 }, { "epoch": 1.817548746518106, "grad_norm": 0.76163948748665, "learning_rate": 3.698366155043724e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.10014639794826508, "step": 1305, "valid_targets_mean": 1577.2, "valid_targets_min": 1119 }, { "epoch": 1.8245125348189415, "grad_norm": 1.7707818510491133, "learning_rate": 3.694687844758779e-05, "loss": 0.1962, "loss_nan_ranks": 0, "loss_rank_avg": 0.11413945257663727, "step": 1310, "valid_targets_mean": 1512.1, "valid_targets_min": 700 }, { "epoch": 1.831476323119777, "grad_norm": 0.7668240309562283, "learning_rate": 3.6909890947108016e-05, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.07934726029634476, "step": 1315, "valid_targets_mean": 1288.2, "valid_targets_min": 810 }, { "epoch": 1.8384401114206128, "grad_norm": 0.8996028117422565, "learning_rate": 3.687269949510705e-05, "loss": 0.2007, "loss_nan_ranks": 0, "loss_rank_avg": 0.09808281809091568, "step": 1320, "valid_targets_mean": 1328.9, "valid_targets_min": 635 }, { "epoch": 1.8454038997214486, "grad_norm": 0.8176602096459092, "learning_rate": 3.6835304540153914e-05, "loss": 0.1931, "loss_nan_ranks": 0, "loss_rank_avg": 0.11697147786617279, "step": 1325, "valid_targets_mean": 1542.5, "valid_targets_min": 673 }, { "epoch": 1.8523676880222841, "grad_norm": 1.1979420435140948, "learning_rate": 3.67977065332721e-05, "loss": 0.2077, "loss_nan_ranks": 0, "loss_rank_avg": 0.1085534319281578, "step": 1330, "valid_targets_mean": 1215.6, "valid_targets_min": 641 }, { "epoch": 1.8593314763231197, "grad_norm": 0.8466439137236119, "learning_rate": 3.6759905927934115e-05, "loss": 0.1943, "loss_nan_ranks": 0, "loss_rank_avg": 0.08859957754611969, "step": 1335, "valid_targets_mean": 1222.6, "valid_targets_min": 701 }, { "epoch": 1.8662952646239555, "grad_norm": 0.7520419595750739, "learning_rate": 3.672190318005603e-05, "loss": 0.211, "loss_nan_ranks": 0, "loss_rank_avg": 0.10533758252859116, "step": 1340, "valid_targets_mean": 1850.6, "valid_targets_min": 1202 }, { "epoch": 1.8732590529247912, "grad_norm": 0.7954441568911064, "learning_rate": 3.6683698747991963e-05, "loss": 0.1974, "loss_nan_ranks": 0, "loss_rank_avg": 0.07728315144777298, "step": 1345, "valid_targets_mean": 1265.5, "valid_targets_min": 657 }, { "epoch": 1.8802228412256268, "grad_norm": 0.8167699792397287, "learning_rate": 3.6645293092528565e-05, "loss": 0.2028, "loss_nan_ranks": 0, "loss_rank_avg": 0.09353001415729523, "step": 1350, "valid_targets_mean": 1388.0, "valid_targets_min": 672 }, { "epoch": 1.8871866295264623, "grad_norm": 0.7414620593948343, "learning_rate": 3.660668667687946e-05, "loss": 0.1954, "loss_nan_ranks": 0, "loss_rank_avg": 0.119552381336689, "step": 1355, "valid_targets_mean": 1813.6, "valid_targets_min": 1019 }, { "epoch": 1.894150417827298, "grad_norm": 0.8151102750049719, "learning_rate": 3.6567879966679667e-05, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.07849185168743134, "step": 1360, "valid_targets_mean": 1114.6, "valid_targets_min": 732 }, { "epoch": 1.9011142061281339, "grad_norm": 0.8226820998476463, "learning_rate": 3.6528873429979946e-05, "loss": 0.2021, "loss_nan_ranks": 0, "loss_rank_avg": 0.07085934281349182, "step": 1365, "valid_targets_mean": 1194.5, "valid_targets_min": 634 }, { "epoch": 1.9080779944289694, "grad_norm": 0.6954859825201096, "learning_rate": 3.64896675372412e-05, "loss": 0.1917, "loss_nan_ranks": 0, "loss_rank_avg": 0.10201038420200348, "step": 1370, "valid_targets_mean": 1756.5, "valid_targets_min": 905 }, { "epoch": 1.915041782729805, "grad_norm": 0.7713340565719015, "learning_rate": 3.645026276132877e-05, "loss": 0.1925, "loss_nan_ranks": 0, "loss_rank_avg": 0.1128055602312088, "step": 1375, "valid_targets_mean": 1554.9, "valid_targets_min": 596 }, { "epoch": 1.9220055710306405, "grad_norm": 0.7927271064032854, "learning_rate": 3.6410659577506773e-05, "loss": 0.1873, "loss_nan_ranks": 0, "loss_rank_avg": 0.07899089902639389, "step": 1380, "valid_targets_mean": 1214.6, "valid_targets_min": 687 }, { "epoch": 1.9289693593314763, "grad_norm": 0.7718601693739504, "learning_rate": 3.63708584634323e-05, "loss": 0.2054, "loss_nan_ranks": 0, "loss_rank_avg": 0.11290781199932098, "step": 1385, "valid_targets_mean": 1955.1, "valid_targets_min": 1199 }, { "epoch": 1.935933147632312, "grad_norm": 0.7193801549469071, "learning_rate": 3.6330859899149694e-05, "loss": 0.193, "loss_nan_ranks": 0, "loss_rank_avg": 0.10013289004564285, "step": 1390, "valid_targets_mean": 1758.6, "valid_targets_min": 1214 }, { "epoch": 1.9428969359331476, "grad_norm": 0.726016091373521, "learning_rate": 3.629066436708481e-05, "loss": 0.1894, "loss_nan_ranks": 0, "loss_rank_avg": 0.09914419054985046, "step": 1395, "valid_targets_mean": 1711.5, "valid_targets_min": 1122 }, { "epoch": 1.9498607242339832, "grad_norm": 0.8210382354675453, "learning_rate": 3.625027235203909e-05, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.09899426996707916, "step": 1400, "valid_targets_mean": 1489.6, "valid_targets_min": 850 }, { "epoch": 1.956824512534819, "grad_norm": 0.7429817246292151, "learning_rate": 3.6209684341183803e-05, "loss": 0.1786, "loss_nan_ranks": 0, "loss_rank_avg": 0.08339495956897736, "step": 1405, "valid_targets_mean": 1572.4, "valid_targets_min": 1318 }, { "epoch": 1.9637883008356547, "grad_norm": 0.7739403851396445, "learning_rate": 3.6168900824054135e-05, "loss": 0.197, "loss_nan_ranks": 0, "loss_rank_avg": 0.1083778664469719, "step": 1410, "valid_targets_mean": 1500.0, "valid_targets_min": 1043 }, { "epoch": 1.9707520891364902, "grad_norm": 0.7568148924154536, "learning_rate": 3.612792229254327e-05, "loss": 0.1966, "loss_nan_ranks": 0, "loss_rank_avg": 0.11948154121637344, "step": 1415, "valid_targets_mean": 1774.9, "valid_targets_min": 920 }, { "epoch": 1.9777158774373258, "grad_norm": 0.6992261616231107, "learning_rate": 3.608674924089651e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.10174979269504547, "step": 1420, "valid_targets_mean": 1547.1, "valid_targets_min": 847 }, { "epoch": 1.9846796657381616, "grad_norm": 0.7035138286444061, "learning_rate": 3.6045382165705255e-05, "loss": 0.1942, "loss_nan_ranks": 0, "loss_rank_avg": 0.10589592158794403, "step": 1425, "valid_targets_mean": 1769.4, "valid_targets_min": 738 }, { "epoch": 1.9916434540389973, "grad_norm": 0.8155181230292006, "learning_rate": 3.600382156590104e-05, "loss": 0.2003, "loss_nan_ranks": 0, "loss_rank_avg": 0.10955852270126343, "step": 1430, "valid_targets_mean": 1540.1, "valid_targets_min": 594 }, { "epoch": 1.998607242339833, "grad_norm": 0.6347666367578908, "learning_rate": 3.5962067942749516e-05, "loss": 0.1994, "loss_nan_ranks": 0, "loss_rank_avg": 0.10341192036867142, "step": 1435, "valid_targets_mean": 2228.6, "valid_targets_min": 1393 }, { "epoch": 2.0055710306406684, "grad_norm": 0.5577761958239622, "learning_rate": 3.592012179984442e-05, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.18662209808826447, "step": 1440, "valid_targets_mean": 8029.9, "valid_targets_min": 6142 }, { "epoch": 2.012534818941504, "grad_norm": 0.483618877635035, "learning_rate": 3.587798364310146e-05, "loss": 0.2322, "loss_nan_ranks": 0, "loss_rank_avg": 0.11201878637075424, "step": 1445, "valid_targets_mean": 6664.0, "valid_targets_min": 5470 }, { "epoch": 2.01949860724234, "grad_norm": 0.5185691459202105, "learning_rate": 3.583565398075226e-05, "loss": 0.2276, "loss_nan_ranks": 0, "loss_rank_avg": 0.11615484952926636, "step": 1450, "valid_targets_mean": 7126.9, "valid_targets_min": 5368 }, { "epoch": 2.0264623955431755, "grad_norm": 0.438228030552986, "learning_rate": 3.579313332333819e-05, "loss": 0.2123, "loss_nan_ranks": 0, "loss_rank_avg": 0.10276132822036743, "step": 1455, "valid_targets_mean": 7634.9, "valid_targets_min": 5614 }, { "epoch": 2.033426183844011, "grad_norm": 0.3948344228513168, "learning_rate": 3.575042218370423e-05, "loss": 0.2174, "loss_nan_ranks": 0, "loss_rank_avg": 0.1019166111946106, "step": 1460, "valid_targets_mean": 8630.8, "valid_targets_min": 6362 }, { "epoch": 2.0403899721448466, "grad_norm": 0.4535316383686147, "learning_rate": 3.570752107699281e-05, "loss": 0.2212, "loss_nan_ranks": 0, "loss_rank_avg": 0.10765604674816132, "step": 1465, "valid_targets_mean": 7383.6, "valid_targets_min": 5844 }, { "epoch": 2.0473537604456826, "grad_norm": 0.4216201437635594, "learning_rate": 3.566443052063751e-05, "loss": 0.2323, "loss_nan_ranks": 0, "loss_rank_avg": 0.12464028596878052, "step": 1470, "valid_targets_mean": 8017.0, "valid_targets_min": 5283 }, { "epoch": 2.054317548746518, "grad_norm": 0.3816491538208156, "learning_rate": 3.5621151034356927e-05, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.09279941767454147, "step": 1475, "valid_targets_mean": 7051.1, "valid_targets_min": 4135 }, { "epoch": 2.0612813370473537, "grad_norm": 0.41992932447893627, "learning_rate": 3.557768314014834e-05, "loss": 0.2121, "loss_nan_ranks": 0, "loss_rank_avg": 0.09113673865795135, "step": 1480, "valid_targets_mean": 5370.4, "valid_targets_min": 3919 }, { "epoch": 2.0682451253481893, "grad_norm": 0.3912975995428693, "learning_rate": 3.5534027362281436e-05, "loss": 0.2023, "loss_nan_ranks": 0, "loss_rank_avg": 0.0919366329908371, "step": 1485, "valid_targets_mean": 6063.6, "valid_targets_min": 4863 }, { "epoch": 2.0752089136490253, "grad_norm": 0.4107622241608645, "learning_rate": 3.549018422729197e-05, "loss": 0.2167, "loss_nan_ranks": 0, "loss_rank_avg": 0.10401890426874161, "step": 1490, "valid_targets_mean": 7001.2, "valid_targets_min": 6020 }, { "epoch": 2.082172701949861, "grad_norm": 0.39061276611048656, "learning_rate": 3.544615426397543e-05, "loss": 0.2031, "loss_nan_ranks": 0, "loss_rank_avg": 0.101812943816185, "step": 1495, "valid_targets_mean": 6181.9, "valid_targets_min": 4669 }, { "epoch": 2.0891364902506964, "grad_norm": 0.38035206361099594, "learning_rate": 3.5401938003380666e-05, "loss": 0.2093, "loss_nan_ranks": 0, "loss_rank_avg": 0.09549552947282791, "step": 1500, "valid_targets_mean": 6250.2, "valid_targets_min": 4900 }, { "epoch": 2.096100278551532, "grad_norm": 0.43005142535025387, "learning_rate": 3.5357535978803455e-05, "loss": 0.2014, "loss_nan_ranks": 0, "loss_rank_avg": 0.09210428595542908, "step": 1505, "valid_targets_mean": 7156.4, "valid_targets_min": 5323 }, { "epoch": 2.103064066852368, "grad_norm": 0.40901081252647176, "learning_rate": 3.53129487257801e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.10530374944210052, "step": 1510, "valid_targets_mean": 7215.8, "valid_targets_min": 4720 }, { "epoch": 2.1100278551532035, "grad_norm": 0.412691959227041, "learning_rate": 3.5268176782080967e-05, "loss": 0.2108, "loss_nan_ranks": 0, "loss_rank_avg": 0.10234518349170685, "step": 1515, "valid_targets_mean": 6550.8, "valid_targets_min": 5739 }, { "epoch": 2.116991643454039, "grad_norm": 0.3904193639606634, "learning_rate": 3.522322068770397e-05, "loss": 0.2026, "loss_nan_ranks": 0, "loss_rank_avg": 0.10454997420310974, "step": 1520, "valid_targets_mean": 6726.8, "valid_targets_min": 4540 }, { "epoch": 2.1239554317548746, "grad_norm": 0.5086857986092044, "learning_rate": 3.51780809848681e-05, "loss": 0.212, "loss_nan_ranks": 0, "loss_rank_avg": 0.11639285087585449, "step": 1525, "valid_targets_mean": 4573.4, "valid_targets_min": 1039 }, { "epoch": 2.13091922005571, "grad_norm": 0.4916720484004185, "learning_rate": 3.513275821800684e-05, "loss": 0.2247, "loss_nan_ranks": 0, "loss_rank_avg": 0.10517747700214386, "step": 1530, "valid_targets_mean": 6430.0, "valid_targets_min": 5412 }, { "epoch": 2.137883008356546, "grad_norm": 0.7279504673107768, "learning_rate": 3.5087252933761654e-05, "loss": 0.2099, "loss_nan_ranks": 0, "loss_rank_avg": 0.03320852294564247, "step": 1535, "valid_targets_mean": 583.1, "valid_targets_min": 158 }, { "epoch": 2.1448467966573816, "grad_norm": 0.38537163974446353, "learning_rate": 3.504156568097533e-05, "loss": 0.1918, "loss_nan_ranks": 0, "loss_rank_avg": 0.10623390972614288, "step": 1540, "valid_targets_mean": 8230.9, "valid_targets_min": 5061 }, { "epoch": 2.151810584958217, "grad_norm": 0.41759228803004284, "learning_rate": 3.4995697010685415e-05, "loss": 0.205, "loss_nan_ranks": 0, "loss_rank_avg": 0.11333325505256653, "step": 1545, "valid_targets_mean": 7238.9, "valid_targets_min": 5112 }, { "epoch": 2.1587743732590527, "grad_norm": 0.4142412953268547, "learning_rate": 3.4949647476117535e-05, "loss": 0.204, "loss_nan_ranks": 0, "loss_rank_avg": 0.09155681729316711, "step": 1550, "valid_targets_mean": 6322.8, "valid_targets_min": 4867 }, { "epoch": 2.1657381615598887, "grad_norm": 0.38370921033703687, "learning_rate": 3.4903417632678746e-05, "loss": 0.212, "loss_nan_ranks": 0, "loss_rank_avg": 0.10269880294799805, "step": 1555, "valid_targets_mean": 7887.0, "valid_targets_min": 6004 }, { "epoch": 2.1727019498607243, "grad_norm": 0.3711170733226334, "learning_rate": 3.4857008037950814e-05, "loss": 0.2024, "loss_nan_ranks": 0, "loss_rank_avg": 0.09217008948326111, "step": 1560, "valid_targets_mean": 7090.2, "valid_targets_min": 4917 }, { "epoch": 2.17966573816156, "grad_norm": 0.3940923954443781, "learning_rate": 3.481041925168349e-05, "loss": 0.1942, "loss_nan_ranks": 0, "loss_rank_avg": 0.09533364325761795, "step": 1565, "valid_targets_mean": 7441.9, "valid_targets_min": 4202 }, { "epoch": 2.1866295264623954, "grad_norm": 0.38589644774474163, "learning_rate": 3.476365183578779e-05, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.09489143639802933, "step": 1570, "valid_targets_mean": 7901.8, "valid_targets_min": 5060 }, { "epoch": 2.1935933147632314, "grad_norm": 0.32887624393579473, "learning_rate": 3.471670635432919e-05, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.08562236279249191, "step": 1575, "valid_targets_mean": 8557.6, "valid_targets_min": 6331 }, { "epoch": 2.200557103064067, "grad_norm": 0.45867578912244944, "learning_rate": 3.466958337352082e-05, "loss": 0.2123, "loss_nan_ranks": 0, "loss_rank_avg": 0.09923288971185684, "step": 1580, "valid_targets_mean": 4976.4, "valid_targets_min": 2847 }, { "epoch": 2.2075208913649025, "grad_norm": 0.4238519335072428, "learning_rate": 3.462228346171664e-05, "loss": 0.2029, "loss_nan_ranks": 0, "loss_rank_avg": 0.11293122917413712, "step": 1585, "valid_targets_mean": 7129.1, "valid_targets_min": 5331 }, { "epoch": 2.214484679665738, "grad_norm": 0.4164534419411376, "learning_rate": 3.457480718940461e-05, "loss": 0.2147, "loss_nan_ranks": 0, "loss_rank_avg": 0.1091599240899086, "step": 1590, "valid_targets_mean": 6864.0, "valid_targets_min": 4697 }, { "epoch": 2.2214484679665736, "grad_norm": 0.42010359781278844, "learning_rate": 3.4527155129199766e-05, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.10069143772125244, "step": 1595, "valid_targets_mean": 6631.9, "valid_targets_min": 4623 }, { "epoch": 2.2284122562674096, "grad_norm": 0.43617878030396867, "learning_rate": 3.447932785583735e-05, "loss": 0.212, "loss_nan_ranks": 0, "loss_rank_avg": 0.09616230428218842, "step": 1600, "valid_targets_mean": 6330.4, "valid_targets_min": 5424 }, { "epoch": 2.235376044568245, "grad_norm": 0.41414881589071445, "learning_rate": 3.4431325946165847e-05, "loss": 0.2036, "loss_nan_ranks": 0, "loss_rank_avg": 0.09712429344654083, "step": 1605, "valid_targets_mean": 6814.8, "valid_targets_min": 4964 }, { "epoch": 2.2423398328690807, "grad_norm": 0.4444215191301066, "learning_rate": 3.438314997914006e-05, "loss": 0.2125, "loss_nan_ranks": 0, "loss_rank_avg": 0.11258673667907715, "step": 1610, "valid_targets_mean": 6915.8, "valid_targets_min": 5321 }, { "epoch": 2.2493036211699167, "grad_norm": 0.41522878354353365, "learning_rate": 3.433480053581412e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.10380226373672485, "step": 1615, "valid_targets_mean": 6464.5, "valid_targets_min": 5185 }, { "epoch": 2.256267409470752, "grad_norm": 0.4467050398625796, "learning_rate": 3.4286278199334436e-05, "loss": 0.2077, "loss_nan_ranks": 0, "loss_rank_avg": 0.10517797619104385, "step": 1620, "valid_targets_mean": 7048.6, "valid_targets_min": 4913 }, { "epoch": 2.2632311977715878, "grad_norm": 0.4232921124371884, "learning_rate": 3.4237583554932726e-05, "loss": 0.2093, "loss_nan_ranks": 0, "loss_rank_avg": 0.11401194334030151, "step": 1625, "valid_targets_mean": 7469.2, "valid_targets_min": 5426 }, { "epoch": 2.2701949860724233, "grad_norm": 0.4259278689375421, "learning_rate": 3.4188717189918915e-05, "loss": 0.2091, "loss_nan_ranks": 0, "loss_rank_avg": 0.10883718729019165, "step": 1630, "valid_targets_mean": 6819.4, "valid_targets_min": 5286 }, { "epoch": 2.277158774373259, "grad_norm": 0.412251669431946, "learning_rate": 3.413967969367406e-05, "loss": 0.2085, "loss_nan_ranks": 0, "loss_rank_avg": 0.10999740660190582, "step": 1635, "valid_targets_mean": 7107.5, "valid_targets_min": 5201 }, { "epoch": 2.284122562674095, "grad_norm": 0.42374140207835653, "learning_rate": 3.4090471657643254e-05, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.09911487251520157, "step": 1640, "valid_targets_mean": 5642.6, "valid_targets_min": 4838 }, { "epoch": 2.2910863509749304, "grad_norm": 0.9807420220774704, "learning_rate": 3.404109367532847e-05, "loss": 0.182, "loss_nan_ranks": 0, "loss_rank_avg": 0.19164110720157623, "step": 1645, "valid_targets_mean": 2054.1, "valid_targets_min": 134 }, { "epoch": 2.298050139275766, "grad_norm": 0.5566049180562685, "learning_rate": 3.399154634228144e-05, "loss": 0.2081, "loss_nan_ranks": 0, "loss_rank_avg": 0.0960545465350151, "step": 1650, "valid_targets_mean": 6686.4, "valid_targets_min": 5256 }, { "epoch": 2.3050139275766015, "grad_norm": 0.4253696878618078, "learning_rate": 3.394183025609644e-05, "loss": 0.1998, "loss_nan_ranks": 0, "loss_rank_avg": 0.1074969694018364, "step": 1655, "valid_targets_mean": 6216.6, "valid_targets_min": 5542 }, { "epoch": 2.3119777158774375, "grad_norm": 0.4131104336589319, "learning_rate": 3.3891946016403056e-05, "loss": 0.2038, "loss_nan_ranks": 0, "loss_rank_avg": 0.10091003775596619, "step": 1660, "valid_targets_mean": 6486.1, "valid_targets_min": 5531 }, { "epoch": 2.318941504178273, "grad_norm": 0.45874934809459283, "learning_rate": 3.384189422485904e-05, "loss": 0.1992, "loss_nan_ranks": 0, "loss_rank_avg": 0.09876036643981934, "step": 1665, "valid_targets_mean": 5797.4, "valid_targets_min": 3911 }, { "epoch": 2.3259052924791086, "grad_norm": 0.4246615076495944, "learning_rate": 3.3791675485142974e-05, "loss": 0.1991, "loss_nan_ranks": 0, "loss_rank_avg": 0.10160474479198456, "step": 1670, "valid_targets_mean": 6357.5, "valid_targets_min": 5195 }, { "epoch": 2.332869080779944, "grad_norm": 0.43609990408164573, "learning_rate": 3.374129040294701e-05, "loss": 0.2091, "loss_nan_ranks": 0, "loss_rank_avg": 0.10332215577363968, "step": 1675, "valid_targets_mean": 5808.9, "valid_targets_min": 4959 }, { "epoch": 2.33983286908078, "grad_norm": 0.5400090427254614, "learning_rate": 3.369073958596958e-05, "loss": 0.2043, "loss_nan_ranks": 0, "loss_rank_avg": 0.06865261495113373, "step": 1680, "valid_targets_mean": 2591.5, "valid_targets_min": 842 }, { "epoch": 2.3467966573816157, "grad_norm": 0.457933957702517, "learning_rate": 3.364002364390805e-05, "loss": 0.1793, "loss_nan_ranks": 0, "loss_rank_avg": 0.09762382507324219, "step": 1685, "valid_targets_mean": 6006.9, "valid_targets_min": 4769 }, { "epoch": 2.3537604456824512, "grad_norm": 0.4088785055658562, "learning_rate": 3.358914318845138e-05, "loss": 0.1974, "loss_nan_ranks": 0, "loss_rank_avg": 0.09737879037857056, "step": 1690, "valid_targets_mean": 6764.2, "valid_targets_min": 5046 }, { "epoch": 2.360724233983287, "grad_norm": 0.47400359842514794, "learning_rate": 3.353809883327273e-05, "loss": 0.2029, "loss_nan_ranks": 0, "loss_rank_avg": 0.10614047944545746, "step": 1695, "valid_targets_mean": 6055.8, "valid_targets_min": 5182 }, { "epoch": 2.3676880222841223, "grad_norm": 0.44156250020466503, "learning_rate": 3.348689119402209e-05, "loss": 0.1989, "loss_nan_ranks": 0, "loss_rank_avg": 0.10033164173364639, "step": 1700, "valid_targets_mean": 7101.6, "valid_targets_min": 5366 }, { "epoch": 2.3746518105849583, "grad_norm": 0.41213498850675423, "learning_rate": 3.343552088831878e-05, "loss": 0.195, "loss_nan_ranks": 0, "loss_rank_avg": 0.1027466282248497, "step": 1705, "valid_targets_mean": 7111.9, "valid_targets_min": 5192 }, { "epoch": 2.381615598885794, "grad_norm": 0.5040432860111047, "learning_rate": 3.338398853574411e-05, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.09895579516887665, "step": 1710, "valid_targets_mean": 5509.9, "valid_targets_min": 4790 }, { "epoch": 2.3885793871866294, "grad_norm": 1.1363379165814331, "learning_rate": 3.333229475783383e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.11968301236629486, "step": 1715, "valid_targets_mean": 1581.9, "valid_targets_min": 864 }, { "epoch": 2.3955431754874654, "grad_norm": 0.8698074566188687, "learning_rate": 3.3280440178070635e-05, "loss": 0.2104, "loss_nan_ranks": 0, "loss_rank_avg": 0.09715799242258072, "step": 1720, "valid_targets_mean": 1333.2, "valid_targets_min": 632 }, { "epoch": 2.402506963788301, "grad_norm": 0.8444689746099655, "learning_rate": 3.322842542187669e-05, "loss": 0.194, "loss_nan_ranks": 0, "loss_rank_avg": 0.10113231092691422, "step": 1725, "valid_targets_mean": 1602.9, "valid_targets_min": 875 }, { "epoch": 2.4094707520891365, "grad_norm": 1.1270431114328114, "learning_rate": 3.317625111660605e-05, "loss": 0.1921, "loss_nan_ranks": 0, "loss_rank_avg": 0.1020176112651825, "step": 1730, "valid_targets_mean": 1340.4, "valid_targets_min": 701 }, { "epoch": 2.416434540389972, "grad_norm": 0.7839393431669954, "learning_rate": 3.3123917891537085e-05, "loss": 0.1823, "loss_nan_ranks": 0, "loss_rank_avg": 0.11173247545957565, "step": 1735, "valid_targets_mean": 1792.9, "valid_targets_min": 898 }, { "epoch": 2.4233983286908076, "grad_norm": 0.7608101315047425, "learning_rate": 3.307142637786496e-05, "loss": 0.187, "loss_nan_ranks": 0, "loss_rank_avg": 0.09726438671350479, "step": 1740, "valid_targets_mean": 1433.1, "valid_targets_min": 1070 }, { "epoch": 2.4303621169916436, "grad_norm": 0.851244310222369, "learning_rate": 3.3018777208693916e-05, "loss": 0.1976, "loss_nan_ranks": 0, "loss_rank_avg": 0.10597909986972809, "step": 1745, "valid_targets_mean": 1589.5, "valid_targets_min": 970 }, { "epoch": 2.437325905292479, "grad_norm": 0.7562891748345674, "learning_rate": 3.2965971019029716e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.08589346706867218, "step": 1750, "valid_targets_mean": 1270.5, "valid_targets_min": 648 }, { "epoch": 2.4442896935933147, "grad_norm": 0.8072271025740217, "learning_rate": 3.291300844577196e-05, "loss": 0.2016, "loss_nan_ranks": 0, "loss_rank_avg": 0.1143551915884018, "step": 1755, "valid_targets_mean": 1674.5, "valid_targets_min": 727 }, { "epoch": 2.4512534818941503, "grad_norm": 0.8040766542030429, "learning_rate": 3.28598901277064e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.07331328094005585, "step": 1760, "valid_targets_mean": 1406.0, "valid_targets_min": 770 }, { "epoch": 2.4582172701949863, "grad_norm": 0.7600004146401925, "learning_rate": 3.280661670549723e-05, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.08032012730836868, "step": 1765, "valid_targets_mean": 1381.2, "valid_targets_min": 572 }, { "epoch": 2.465181058495822, "grad_norm": 0.8186128164361567, "learning_rate": 3.275318882167938e-05, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.11326928436756134, "step": 1770, "valid_targets_mean": 1580.4, "valid_targets_min": 633 }, { "epoch": 2.4721448467966574, "grad_norm": 0.7878473077583293, "learning_rate": 3.269960712065074e-05, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.09199025481939316, "step": 1775, "valid_targets_mean": 1478.8, "valid_targets_min": 923 }, { "epoch": 2.479108635097493, "grad_norm": 0.7408103486539382, "learning_rate": 3.264587224866442e-05, "loss": 0.1749, "loss_nan_ranks": 0, "loss_rank_avg": 0.08334987610578537, "step": 1780, "valid_targets_mean": 1401.0, "valid_targets_min": 740 }, { "epoch": 2.486072423398329, "grad_norm": 0.7785323575154897, "learning_rate": 3.2591984853820926e-05, "loss": 0.1769, "loss_nan_ranks": 0, "loss_rank_avg": 0.08059869706630707, "step": 1785, "valid_targets_mean": 1588.9, "valid_targets_min": 870 }, { "epoch": 2.4930362116991645, "grad_norm": 0.7501213652690097, "learning_rate": 3.2537945586060336e-05, "loss": 0.1766, "loss_nan_ranks": 0, "loss_rank_avg": 0.12979084253311157, "step": 1790, "valid_targets_mean": 2008.4, "valid_targets_min": 1042 }, { "epoch": 2.5, "grad_norm": 0.769300550573875, "learning_rate": 3.248375509715452e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.07505079358816147, "step": 1795, "valid_targets_mean": 1209.0, "valid_targets_min": 870 }, { "epoch": 2.5069637883008355, "grad_norm": 0.8297708977009772, "learning_rate": 3.242941404069921e-05, "loss": 0.1878, "loss_nan_ranks": 0, "loss_rank_avg": 0.09335260093212128, "step": 1800, "valid_targets_mean": 1535.5, "valid_targets_min": 740 }, { "epoch": 2.513927576601671, "grad_norm": 0.731844058605371, "learning_rate": 3.237492307210614e-05, "loss": 0.1882, "loss_nan_ranks": 0, "loss_rank_avg": 0.09308585524559021, "step": 1805, "valid_targets_mean": 1642.9, "valid_targets_min": 906 }, { "epoch": 2.520891364902507, "grad_norm": 0.8193149089522122, "learning_rate": 3.2320282848595174e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.09537345170974731, "step": 1810, "valid_targets_mean": 1570.5, "valid_targets_min": 814 }, { "epoch": 2.5278551532033426, "grad_norm": 0.8371651941131215, "learning_rate": 3.226549402918631e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.08008214086294174, "step": 1815, "valid_targets_mean": 1722.1, "valid_targets_min": 832 }, { "epoch": 2.534818941504178, "grad_norm": 0.7018441413273226, "learning_rate": 3.221055727469182e-05, "loss": 0.1831, "loss_nan_ranks": 0, "loss_rank_avg": 0.06970568746328354, "step": 1820, "valid_targets_mean": 1453.5, "valid_targets_min": 891 }, { "epoch": 2.541782729805014, "grad_norm": 0.7963146448093934, "learning_rate": 3.21554732477082e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.11181323230266571, "step": 1825, "valid_targets_mean": 1584.4, "valid_targets_min": 734 }, { "epoch": 2.5487465181058497, "grad_norm": 0.7592311759031534, "learning_rate": 3.2100242612608213e-05, "loss": 0.1705, "loss_nan_ranks": 0, "loss_rank_avg": 0.08187158405780792, "step": 1830, "valid_targets_mean": 1495.2, "valid_targets_min": 737 }, { "epoch": 2.5557103064066853, "grad_norm": 0.773359400074154, "learning_rate": 3.204486603553289e-05, "loss": 0.1799, "loss_nan_ranks": 0, "loss_rank_avg": 0.0989374965429306, "step": 1835, "valid_targets_mean": 1737.0, "valid_targets_min": 872 }, { "epoch": 2.562674094707521, "grad_norm": 0.7743236506768809, "learning_rate": 3.1989344184383476e-05, "loss": 0.173, "loss_nan_ranks": 0, "loss_rank_avg": 0.09391649067401886, "step": 1840, "valid_targets_mean": 1431.6, "valid_targets_min": 805 }, { "epoch": 2.5696378830083564, "grad_norm": 0.7358590006225955, "learning_rate": 3.1933677728813364e-05, "loss": 0.1816, "loss_nan_ranks": 0, "loss_rank_avg": 0.10584774613380432, "step": 1845, "valid_targets_mean": 2060.2, "valid_targets_min": 1253 }, { "epoch": 2.5766016713091924, "grad_norm": 0.7193105312572781, "learning_rate": 3.1877867340220045e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.10305032879114151, "step": 1850, "valid_targets_mean": 2063.9, "valid_targets_min": 1264 }, { "epoch": 2.583565459610028, "grad_norm": 0.7695266994780475, "learning_rate": 3.1821913691736995e-05, "loss": 0.1744, "loss_nan_ranks": 0, "loss_rank_avg": 0.0683041363954544, "step": 1855, "valid_targets_mean": 1036.5, "valid_targets_min": 613 }, { "epoch": 2.5905292479108635, "grad_norm": 0.7101389867132969, "learning_rate": 3.1765817458225546e-05, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.08477064967155457, "step": 1860, "valid_targets_mean": 1674.4, "valid_targets_min": 768 }, { "epoch": 2.597493036211699, "grad_norm": 0.8599774854634431, "learning_rate": 3.170957931626679e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.080399289727211, "step": 1865, "valid_targets_mean": 1249.8, "valid_targets_min": 714 }, { "epoch": 2.6044568245125346, "grad_norm": 0.7993028212492834, "learning_rate": 3.165319994415336e-05, "loss": 0.1842, "loss_nan_ranks": 0, "loss_rank_avg": 0.06606724113225937, "step": 1870, "valid_targets_mean": 1114.8, "valid_targets_min": 800 }, { "epoch": 2.6114206128133706, "grad_norm": 0.7781447333017487, "learning_rate": 3.159668002188128e-05, "loss": 0.175, "loss_nan_ranks": 0, "loss_rank_avg": 0.10036128759384155, "step": 1875, "valid_targets_mean": 1780.9, "valid_targets_min": 933 }, { "epoch": 2.618384401114206, "grad_norm": 0.8858832068872401, "learning_rate": 3.1540020231141774e-05, "loss": 0.1717, "loss_nan_ranks": 0, "loss_rank_avg": 0.07642105966806412, "step": 1880, "valid_targets_mean": 1113.6, "valid_targets_min": 746 }, { "epoch": 2.6253481894150417, "grad_norm": 0.8236948964912306, "learning_rate": 3.148322125531302e-05, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.09135651588439941, "step": 1885, "valid_targets_mean": 1265.0, "valid_targets_min": 814 }, { "epoch": 2.6323119777158777, "grad_norm": 0.7402380099739323, "learning_rate": 3.142628377945191e-05, "loss": 0.1751, "loss_nan_ranks": 0, "loss_rank_avg": 0.10815448313951492, "step": 1890, "valid_targets_mean": 1652.1, "valid_targets_min": 635 }, { "epoch": 2.639275766016713, "grad_norm": 0.7766341389183821, "learning_rate": 3.1369208490285824e-05, "loss": 0.173, "loss_nan_ranks": 0, "loss_rank_avg": 0.06988343596458435, "step": 1895, "valid_targets_mean": 1231.2, "valid_targets_min": 739 }, { "epoch": 2.6462395543175488, "grad_norm": 0.790490819348294, "learning_rate": 3.13119960762043e-05, "loss": 0.1739, "loss_nan_ranks": 0, "loss_rank_avg": 0.10846837610006332, "step": 1900, "valid_targets_mean": 1682.4, "valid_targets_min": 831 }, { "epoch": 2.6532033426183843, "grad_norm": 0.8701861923326255, "learning_rate": 3.125464722725074e-05, "loss": 0.1763, "loss_nan_ranks": 0, "loss_rank_avg": 0.08927632868289948, "step": 1905, "valid_targets_mean": 1571.6, "valid_targets_min": 1015 }, { "epoch": 2.66016713091922, "grad_norm": 0.7672559496303158, "learning_rate": 3.119716263511412e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.07645729184150696, "step": 1910, "valid_targets_mean": 1276.8, "valid_targets_min": 711 }, { "epoch": 2.667130919220056, "grad_norm": 0.7633251851517129, "learning_rate": 3.1139542993120615e-05, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.05591302365064621, "step": 1915, "valid_targets_mean": 1147.5, "valid_targets_min": 733 }, { "epoch": 2.6740947075208914, "grad_norm": 0.8548710751284283, "learning_rate": 3.108178899622524e-05, "loss": 0.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.11267301440238953, "step": 1920, "valid_targets_mean": 1604.0, "valid_targets_min": 953 }, { "epoch": 2.681058495821727, "grad_norm": 0.7154752716285275, "learning_rate": 3.102390134100349e-05, "loss": 0.183, "loss_nan_ranks": 0, "loss_rank_avg": 0.08892469853162766, "step": 1925, "valid_targets_mean": 1784.0, "valid_targets_min": 1011 }, { "epoch": 2.688022284122563, "grad_norm": 0.7886303529310777, "learning_rate": 3.096588072564291e-05, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.10861388593912125, "step": 1930, "valid_targets_mean": 1729.0, "valid_targets_min": 1143 }, { "epoch": 2.6949860724233985, "grad_norm": 0.7782781896814367, "learning_rate": 3.09077278499347e-05, "loss": 0.1723, "loss_nan_ranks": 0, "loss_rank_avg": 0.0805855244398117, "step": 1935, "valid_targets_mean": 1483.9, "valid_targets_min": 699 }, { "epoch": 2.701949860724234, "grad_norm": 0.7716708466878998, "learning_rate": 3.084944341526524e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.07467707991600037, "step": 1940, "valid_targets_mean": 1198.4, "valid_targets_min": 680 }, { "epoch": 2.7089136490250696, "grad_norm": 0.7956657891036718, "learning_rate": 3.079102812460769e-05, "loss": 0.1809, "loss_nan_ranks": 0, "loss_rank_avg": 0.08717083930969238, "step": 1945, "valid_targets_mean": 1365.2, "valid_targets_min": 687 }, { "epoch": 2.715877437325905, "grad_norm": 0.8040752534275205, "learning_rate": 3.0732482682513435e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.06229158490896225, "step": 1950, "valid_targets_mean": 1142.9, "valid_targets_min": 835 }, { "epoch": 2.722841225626741, "grad_norm": 0.7747436174550746, "learning_rate": 3.067380779510365e-05, "loss": 0.1672, "loss_nan_ranks": 0, "loss_rank_avg": 0.07470732927322388, "step": 1955, "valid_targets_mean": 1316.9, "valid_targets_min": 829 }, { "epoch": 2.7298050139275767, "grad_norm": 0.7825972178164834, "learning_rate": 3.061500417006076e-05, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.09210141003131866, "step": 1960, "valid_targets_mean": 1739.2, "valid_targets_min": 1138 }, { "epoch": 2.7367688022284122, "grad_norm": 0.696392311199642, "learning_rate": 3.0556072516619896e-05, "loss": 0.181, "loss_nan_ranks": 0, "loss_rank_avg": 0.07831001281738281, "step": 1965, "valid_targets_mean": 1592.2, "valid_targets_min": 1174 }, { "epoch": 2.743732590529248, "grad_norm": 0.7770652602858239, "learning_rate": 3.0497013545560354e-05, "loss": 0.1763, "loss_nan_ranks": 0, "loss_rank_avg": 0.08863939344882965, "step": 1970, "valid_targets_mean": 1543.1, "valid_targets_min": 554 }, { "epoch": 2.7506963788300833, "grad_norm": 0.7372103268972405, "learning_rate": 3.043782796919701e-05, "loss": 0.1711, "loss_nan_ranks": 0, "loss_rank_avg": 0.08466736972332001, "step": 1975, "valid_targets_mean": 1430.0, "valid_targets_min": 843 }, { "epoch": 2.7576601671309193, "grad_norm": 0.7288721894678064, "learning_rate": 3.0378516501371752e-05, "loss": 0.1694, "loss_nan_ranks": 0, "loss_rank_avg": 0.08267127722501755, "step": 1980, "valid_targets_mean": 1622.9, "valid_targets_min": 849 }, { "epoch": 2.764623955431755, "grad_norm": 0.819855661582502, "learning_rate": 3.0319079857444844e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.08106249570846558, "step": 1985, "valid_targets_mean": 1429.0, "valid_targets_min": 612 }, { "epoch": 2.7715877437325904, "grad_norm": 0.7552847804482032, "learning_rate": 3.0259518754286302e-05, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.07017084956169128, "step": 1990, "valid_targets_mean": 1283.0, "valid_targets_min": 782 }, { "epoch": 2.7785515320334264, "grad_norm": 0.8464332743776155, "learning_rate": 3.0199833910267286e-05, "loss": 0.1702, "loss_nan_ranks": 0, "loss_rank_avg": 0.09966123104095459, "step": 1995, "valid_targets_mean": 1457.0, "valid_targets_min": 926 }, { "epoch": 2.785515320334262, "grad_norm": 0.7123507198714567, "learning_rate": 3.0140026045251357e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.0700862854719162, "step": 2000, "valid_targets_mean": 1399.6, "valid_targets_min": 822 }, { "epoch": 2.7924791086350975, "grad_norm": 0.7070416875399016, "learning_rate": 3.0080095880585884e-05, "loss": 0.159, "loss_nan_ranks": 0, "loss_rank_avg": 0.07886691391468048, "step": 2005, "valid_targets_mean": 1464.6, "valid_targets_min": 670 }, { "epoch": 2.799442896935933, "grad_norm": 0.7839739267460378, "learning_rate": 3.002004413909326e-05, "loss": 0.1743, "loss_nan_ranks": 0, "loss_rank_avg": 0.08037430047988892, "step": 2010, "valid_targets_mean": 1504.8, "valid_targets_min": 647 }, { "epoch": 2.8064066852367686, "grad_norm": 0.7325386392599472, "learning_rate": 2.995987154506228e-05, "loss": 0.1702, "loss_nan_ranks": 0, "loss_rank_avg": 0.06354961544275284, "step": 2015, "valid_targets_mean": 1276.9, "valid_targets_min": 791 }, { "epoch": 2.8133704735376046, "grad_norm": 0.7963527637303378, "learning_rate": 2.98995788242393e-05, "loss": 0.1682, "loss_nan_ranks": 0, "loss_rank_avg": 0.07502847909927368, "step": 2020, "valid_targets_mean": 1291.4, "valid_targets_min": 746 }, { "epoch": 2.82033426183844, "grad_norm": 0.7325341255976993, "learning_rate": 2.9839166703819572e-05, "loss": 0.1698, "loss_nan_ranks": 0, "loss_rank_avg": 0.06790463626384735, "step": 2025, "valid_targets_mean": 1409.1, "valid_targets_min": 892 }, { "epoch": 2.8272980501392757, "grad_norm": 1.0267772645703437, "learning_rate": 2.97786359124384e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.10208472609519958, "step": 2030, "valid_targets_mean": 1581.9, "valid_targets_min": 914 }, { "epoch": 2.8342618384401113, "grad_norm": 0.7487266217807981, "learning_rate": 2.971798718016242e-05, "loss": 0.169, "loss_nan_ranks": 0, "loss_rank_avg": 0.07919836044311523, "step": 2035, "valid_targets_mean": 1647.6, "valid_targets_min": 636 }, { "epoch": 2.841225626740947, "grad_norm": 0.9158258240874332, "learning_rate": 2.9657221238480746e-05, "loss": 0.1687, "loss_nan_ranks": 0, "loss_rank_avg": 0.0867113322019577, "step": 2040, "valid_targets_mean": 1523.5, "valid_targets_min": 641 }, { "epoch": 2.848189415041783, "grad_norm": 0.8495953544791401, "learning_rate": 2.9596338820296163e-05, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.09921315312385559, "step": 2045, "valid_targets_mean": 1629.4, "valid_targets_min": 1020 }, { "epoch": 2.8551532033426184, "grad_norm": 1.1190071551544958, "learning_rate": 2.953534065991631e-05, "loss": 0.1744, "loss_nan_ranks": 0, "loss_rank_avg": 0.08030430972576141, "step": 2050, "valid_targets_mean": 1163.4, "valid_targets_min": 729 }, { "epoch": 2.862116991643454, "grad_norm": 0.7607775978376603, "learning_rate": 2.947422749304476e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.10393047332763672, "step": 2055, "valid_targets_mean": 1613.2, "valid_targets_min": 1001 }, { "epoch": 2.86908077994429, "grad_norm": 0.783991662666305, "learning_rate": 2.9413000056772225e-05, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.0888073593378067, "step": 2060, "valid_targets_mean": 1567.0, "valid_targets_min": 1175 }, { "epoch": 2.8760445682451254, "grad_norm": 0.7826353186492123, "learning_rate": 2.9351659089567622e-05, "loss": 0.1756, "loss_nan_ranks": 0, "loss_rank_avg": 0.10893246531486511, "step": 2065, "valid_targets_mean": 1609.0, "valid_targets_min": 892 }, { "epoch": 2.883008356545961, "grad_norm": 0.7934696501334912, "learning_rate": 2.9290205331269158e-05, "loss": 0.1759, "loss_nan_ranks": 0, "loss_rank_avg": 0.08275732398033142, "step": 2070, "valid_targets_mean": 1425.2, "valid_targets_min": 801 }, { "epoch": 2.8899721448467965, "grad_norm": 0.7172842896059596, "learning_rate": 2.9228639523075432e-05, "loss": 0.1621, "loss_nan_ranks": 0, "loss_rank_avg": 0.08390860259532928, "step": 2075, "valid_targets_mean": 1462.4, "valid_targets_min": 564 }, { "epoch": 2.896935933147632, "grad_norm": 0.8356533188243083, "learning_rate": 2.9166962407536496e-05, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.08387964218854904, "step": 2080, "valid_targets_mean": 1749.1, "valid_targets_min": 651 }, { "epoch": 2.903899721448468, "grad_norm": 0.780853509813084, "learning_rate": 2.910517472854487e-05, "loss": 0.1763, "loss_nan_ranks": 0, "loss_rank_avg": 0.07162684202194214, "step": 2085, "valid_targets_mean": 1161.0, "valid_targets_min": 716 }, { "epoch": 2.9108635097493036, "grad_norm": 0.7403317269239412, "learning_rate": 2.9043277231326606e-05, "loss": 0.1673, "loss_nan_ranks": 0, "loss_rank_avg": 0.08211035281419754, "step": 2090, "valid_targets_mean": 1425.6, "valid_targets_min": 744 }, { "epoch": 2.917827298050139, "grad_norm": 0.7512823712045082, "learning_rate": 2.8981270662432258e-05, "loss": 0.1617, "loss_nan_ranks": 0, "loss_rank_avg": 0.0736178457736969, "step": 2095, "valid_targets_mean": 1391.1, "valid_targets_min": 1218 }, { "epoch": 2.924791086350975, "grad_norm": 0.8217643276597543, "learning_rate": 2.8919155769727932e-05, "loss": 0.1685, "loss_nan_ranks": 0, "loss_rank_avg": 0.09656500816345215, "step": 2100, "valid_targets_mean": 1724.5, "valid_targets_min": 793 }, { "epoch": 2.9317548746518107, "grad_norm": 0.7855411813191986, "learning_rate": 2.8856933302386224e-05, "loss": 0.1823, "loss_nan_ranks": 0, "loss_rank_avg": 0.07395291328430176, "step": 2105, "valid_targets_mean": 1366.8, "valid_targets_min": 846 }, { "epoch": 2.9387186629526463, "grad_norm": 0.9080574970183085, "learning_rate": 2.879460401087718e-05, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.09661687910556793, "step": 2110, "valid_targets_mean": 1772.1, "valid_targets_min": 979 }, { "epoch": 2.945682451253482, "grad_norm": 0.7185745540261005, "learning_rate": 2.873216864695928e-05, "loss": 0.1714, "loss_nan_ranks": 0, "loss_rank_avg": 0.09203220903873444, "step": 2115, "valid_targets_mean": 1778.9, "valid_targets_min": 1093 }, { "epoch": 2.9526462395543174, "grad_norm": 0.8058469860251909, "learning_rate": 2.8669627963670348e-05, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.0805043950676918, "step": 2120, "valid_targets_mean": 1510.8, "valid_targets_min": 595 }, { "epoch": 2.9596100278551534, "grad_norm": 0.8161844468728507, "learning_rate": 2.8606982715318467e-05, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.08108193427324295, "step": 2125, "valid_targets_mean": 1330.4, "valid_targets_min": 868 }, { "epoch": 2.966573816155989, "grad_norm": 0.8048088395167377, "learning_rate": 2.8544233657472893e-05, "loss": 0.168, "loss_nan_ranks": 0, "loss_rank_avg": 0.10407143086194992, "step": 2130, "valid_targets_mean": 1504.2, "valid_targets_min": 914 }, { "epoch": 2.9735376044568245, "grad_norm": 0.7696287813690902, "learning_rate": 2.8481381546954944e-05, "loss": 0.1713, "loss_nan_ranks": 0, "loss_rank_avg": 0.10349928587675095, "step": 2135, "valid_targets_mean": 1972.9, "valid_targets_min": 1080 }, { "epoch": 2.98050139275766, "grad_norm": 0.7248553330646451, "learning_rate": 2.8418427141828836e-05, "loss": 0.1721, "loss_nan_ranks": 0, "loss_rank_avg": 0.08698803186416626, "step": 2140, "valid_targets_mean": 1519.6, "valid_targets_min": 658 }, { "epoch": 2.9874651810584956, "grad_norm": 0.8081002064785113, "learning_rate": 2.835537120139261e-05, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.07442046701908112, "step": 2145, "valid_targets_mean": 1362.0, "valid_targets_min": 1018 }, { "epoch": 2.9944289693593316, "grad_norm": 0.7441884200422766, "learning_rate": 2.8292214486168887e-05, "loss": 0.1812, "loss_nan_ranks": 0, "loss_rank_avg": 0.1013420969247818, "step": 2150, "valid_targets_mean": 1623.0, "valid_targets_min": 1041 }, { "epoch": 3.001392757660167, "grad_norm": 0.582670213892772, "learning_rate": 2.8228957757895787e-05, "loss": 0.1756, "loss_nan_ranks": 0, "loss_rank_avg": 0.10588406026363373, "step": 2155, "valid_targets_mean": 8215.2, "valid_targets_min": 6163 }, { "epoch": 3.0083565459610027, "grad_norm": 0.45807589528981335, "learning_rate": 2.816560177951765e-05, "loss": 0.214, "loss_nan_ranks": 0, "loss_rank_avg": 0.10979750752449036, "step": 2160, "valid_targets_mean": 8594.4, "valid_targets_min": 6006 }, { "epoch": 3.0153203342618387, "grad_norm": 0.5425898684830011, "learning_rate": 2.810214731517592e-05, "loss": 0.2073, "loss_nan_ranks": 0, "loss_rank_avg": 0.0921827107667923, "step": 2165, "valid_targets_mean": 3578.4, "valid_targets_min": 289 }, { "epoch": 3.022284122562674, "grad_norm": 0.41010535238599494, "learning_rate": 2.8038595130199846e-05, "loss": 0.2047, "loss_nan_ranks": 0, "loss_rank_avg": 0.10162421315908432, "step": 2170, "valid_targets_mean": 7019.9, "valid_targets_min": 4985 }, { "epoch": 3.0292479108635098, "grad_norm": 0.408252787870625, "learning_rate": 2.7974945991097343e-05, "loss": 0.1902, "loss_nan_ranks": 0, "loss_rank_avg": 0.09866312146186829, "step": 2175, "valid_targets_mean": 6956.6, "valid_targets_min": 1457 }, { "epoch": 3.0362116991643453, "grad_norm": 0.376422224239574, "learning_rate": 2.791120066554565e-05, "loss": 0.1963, "loss_nan_ranks": 0, "loss_rank_avg": 0.09282627701759338, "step": 2180, "valid_targets_mean": 7361.6, "valid_targets_min": 4961 }, { "epoch": 3.043175487465181, "grad_norm": 0.4174310411579024, "learning_rate": 2.7847359922382154e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.12435085326433182, "step": 2185, "valid_targets_mean": 7058.5, "valid_targets_min": 5985 }, { "epoch": 3.050139275766017, "grad_norm": 0.40649864588422974, "learning_rate": 2.7783424531595057e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.11022967100143433, "step": 2190, "valid_targets_mean": 7664.2, "valid_targets_min": 5169 }, { "epoch": 3.0571030640668524, "grad_norm": 0.3894067905652123, "learning_rate": 2.7719395264314125e-05, "loss": 0.1931, "loss_nan_ranks": 0, "loss_rank_avg": 0.09706021845340729, "step": 2195, "valid_targets_mean": 7111.8, "valid_targets_min": 5348 }, { "epoch": 3.064066852367688, "grad_norm": 0.4571915199208844, "learning_rate": 2.7655272892801376e-05, "loss": 0.1844, "loss_nan_ranks": 0, "loss_rank_avg": 0.0859590619802475, "step": 2200, "valid_targets_mean": 4238.9, "valid_targets_min": 152 }, { "epoch": 3.0710306406685235, "grad_norm": 0.442146850622646, "learning_rate": 2.7591058190441754e-05, "loss": 0.1868, "loss_nan_ranks": 0, "loss_rank_avg": 0.0988345593214035, "step": 2205, "valid_targets_mean": 7199.4, "valid_targets_min": 4258 }, { "epoch": 3.0779944289693595, "grad_norm": 0.3888970877948061, "learning_rate": 2.7526751931733824e-05, "loss": 0.1931, "loss_nan_ranks": 0, "loss_rank_avg": 0.09356151521205902, "step": 2210, "valid_targets_mean": 7243.4, "valid_targets_min": 5831 }, { "epoch": 3.084958217270195, "grad_norm": 0.3880326891417797, "learning_rate": 2.7462354892280428e-05, "loss": 0.1894, "loss_nan_ranks": 0, "loss_rank_avg": 0.09559017419815063, "step": 2215, "valid_targets_mean": 6950.6, "valid_targets_min": 3862 }, { "epoch": 3.0919220055710306, "grad_norm": 0.38716280782428913, "learning_rate": 2.7397867848779296e-05, "loss": 0.1883, "loss_nan_ranks": 0, "loss_rank_avg": 0.10002546012401581, "step": 2220, "valid_targets_mean": 6991.9, "valid_targets_min": 5696 }, { "epoch": 3.098885793871866, "grad_norm": 0.3892772405020075, "learning_rate": 2.733329157901373e-05, "loss": 0.1829, "loss_nan_ranks": 0, "loss_rank_avg": 0.1018202155828476, "step": 2225, "valid_targets_mean": 6963.5, "valid_targets_min": 4947 }, { "epoch": 3.105849582172702, "grad_norm": 0.3954300382500997, "learning_rate": 2.7268626861843176e-05, "loss": 0.1871, "loss_nan_ranks": 0, "loss_rank_avg": 0.08901640772819519, "step": 2230, "valid_targets_mean": 6436.9, "valid_targets_min": 4988 }, { "epoch": 3.1128133704735377, "grad_norm": 0.38253440455307475, "learning_rate": 2.7203874477193867e-05, "loss": 0.1905, "loss_nan_ranks": 0, "loss_rank_avg": 0.09357216954231262, "step": 2235, "valid_targets_mean": 7518.0, "valid_targets_min": 5476 }, { "epoch": 3.1197771587743732, "grad_norm": 0.37760495023063456, "learning_rate": 2.7139035206049392e-05, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.0883115828037262, "step": 2240, "valid_targets_mean": 7422.6, "valid_targets_min": 5226 }, { "epoch": 3.1267409470752088, "grad_norm": 0.4492359216101069, "learning_rate": 2.707410983044128e-05, "loss": 0.1991, "loss_nan_ranks": 0, "loss_rank_avg": 0.12339232116937637, "step": 2245, "valid_targets_mean": 7080.0, "valid_targets_min": 3753 }, { "epoch": 3.1337047353760448, "grad_norm": 0.478752949833473, "learning_rate": 2.7009099133439588e-05, "loss": 0.2132, "loss_nan_ranks": 0, "loss_rank_avg": 0.10847386717796326, "step": 2250, "valid_targets_mean": 6064.6, "valid_targets_min": 5161 }, { "epoch": 3.1406685236768803, "grad_norm": 0.41876052780288764, "learning_rate": 2.6944003899143424e-05, "loss": 0.1624, "loss_nan_ranks": 0, "loss_rank_avg": 0.09066791832447052, "step": 2255, "valid_targets_mean": 7388.1, "valid_targets_min": 5795 }, { "epoch": 3.147632311977716, "grad_norm": 0.4035596406534088, "learning_rate": 2.6878824912671526e-05, "loss": 0.1802, "loss_nan_ranks": 0, "loss_rank_avg": 0.0864686593413353, "step": 2260, "valid_targets_mean": 7696.0, "valid_targets_min": 4658 }, { "epoch": 3.1545961002785514, "grad_norm": 0.3924938647790918, "learning_rate": 2.6813562960152754e-05, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.10020910203456879, "step": 2265, "valid_targets_mean": 7799.1, "valid_targets_min": 5508 }, { "epoch": 3.1615598885793874, "grad_norm": 0.39783779066844704, "learning_rate": 2.6748218828716637e-05, "loss": 0.1947, "loss_nan_ranks": 0, "loss_rank_avg": 0.0940442681312561, "step": 2270, "valid_targets_mean": 7341.6, "valid_targets_min": 6454 }, { "epoch": 3.168523676880223, "grad_norm": 0.40685251066765943, "learning_rate": 2.6682793306483875e-05, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.08199045807123184, "step": 2275, "valid_targets_mean": 6818.0, "valid_targets_min": 4392 }, { "epoch": 3.1754874651810585, "grad_norm": 0.3774943376487801, "learning_rate": 2.6617287182556818e-05, "loss": 0.1872, "loss_nan_ranks": 0, "loss_rank_avg": 0.08261384814977646, "step": 2280, "valid_targets_mean": 7857.6, "valid_targets_min": 5394 }, { "epoch": 3.182451253481894, "grad_norm": 0.3962509851654937, "learning_rate": 2.6551701247009974e-05, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.07782858610153198, "step": 2285, "valid_targets_mean": 8314.1, "valid_targets_min": 4837 }, { "epoch": 3.1894150417827296, "grad_norm": 0.3805935986013425, "learning_rate": 2.6486036290880447e-05, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.07052335143089294, "step": 2290, "valid_targets_mean": 7368.2, "valid_targets_min": 6027 }, { "epoch": 3.1963788300835656, "grad_norm": 0.4494256622684818, "learning_rate": 2.6420293106158425e-05, "loss": 0.1742, "loss_nan_ranks": 0, "loss_rank_avg": 0.09394653886556625, "step": 2295, "valid_targets_mean": 6435.0, "valid_targets_min": 4238 }, { "epoch": 3.203342618384401, "grad_norm": 1.3891357549119348, "learning_rate": 2.6354472485777627e-05, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.05725764483213425, "step": 2300, "valid_targets_mean": 247.8, "valid_targets_min": 137 }, { "epoch": 3.2103064066852367, "grad_norm": 0.44440730067879897, "learning_rate": 2.6288575223605703e-05, "loss": 0.1942, "loss_nan_ranks": 0, "loss_rank_avg": 0.09099040925502777, "step": 2305, "valid_targets_mean": 6807.0, "valid_targets_min": 5165 }, { "epoch": 3.2172701949860723, "grad_norm": 0.47854206372685043, "learning_rate": 2.622260211443471e-05, "loss": 0.2009, "loss_nan_ranks": 0, "loss_rank_avg": 0.10358612984418869, "step": 2310, "valid_targets_mean": 6989.9, "valid_targets_min": 5104 }, { "epoch": 3.2242339832869082, "grad_norm": 0.40218643285685773, "learning_rate": 2.615655395397149e-05, "loss": 0.1964, "loss_nan_ranks": 0, "loss_rank_avg": 0.10578115284442902, "step": 2315, "valid_targets_mean": 6692.2, "valid_targets_min": 5068 }, { "epoch": 3.231197771587744, "grad_norm": 0.4823984099669414, "learning_rate": 2.6090431538828095e-05, "loss": 0.1926, "loss_nan_ranks": 0, "loss_rank_avg": 0.11674507707357407, "step": 2320, "valid_targets_mean": 7419.6, "valid_targets_min": 5578 }, { "epoch": 3.2381615598885793, "grad_norm": 0.3808006367102266, "learning_rate": 2.6024235666512154e-05, "loss": 0.1855, "loss_nan_ranks": 0, "loss_rank_avg": 0.09444583207368851, "step": 2325, "valid_targets_mean": 7536.5, "valid_targets_min": 5075 }, { "epoch": 3.245125348189415, "grad_norm": 0.3735886845835376, "learning_rate": 2.5957967135417272e-05, "loss": 0.1931, "loss_nan_ranks": 0, "loss_rank_avg": 0.08822908252477646, "step": 2330, "valid_targets_mean": 7221.5, "valid_targets_min": 5841 }, { "epoch": 3.252089136490251, "grad_norm": 0.38530492214279993, "learning_rate": 2.5891626744813413e-05, "loss": 0.1871, "loss_nan_ranks": 0, "loss_rank_avg": 0.0928116887807846, "step": 2335, "valid_targets_mean": 7287.5, "valid_targets_min": 5151 }, { "epoch": 3.2590529247910864, "grad_norm": 0.431169270507617, "learning_rate": 2.5825215294837213e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.09144345670938492, "step": 2340, "valid_targets_mean": 6738.4, "valid_targets_min": 4042 }, { "epoch": 3.266016713091922, "grad_norm": 0.42057933866822494, "learning_rate": 2.5758733586482402e-05, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.10509088635444641, "step": 2345, "valid_targets_mean": 6331.0, "valid_targets_min": 5496 }, { "epoch": 3.2729805013927575, "grad_norm": 0.43887987652105004, "learning_rate": 2.5692182421590062e-05, "loss": 0.1905, "loss_nan_ranks": 0, "loss_rank_avg": 0.0931042730808258, "step": 2350, "valid_targets_mean": 6271.1, "valid_targets_min": 4695 }, { "epoch": 3.279944289693593, "grad_norm": 0.6506631337130584, "learning_rate": 2.5625562602839024e-05, "loss": 0.1902, "loss_nan_ranks": 0, "loss_rank_avg": 0.09925953298807144, "step": 2355, "valid_targets_mean": 5790.8, "valid_targets_min": 5021 }, { "epoch": 3.286908077994429, "grad_norm": 0.5048077739195413, "learning_rate": 2.555887493373614e-05, "loss": 0.1813, "loss_nan_ranks": 0, "loss_rank_avg": 0.07177004218101501, "step": 2360, "valid_targets_mean": 3386.8, "valid_targets_min": 2279 }, { "epoch": 3.2938718662952646, "grad_norm": 0.6120098262207729, "learning_rate": 2.549212021860662e-05, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.09277001023292542, "step": 2365, "valid_targets_mean": 6240.5, "valid_targets_min": 5093 }, { "epoch": 3.3008356545961, "grad_norm": 0.7108808669473043, "learning_rate": 2.542529926258433e-05, "loss": 0.1864, "loss_nan_ranks": 0, "loss_rank_avg": 0.09597060084342957, "step": 2370, "valid_targets_mean": 6329.5, "valid_targets_min": 4589 }, { "epoch": 3.307799442896936, "grad_norm": 0.3884309764014742, "learning_rate": 2.5358412871602046e-05, "loss": 0.1842, "loss_nan_ranks": 0, "loss_rank_avg": 0.0994221642613411, "step": 2375, "valid_targets_mean": 7589.2, "valid_targets_min": 4963 }, { "epoch": 3.3147632311977717, "grad_norm": 0.43936327155895843, "learning_rate": 2.5291461852381788e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.07934075593948364, "step": 2380, "valid_targets_mean": 5577.9, "valid_targets_min": 4458 }, { "epoch": 3.3217270194986073, "grad_norm": 0.4459328442427666, "learning_rate": 2.522444701242505e-05, "loss": 0.184, "loss_nan_ranks": 0, "loss_rank_avg": 0.0892050564289093, "step": 2385, "valid_targets_mean": 5432.5, "valid_targets_min": 4433 }, { "epoch": 3.328690807799443, "grad_norm": 0.5161665476844713, "learning_rate": 2.5157369160003066e-05, "loss": 0.1883, "loss_nan_ranks": 0, "loss_rank_avg": 0.09683055430650711, "step": 2390, "valid_targets_mean": 6361.8, "valid_targets_min": 5201 }, { "epoch": 3.3356545961002784, "grad_norm": 0.45408075599291947, "learning_rate": 2.509022910414708e-05, "loss": 0.1913, "loss_nan_ranks": 0, "loss_rank_avg": 0.08833605796098709, "step": 2395, "valid_targets_mean": 5824.4, "valid_targets_min": 5129 }, { "epoch": 3.3426183844011144, "grad_norm": 0.7702050101973215, "learning_rate": 2.5023027654638576e-05, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.10458929091691971, "step": 2400, "valid_targets_mean": 1637.6, "valid_targets_min": 137 }, { "epoch": 3.34958217270195, "grad_norm": 0.4785675018453149, "learning_rate": 2.4955765621999505e-05, "loss": 0.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.09321224689483643, "step": 2405, "valid_targets_mean": 6474.6, "valid_targets_min": 4751 }, { "epoch": 3.3565459610027855, "grad_norm": 0.413066098207994, "learning_rate": 2.4888443817482517e-05, "loss": 0.1821, "loss_nan_ranks": 0, "loss_rank_avg": 0.10013020038604736, "step": 2410, "valid_targets_mean": 7186.2, "valid_targets_min": 5358 }, { "epoch": 3.363509749303621, "grad_norm": 0.3906129731653948, "learning_rate": 2.4821063053061184e-05, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.09480290114879608, "step": 2415, "valid_targets_mean": 7126.8, "valid_targets_min": 4078 }, { "epoch": 3.370473537604457, "grad_norm": 0.45841696400076865, "learning_rate": 2.4753624141420182e-05, "loss": 0.1811, "loss_nan_ranks": 0, "loss_rank_avg": 0.09096138924360275, "step": 2420, "valid_targets_mean": 7022.1, "valid_targets_min": 4940 }, { "epoch": 3.3774373259052926, "grad_norm": 0.4351904530245512, "learning_rate": 2.4686127895945517e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.09502632170915604, "step": 2425, "valid_targets_mean": 5900.6, "valid_targets_min": 4779 }, { "epoch": 3.384401114206128, "grad_norm": 0.47258906281645247, "learning_rate": 2.4618575130714707e-05, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.09541469812393188, "step": 2430, "valid_targets_mean": 6290.1, "valid_targets_min": 4620 }, { "epoch": 3.3913649025069637, "grad_norm": 0.886229632768184, "learning_rate": 2.4550966660486944e-05, "loss": 0.1915, "loss_nan_ranks": 0, "loss_rank_avg": 0.07395320385694504, "step": 2435, "valid_targets_mean": 1162.2, "valid_targets_min": 788 }, { "epoch": 3.3983286908077996, "grad_norm": 0.7835854833673302, "learning_rate": 2.4483303300693296e-05, "loss": 0.1761, "loss_nan_ranks": 0, "loss_rank_avg": 0.08432234823703766, "step": 2440, "valid_targets_mean": 1500.6, "valid_targets_min": 957 }, { "epoch": 3.405292479108635, "grad_norm": 0.7364784582289423, "learning_rate": 2.4415585867426854e-05, "loss": 0.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.07511076331138611, "step": 2445, "valid_targets_mean": 1371.2, "valid_targets_min": 796 }, { "epoch": 3.4122562674094707, "grad_norm": 0.9103744401835016, "learning_rate": 2.434781517743289e-05, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.09593386203050613, "step": 2450, "valid_targets_mean": 1433.6, "valid_targets_min": 697 }, { "epoch": 3.4192200557103063, "grad_norm": 0.7736223123121384, "learning_rate": 2.4279992048099016e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.07917076349258423, "step": 2455, "valid_targets_mean": 1578.9, "valid_targets_min": 638 }, { "epoch": 3.426183844011142, "grad_norm": 0.7034601262769054, "learning_rate": 2.4212117297445307e-05, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.07970526069402695, "step": 2460, "valid_targets_mean": 1746.4, "valid_targets_min": 727 }, { "epoch": 3.433147632311978, "grad_norm": 0.7382178076531261, "learning_rate": 2.4144191744114457e-05, "loss": 0.1698, "loss_nan_ranks": 0, "loss_rank_avg": 0.06873296201229095, "step": 2465, "valid_targets_mean": 1309.9, "valid_targets_min": 761 }, { "epoch": 3.4401114206128134, "grad_norm": 0.8425832615711547, "learning_rate": 2.4076216207361904e-05, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.09206151962280273, "step": 2470, "valid_targets_mean": 1368.6, "valid_targets_min": 714 }, { "epoch": 3.447075208913649, "grad_norm": 0.8395407250078996, "learning_rate": 2.4008191507045913e-05, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.08047881722450256, "step": 2475, "valid_targets_mean": 1491.8, "valid_targets_min": 867 }, { "epoch": 3.4540389972144845, "grad_norm": 0.7755881495928278, "learning_rate": 2.3940118463617745e-05, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.09353938698768616, "step": 2480, "valid_targets_mean": 1994.0, "valid_targets_min": 790 }, { "epoch": 3.4610027855153205, "grad_norm": 0.7814533436270437, "learning_rate": 2.3871997898111707e-05, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.08098438382148743, "step": 2485, "valid_targets_mean": 1523.4, "valid_targets_min": 896 }, { "epoch": 3.467966573816156, "grad_norm": 0.8288270044083298, "learning_rate": 2.3803830632135284e-05, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.08329111337661743, "step": 2490, "valid_targets_mean": 1790.1, "valid_targets_min": 1009 }, { "epoch": 3.4749303621169916, "grad_norm": 0.7061032285936508, "learning_rate": 2.3735617487859224e-05, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.06442536413669586, "step": 2495, "valid_targets_mean": 1394.0, "valid_targets_min": 717 }, { "epoch": 3.481894150417827, "grad_norm": 0.9020364718977384, "learning_rate": 2.3667359288007612e-05, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.06079908832907677, "step": 2500, "valid_targets_mean": 1129.0, "valid_targets_min": 659 }, { "epoch": 3.488857938718663, "grad_norm": 0.7566586323370277, "learning_rate": 2.3599056855847937e-05, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.07075653970241547, "step": 2505, "valid_targets_mean": 1466.9, "valid_targets_min": 642 }, { "epoch": 3.4958217270194987, "grad_norm": 0.7734326889825535, "learning_rate": 2.353071101518121e-05, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.054345741868019104, "step": 2510, "valid_targets_mean": 1129.4, "valid_targets_min": 765 }, { "epoch": 3.502785515320334, "grad_norm": 0.804981371612974, "learning_rate": 2.346232259033196e-05, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.07415035367012024, "step": 2515, "valid_targets_mean": 1322.8, "valid_targets_min": 631 }, { "epoch": 3.5097493036211698, "grad_norm": 0.9012347000535628, "learning_rate": 2.3393892406138354e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.09443515539169312, "step": 2520, "valid_targets_mean": 1612.0, "valid_targets_min": 623 }, { "epoch": 3.5167130919220053, "grad_norm": 0.8529475358392916, "learning_rate": 2.332542128794221e-05, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.060877248644828796, "step": 2525, "valid_targets_mean": 1402.1, "valid_targets_min": 940 }, { "epoch": 3.5236768802228413, "grad_norm": 0.7346114867964298, "learning_rate": 2.325691006157905e-05, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.06927518546581268, "step": 2530, "valid_targets_mean": 1337.8, "valid_targets_min": 776 }, { "epoch": 3.530640668523677, "grad_norm": 0.7848390780850379, "learning_rate": 2.3188359553368157e-05, "loss": 0.1593, "loss_nan_ranks": 0, "loss_rank_avg": 0.08660085499286652, "step": 2535, "valid_targets_mean": 1525.5, "valid_targets_min": 623 }, { "epoch": 3.5376044568245124, "grad_norm": 0.7918791101050114, "learning_rate": 2.3119770590102585e-05, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.08223545551300049, "step": 2540, "valid_targets_mean": 1441.0, "valid_targets_min": 693 }, { "epoch": 3.5445682451253484, "grad_norm": 0.9253216126700171, "learning_rate": 2.3051143999039198e-05, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.042962588369846344, "step": 2545, "valid_targets_mean": 847.9, "valid_targets_min": 611 }, { "epoch": 3.551532033426184, "grad_norm": 0.8194995897407035, "learning_rate": 2.2982480607888693e-05, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.07983898371458054, "step": 2550, "valid_targets_mean": 1524.9, "valid_targets_min": 793 }, { "epoch": 3.5584958217270195, "grad_norm": 0.7123126085956808, "learning_rate": 2.291378124480563e-05, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.08361306041479111, "step": 2555, "valid_targets_mean": 1779.4, "valid_targets_min": 563 }, { "epoch": 3.565459610027855, "grad_norm": 0.7375463773516223, "learning_rate": 2.284504673837839e-05, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.08410098403692245, "step": 2560, "valid_targets_mean": 1741.2, "valid_targets_min": 1341 }, { "epoch": 3.5724233983286906, "grad_norm": 0.813717402129795, "learning_rate": 2.277627791761927e-05, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.0976366251707077, "step": 2565, "valid_targets_mean": 1875.6, "valid_targets_min": 1107 }, { "epoch": 3.5793871866295266, "grad_norm": 0.7638558548512067, "learning_rate": 2.270747561195441e-05, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.07316169142723083, "step": 2570, "valid_targets_mean": 1419.5, "valid_targets_min": 680 }, { "epoch": 3.586350974930362, "grad_norm": 0.7546648374433426, "learning_rate": 2.2638640651213804e-05, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.10009348392486572, "step": 2575, "valid_targets_mean": 1968.2, "valid_targets_min": 981 }, { "epoch": 3.5933147632311977, "grad_norm": 0.8517766302015852, "learning_rate": 2.2569773865621324e-05, "loss": 0.1528, "loss_nan_ranks": 0, "loss_rank_avg": 0.07636626064777374, "step": 2580, "valid_targets_mean": 1568.9, "valid_targets_min": 937 }, { "epoch": 3.6002785515320337, "grad_norm": 0.8067654097110404, "learning_rate": 2.2500876085784665e-05, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.08284150809049606, "step": 2585, "valid_targets_mean": 1645.2, "valid_targets_min": 804 }, { "epoch": 3.6072423398328692, "grad_norm": 0.7691207000641539, "learning_rate": 2.2431948142685352e-05, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.07658159732818604, "step": 2590, "valid_targets_mean": 1574.9, "valid_targets_min": 1019 }, { "epoch": 3.614206128133705, "grad_norm": 0.7783596723806455, "learning_rate": 2.236299086766873e-05, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.06561608612537384, "step": 2595, "valid_targets_mean": 1121.6, "valid_targets_min": 882 }, { "epoch": 3.6211699164345403, "grad_norm": 0.7775958409848589, "learning_rate": 2.2294005092433887e-05, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.08176523447036743, "step": 2600, "valid_targets_mean": 1818.1, "valid_targets_min": 1168 }, { "epoch": 3.628133704735376, "grad_norm": 0.828811804727648, "learning_rate": 2.2224991649023675e-05, "loss": 0.141, "loss_nan_ranks": 0, "loss_rank_avg": 0.07202639430761337, "step": 2605, "valid_targets_mean": 1417.8, "valid_targets_min": 678 }, { "epoch": 3.635097493036212, "grad_norm": 0.8282689257518919, "learning_rate": 2.2155951369814644e-05, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.058761902153491974, "step": 2610, "valid_targets_mean": 1051.0, "valid_targets_min": 676 }, { "epoch": 3.6420612813370474, "grad_norm": 1.7079878973692406, "learning_rate": 2.2086885087507027e-05, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.06798002123832703, "step": 2615, "valid_targets_mean": 1431.1, "valid_targets_min": 794 }, { "epoch": 3.649025069637883, "grad_norm": 0.7717379455457729, "learning_rate": 2.2017793635114667e-05, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.07599664479494095, "step": 2620, "valid_targets_mean": 1486.9, "valid_targets_min": 742 }, { "epoch": 3.6559888579387185, "grad_norm": 0.7698310794801155, "learning_rate": 2.1948677845954985e-05, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.08982954919338226, "step": 2625, "valid_targets_mean": 1734.5, "valid_targets_min": 741 }, { "epoch": 3.662952646239554, "grad_norm": 0.8944739797043322, "learning_rate": 2.1879538553638942e-05, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.09024101495742798, "step": 2630, "valid_targets_mean": 1712.5, "valid_targets_min": 1157 }, { "epoch": 3.66991643454039, "grad_norm": 0.7894287756846752, "learning_rate": 2.1810376592060968e-05, "loss": 0.1405, "loss_nan_ranks": 0, "loss_rank_avg": 0.09558722376823425, "step": 2635, "valid_targets_mean": 1723.8, "valid_targets_min": 862 }, { "epoch": 3.6768802228412256, "grad_norm": 0.8796292419764679, "learning_rate": 2.174119279538891e-05, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.09259238839149475, "step": 2640, "valid_targets_mean": 1633.1, "valid_targets_min": 1019 }, { "epoch": 3.683844011142061, "grad_norm": 0.7361323056285416, "learning_rate": 2.1671987998053954e-05, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.0679299384355545, "step": 2645, "valid_targets_mean": 1376.1, "valid_targets_min": 1058 }, { "epoch": 3.690807799442897, "grad_norm": 0.7916992537280872, "learning_rate": 2.16027630347406e-05, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.08028727769851685, "step": 2650, "valid_targets_mean": 1576.5, "valid_targets_min": 618 }, { "epoch": 3.6977715877437327, "grad_norm": 0.8165492508178849, "learning_rate": 2.1533518740376557e-05, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.0871560126543045, "step": 2655, "valid_targets_mean": 1615.8, "valid_targets_min": 629 }, { "epoch": 3.7047353760445683, "grad_norm": 0.8981802581015453, "learning_rate": 2.146425595012269e-05, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.08319033682346344, "step": 2660, "valid_targets_mean": 1881.2, "valid_targets_min": 1167 }, { "epoch": 3.711699164345404, "grad_norm": 0.7955838043549589, "learning_rate": 2.1394975499362947e-05, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.07869289815425873, "step": 2665, "valid_targets_mean": 1367.2, "valid_targets_min": 699 }, { "epoch": 3.7186629526462394, "grad_norm": 0.7732510809048744, "learning_rate": 2.132567822369428e-05, "loss": 0.1429, "loss_nan_ranks": 0, "loss_rank_avg": 0.058514297008514404, "step": 2670, "valid_targets_mean": 1174.9, "valid_targets_min": 679 }, { "epoch": 3.7256267409470754, "grad_norm": 0.7978233555615979, "learning_rate": 2.1256364958916564e-05, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.07325758785009384, "step": 2675, "valid_targets_mean": 1556.2, "valid_targets_min": 504 }, { "epoch": 3.732590529247911, "grad_norm": 0.8402148455143513, "learning_rate": 2.1187036541022533e-05, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.08283115178346634, "step": 2680, "valid_targets_mean": 1885.0, "valid_targets_min": 1331 }, { "epoch": 3.7395543175487465, "grad_norm": 0.764780642210825, "learning_rate": 2.1117693806187657e-05, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.055060356855392456, "step": 2685, "valid_targets_mean": 1306.1, "valid_targets_min": 661 }, { "epoch": 3.7465181058495824, "grad_norm": 0.7707860162726192, "learning_rate": 2.104833759076011e-05, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.05953007936477661, "step": 2690, "valid_targets_mean": 1330.1, "valid_targets_min": 958 }, { "epoch": 3.7534818941504176, "grad_norm": 0.7132388417704622, "learning_rate": 2.0978968731250648e-05, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.057646650820970535, "step": 2695, "valid_targets_mean": 1465.0, "valid_targets_min": 963 }, { "epoch": 3.7604456824512535, "grad_norm": 0.7777931157465899, "learning_rate": 2.0909588064322524e-05, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.07116229832172394, "step": 2700, "valid_targets_mean": 1428.0, "valid_targets_min": 793 }, { "epoch": 3.767409470752089, "grad_norm": 0.7925330730772479, "learning_rate": 2.08401964267814e-05, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.091750867664814, "step": 2705, "valid_targets_mean": 1633.1, "valid_targets_min": 917 }, { "epoch": 3.7743732590529246, "grad_norm": 0.8377874283930322, "learning_rate": 2.0770794655565278e-05, "loss": 0.1489, "loss_nan_ranks": 0, "loss_rank_avg": 0.06515245139598846, "step": 2710, "valid_targets_mean": 1246.5, "valid_targets_min": 872 }, { "epoch": 3.7813370473537606, "grad_norm": 0.7500409300068362, "learning_rate": 2.0701383587734334e-05, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.07608701288700104, "step": 2715, "valid_targets_mean": 1903.6, "valid_targets_min": 1220 }, { "epoch": 3.788300835654596, "grad_norm": 0.8435711995319485, "learning_rate": 2.0631964060460934e-05, "loss": 0.1357, "loss_nan_ranks": 0, "loss_rank_avg": 0.06794526427984238, "step": 2720, "valid_targets_mean": 1391.6, "valid_targets_min": 712 }, { "epoch": 3.7952646239554317, "grad_norm": 0.8724016823017468, "learning_rate": 2.0562536911019415e-05, "loss": 0.1453, "loss_nan_ranks": 0, "loss_rank_avg": 0.0759831964969635, "step": 2725, "valid_targets_mean": 1295.0, "valid_targets_min": 605 }, { "epoch": 3.8022284122562673, "grad_norm": 0.7990588269247201, "learning_rate": 2.049310297677609e-05, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.05404563248157501, "step": 2730, "valid_targets_mean": 1414.8, "valid_targets_min": 746 }, { "epoch": 3.809192200557103, "grad_norm": 0.9100646789026491, "learning_rate": 2.0423663095179084e-05, "loss": 0.1403, "loss_nan_ranks": 0, "loss_rank_avg": 0.06111488863825798, "step": 2735, "valid_targets_mean": 1059.4, "valid_targets_min": 723 }, { "epoch": 3.816155988857939, "grad_norm": 0.7835072806883097, "learning_rate": 2.0354218103748253e-05, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.08211217820644379, "step": 2740, "valid_targets_mean": 1634.2, "valid_targets_min": 1327 }, { "epoch": 3.8231197771587744, "grad_norm": 0.8355043521576563, "learning_rate": 2.028476884006508e-05, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.07008926570415497, "step": 2745, "valid_targets_mean": 1412.5, "valid_targets_min": 902 }, { "epoch": 3.83008356545961, "grad_norm": 0.8578826264946082, "learning_rate": 2.02153161417626e-05, "loss": 0.153, "loss_nan_ranks": 0, "loss_rank_avg": 0.07012935727834702, "step": 2750, "valid_targets_mean": 1558.8, "valid_targets_min": 803 }, { "epoch": 3.837047353760446, "grad_norm": 0.8206701722875304, "learning_rate": 2.0145860846515234e-05, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.07594504952430725, "step": 2755, "valid_targets_mean": 1441.2, "valid_targets_min": 1079 }, { "epoch": 3.8440111420612815, "grad_norm": 0.7481367084277267, "learning_rate": 2.0076403792028757e-05, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.06753340363502502, "step": 2760, "valid_targets_mean": 1449.8, "valid_targets_min": 1263 }, { "epoch": 3.850974930362117, "grad_norm": 0.7968317810485137, "learning_rate": 2.000694581603016e-05, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.07419832050800323, "step": 2765, "valid_targets_mean": 1487.4, "valid_targets_min": 844 }, { "epoch": 3.8579387186629526, "grad_norm": 0.8690761427120194, "learning_rate": 1.993748775625752e-05, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.06871486455202103, "step": 2770, "valid_targets_mean": 1421.4, "valid_targets_min": 667 }, { "epoch": 3.864902506963788, "grad_norm": 0.8975013022838169, "learning_rate": 1.986803045044996e-05, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.08886584639549255, "step": 2775, "valid_targets_mean": 1822.6, "valid_targets_min": 1041 }, { "epoch": 3.871866295264624, "grad_norm": 0.7977117949143756, "learning_rate": 1.9798574736337487e-05, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.06609257310628891, "step": 2780, "valid_targets_mean": 1327.4, "valid_targets_min": 777 }, { "epoch": 3.8788300835654597, "grad_norm": 0.7438548739680065, "learning_rate": 1.972912145163093e-05, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.07537013292312622, "step": 2785, "valid_targets_mean": 1823.8, "valid_targets_min": 1283 }, { "epoch": 3.885793871866295, "grad_norm": 0.928372055697338, "learning_rate": 1.965967143401178e-05, "loss": 0.1439, "loss_nan_ranks": 0, "loss_rank_avg": 0.05227617174386978, "step": 2790, "valid_targets_mean": 924.0, "valid_targets_min": 620 }, { "epoch": 3.8927576601671308, "grad_norm": 0.8016846902818193, "learning_rate": 1.9590225521122167e-05, "loss": 0.1455, "loss_nan_ranks": 0, "loss_rank_avg": 0.06370696425437927, "step": 2795, "valid_targets_mean": 1480.2, "valid_targets_min": 656 }, { "epoch": 3.8997214484679663, "grad_norm": 0.8062692815757603, "learning_rate": 1.9520784550554683e-05, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.059848278760910034, "step": 2800, "valid_targets_mean": 1415.5, "valid_targets_min": 697 }, { "epoch": 3.9066852367688023, "grad_norm": 0.8353157154283097, "learning_rate": 1.9451349359842332e-05, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.07082884013652802, "step": 2805, "valid_targets_mean": 1655.8, "valid_targets_min": 816 }, { "epoch": 3.913649025069638, "grad_norm": 0.7597621427921378, "learning_rate": 1.938192078644839e-05, "loss": 0.1417, "loss_nan_ranks": 0, "loss_rank_avg": 0.06765986979007721, "step": 2810, "valid_targets_mean": 1553.0, "valid_targets_min": 850 }, { "epoch": 3.9206128133704734, "grad_norm": 0.7816154228464142, "learning_rate": 1.931249966775633e-05, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.06977061927318573, "step": 2815, "valid_targets_mean": 1353.9, "valid_targets_min": 747 }, { "epoch": 3.9275766016713094, "grad_norm": 0.8523628518802676, "learning_rate": 1.92430868410597e-05, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.0653572827577591, "step": 2820, "valid_targets_mean": 1420.9, "valid_targets_min": 933 }, { "epoch": 3.934540389972145, "grad_norm": 0.801382105679613, "learning_rate": 1.9173683143552057e-05, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.07180759310722351, "step": 2825, "valid_targets_mean": 1394.9, "valid_targets_min": 827 }, { "epoch": 3.9415041782729805, "grad_norm": 0.7523245478800936, "learning_rate": 1.910428941231684e-05, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.06203988194465637, "step": 2830, "valid_targets_mean": 1383.2, "valid_targets_min": 909 }, { "epoch": 3.948467966573816, "grad_norm": 0.7403715943582305, "learning_rate": 1.903490648431728e-05, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.08447936922311783, "step": 2835, "valid_targets_mean": 1682.4, "valid_targets_min": 1094 }, { "epoch": 3.9554317548746516, "grad_norm": 0.8253011305912571, "learning_rate": 1.8965535196386326e-05, "loss": 0.1358, "loss_nan_ranks": 0, "loss_rank_avg": 0.06693306565284729, "step": 2840, "valid_targets_mean": 1118.4, "valid_targets_min": 720 }, { "epoch": 3.9623955431754876, "grad_norm": 0.7530842490472827, "learning_rate": 1.889617638521651e-05, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.07407623529434204, "step": 2845, "valid_targets_mean": 1538.2, "valid_targets_min": 610 }, { "epoch": 3.969359331476323, "grad_norm": 0.7546263356082901, "learning_rate": 1.8826830887349902e-05, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.07467672973871231, "step": 2850, "valid_targets_mean": 1570.1, "valid_targets_min": 713 }, { "epoch": 3.9763231197771587, "grad_norm": 0.833106804892126, "learning_rate": 1.8757499539167986e-05, "loss": 0.1587, "loss_nan_ranks": 0, "loss_rank_avg": 0.07438725978136063, "step": 2855, "valid_targets_mean": 1537.8, "valid_targets_min": 874 }, { "epoch": 3.9832869080779947, "grad_norm": 0.7504076181098892, "learning_rate": 1.8688183176881596e-05, "loss": 0.1472, "loss_nan_ranks": 0, "loss_rank_avg": 0.07164924591779709, "step": 2860, "valid_targets_mean": 1471.2, "valid_targets_min": 765 }, { "epoch": 3.9902506963788302, "grad_norm": 0.7785848799373203, "learning_rate": 1.861888263652081e-05, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.06348396092653275, "step": 2865, "valid_targets_mean": 1254.4, "valid_targets_min": 816 }, { "epoch": 3.997214484679666, "grad_norm": 0.78598015466159, "learning_rate": 1.8549598753924894e-05, "loss": 0.1527, "loss_nan_ranks": 0, "loss_rank_avg": 0.0708591490983963, "step": 2870, "valid_targets_mean": 1482.9, "valid_targets_min": 1182 }, { "epoch": 4.004178272980502, "grad_norm": 0.7745411560000336, "learning_rate": 1.8480332364732178e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.09853234887123108, "step": 2875, "valid_targets_mean": 5435.1, "valid_targets_min": 3516 }, { "epoch": 4.011142061281337, "grad_norm": 0.45693392884456113, "learning_rate": 1.8411084304370014e-05, "loss": 0.1987, "loss_nan_ranks": 0, "loss_rank_avg": 0.09516393393278122, "step": 2880, "valid_targets_mean": 7654.2, "valid_targets_min": 6354 }, { "epoch": 4.018105849582173, "grad_norm": 0.4319211248040884, "learning_rate": 1.8341855408044697e-05, "loss": 0.1906, "loss_nan_ranks": 0, "loss_rank_avg": 0.10908873379230499, "step": 2885, "valid_targets_mean": 7341.6, "valid_targets_min": 5754 }, { "epoch": 4.025069637883008, "grad_norm": 0.35087638698700635, "learning_rate": 1.8272646510731375e-05, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.08147092163562775, "step": 2890, "valid_targets_mean": 7666.2, "valid_targets_min": 5666 }, { "epoch": 4.032033426183844, "grad_norm": 0.4079352838694494, "learning_rate": 1.820345844716399e-05, "loss": 0.1835, "loss_nan_ranks": 0, "loss_rank_avg": 0.09540951251983643, "step": 2895, "valid_targets_mean": 7469.0, "valid_targets_min": 5646 }, { "epoch": 4.03899721448468, "grad_norm": 0.453891412990921, "learning_rate": 1.81342920518252e-05, "loss": 0.1844, "loss_nan_ranks": 0, "loss_rank_avg": 0.1076955646276474, "step": 2900, "valid_targets_mean": 7046.9, "valid_targets_min": 5571 }, { "epoch": 4.045961002785515, "grad_norm": 0.44912248872165283, "learning_rate": 1.8065148158936323e-05, "loss": 0.1985, "loss_nan_ranks": 0, "loss_rank_avg": 0.10332390666007996, "step": 2905, "valid_targets_mean": 7827.6, "valid_targets_min": 5405 }, { "epoch": 4.052924791086351, "grad_norm": 0.3855281872703947, "learning_rate": 1.799602760244728e-05, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.09584302455186844, "step": 2910, "valid_targets_mean": 7023.5, "valid_targets_min": 5664 }, { "epoch": 4.059888579387187, "grad_norm": 0.39674294021757817, "learning_rate": 1.7926931216026518e-05, "loss": 0.178, "loss_nan_ranks": 0, "loss_rank_avg": 0.08769885450601578, "step": 2915, "valid_targets_mean": 7069.8, "valid_targets_min": 5103 }, { "epoch": 4.066852367688022, "grad_norm": 0.4247588326582294, "learning_rate": 1.7857859833050983e-05, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.08552022278308868, "step": 2920, "valid_targets_mean": 6712.4, "valid_targets_min": 5469 }, { "epoch": 4.073816155988858, "grad_norm": 0.4334738323877378, "learning_rate": 1.7788814286596044e-05, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.0862928107380867, "step": 2925, "valid_targets_mean": 7289.2, "valid_targets_min": 5513 }, { "epoch": 4.080779944289693, "grad_norm": 0.5671431858648565, "learning_rate": 1.7719795409425443e-05, "loss": 0.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.08433561772108078, "step": 2930, "valid_targets_mean": 7022.1, "valid_targets_min": 5691 }, { "epoch": 4.087743732590529, "grad_norm": 0.5417102538090298, "learning_rate": 1.765080403398127e-05, "loss": 0.1801, "loss_nan_ranks": 0, "loss_rank_avg": 0.0926387831568718, "step": 2935, "valid_targets_mean": 6736.0, "valid_targets_min": 5550 }, { "epoch": 4.094707520891365, "grad_norm": 0.3961734843289232, "learning_rate": 1.758184099237393e-05, "loss": 0.1671, "loss_nan_ranks": 0, "loss_rank_avg": 0.08144709467887878, "step": 2940, "valid_targets_mean": 6346.9, "valid_targets_min": 5067 }, { "epoch": 4.1016713091922, "grad_norm": 0.3937587901125671, "learning_rate": 1.7512907116372066e-05, "loss": 0.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.08808314055204391, "step": 2945, "valid_targets_mean": 6784.0, "valid_targets_min": 5618 }, { "epoch": 4.108635097493036, "grad_norm": 0.43597320037991466, "learning_rate": 1.7444003237392567e-05, "loss": 0.1784, "loss_nan_ranks": 0, "loss_rank_avg": 0.10079539567232132, "step": 2950, "valid_targets_mean": 7568.4, "valid_targets_min": 5856 }, { "epoch": 4.1155988857938715, "grad_norm": 0.3994536656356681, "learning_rate": 1.737513018649053e-05, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.08414926379919052, "step": 2955, "valid_targets_mean": 7198.5, "valid_targets_min": 4793 }, { "epoch": 4.1225626740947074, "grad_norm": 0.4184797204828292, "learning_rate": 1.7306288794349213e-05, "loss": 0.1761, "loss_nan_ranks": 0, "loss_rank_avg": 0.08882571756839752, "step": 2960, "valid_targets_mean": 6680.5, "valid_targets_min": 5350 }, { "epoch": 4.129526462395543, "grad_norm": 0.4148372539820588, "learning_rate": 1.7237479891270054e-05, "loss": 0.1876, "loss_nan_ranks": 0, "loss_rank_avg": 0.0935942679643631, "step": 2965, "valid_targets_mean": 6770.6, "valid_targets_min": 5753 }, { "epoch": 4.1364902506963785, "grad_norm": 0.7626972756641216, "learning_rate": 1.7168704307162625e-05, "loss": 0.1835, "loss_nan_ranks": 0, "loss_rank_avg": 0.06254291534423828, "step": 2970, "valid_targets_mean": 1419.8, "valid_targets_min": 289 }, { "epoch": 4.1434540389972145, "grad_norm": 0.4371572099046906, "learning_rate": 1.7099962871534644e-05, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.09101256728172302, "step": 2975, "valid_targets_mean": 6784.2, "valid_targets_min": 5042 }, { "epoch": 4.1504178272980505, "grad_norm": 0.4078695342570583, "learning_rate": 1.703125641348197e-05, "loss": 0.169, "loss_nan_ranks": 0, "loss_rank_avg": 0.08425340801477432, "step": 2980, "valid_targets_mean": 6774.9, "valid_targets_min": 3875 }, { "epoch": 4.157381615598886, "grad_norm": 0.43908909204234714, "learning_rate": 1.696258576167856e-05, "loss": 0.1744, "loss_nan_ranks": 0, "loss_rank_avg": 0.09084954857826233, "step": 2985, "valid_targets_mean": 7047.6, "valid_targets_min": 6134 }, { "epoch": 4.164345403899722, "grad_norm": 0.3923313188578705, "learning_rate": 1.6893951744366547e-05, "loss": 0.1783, "loss_nan_ranks": 0, "loss_rank_avg": 0.09309709817171097, "step": 2990, "valid_targets_mean": 6886.6, "valid_targets_min": 5869 }, { "epoch": 4.171309192200557, "grad_norm": 0.377006462886014, "learning_rate": 1.6825355189346192e-05, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.08231081813573837, "step": 2995, "valid_targets_mean": 7559.8, "valid_targets_min": 6145 }, { "epoch": 4.178272980501393, "grad_norm": 0.3411126289914851, "learning_rate": 1.675679692396593e-05, "loss": 0.1631, "loss_nan_ranks": 0, "loss_rank_avg": 0.07891160249710083, "step": 3000, "valid_targets_mean": 8920.5, "valid_targets_min": 4780 }, { "epoch": 4.185236768802229, "grad_norm": 0.3592395577774327, "learning_rate": 1.6688277775112377e-05, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.06996404379606247, "step": 3005, "valid_targets_mean": 7393.4, "valid_targets_min": 5116 }, { "epoch": 4.192200557103064, "grad_norm": 0.34174396201498236, "learning_rate": 1.6619798569200368e-05, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.07682168483734131, "step": 3010, "valid_targets_mean": 8477.5, "valid_targets_min": 4033 }, { "epoch": 4.1991643454039, "grad_norm": 0.40130345703058956, "learning_rate": 1.6551360132162967e-05, "loss": 0.173, "loss_nan_ranks": 0, "loss_rank_avg": 0.08580783009529114, "step": 3015, "valid_targets_mean": 6736.6, "valid_targets_min": 4646 }, { "epoch": 4.206128133704736, "grad_norm": 0.43606325450974787, "learning_rate": 1.6482963289441533e-05, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.09041762351989746, "step": 3020, "valid_targets_mean": 7551.5, "valid_targets_min": 5461 }, { "epoch": 4.213091922005571, "grad_norm": 0.45829099636483556, "learning_rate": 1.6414608865975757e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.10397613048553467, "step": 3025, "valid_targets_mean": 7091.0, "valid_targets_min": 4879 }, { "epoch": 4.220055710306407, "grad_norm": 0.42080713802214453, "learning_rate": 1.6346297686193698e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.08283068239688873, "step": 3030, "valid_targets_mean": 6269.8, "valid_targets_min": 4606 }, { "epoch": 4.227019498607242, "grad_norm": 0.4001310643885332, "learning_rate": 1.6278030574001863e-05, "loss": 0.1834, "loss_nan_ranks": 0, "loss_rank_avg": 0.08124437183141708, "step": 3035, "valid_targets_mean": 6818.4, "valid_targets_min": 5525 }, { "epoch": 4.233983286908078, "grad_norm": 0.3928643150423594, "learning_rate": 1.6209808352775227e-05, "loss": 0.1725, "loss_nan_ranks": 0, "loss_rank_avg": 0.08757513761520386, "step": 3040, "valid_targets_mean": 7365.4, "valid_targets_min": 5000 }, { "epoch": 4.240947075208914, "grad_norm": 0.42455615486180276, "learning_rate": 1.6141631845347368e-05, "loss": 0.1761, "loss_nan_ranks": 0, "loss_rank_avg": 0.07783573120832443, "step": 3045, "valid_targets_mean": 6212.1, "valid_targets_min": 3988 }, { "epoch": 4.247910863509749, "grad_norm": 0.42241913812780074, "learning_rate": 1.607350187400049e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.08539704978466034, "step": 3050, "valid_targets_mean": 8396.9, "valid_targets_min": 6131 }, { "epoch": 4.254874651810585, "grad_norm": 0.4237454815884405, "learning_rate": 1.6005419260455512e-05, "loss": 0.1759, "loss_nan_ranks": 0, "loss_rank_avg": 0.0880412757396698, "step": 3055, "valid_targets_mean": 7651.0, "valid_targets_min": 4061 }, { "epoch": 4.26183844011142, "grad_norm": 0.37280072499256484, "learning_rate": 1.593738482586219e-05, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.0859137699007988, "step": 3060, "valid_targets_mean": 7090.1, "valid_targets_min": 5203 }, { "epoch": 4.268802228412256, "grad_norm": 0.41477357509750673, "learning_rate": 1.5869399390789172e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.08433390408754349, "step": 3065, "valid_targets_mean": 7001.0, "valid_targets_min": 5362 }, { "epoch": 4.275766016713092, "grad_norm": 0.40793877263257894, "learning_rate": 1.5801463775214118e-05, "loss": 0.1781, "loss_nan_ranks": 0, "loss_rank_avg": 0.08703209459781647, "step": 3070, "valid_targets_mean": 6359.2, "valid_targets_min": 5236 }, { "epoch": 4.282729805013927, "grad_norm": 0.44350806675129867, "learning_rate": 1.573357879851381e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.09586170315742493, "step": 3075, "valid_targets_mean": 5939.8, "valid_targets_min": 4693 }, { "epoch": 4.289693593314763, "grad_norm": 1.146676173490332, "learning_rate": 1.5665745279454294e-05, "loss": 0.1441, "loss_nan_ranks": 0, "loss_rank_avg": 0.030542651191353798, "step": 3080, "valid_targets_mean": 208.6, "valid_targets_min": 134 }, { "epoch": 4.296657381615599, "grad_norm": 0.48379943817559756, "learning_rate": 1.5597964036180955e-05, "loss": 0.1751, "loss_nan_ranks": 0, "loss_rank_avg": 0.09201765060424805, "step": 3085, "valid_targets_mean": 6008.5, "valid_targets_min": 4956 }, { "epoch": 4.303621169916434, "grad_norm": 0.4202491008226685, "learning_rate": 1.553023588620869e-05, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.07570789754390717, "step": 3090, "valid_targets_mean": 6042.0, "valid_targets_min": 4817 }, { "epoch": 4.31058495821727, "grad_norm": 0.42477738905964485, "learning_rate": 1.5462561646412028e-05, "loss": 0.1765, "loss_nan_ranks": 0, "loss_rank_avg": 0.08630920946598053, "step": 3095, "valid_targets_mean": 6608.6, "valid_targets_min": 5102 }, { "epoch": 4.3175487465181055, "grad_norm": 0.42688040529738014, "learning_rate": 1.5394942133015278e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.08623873442411423, "step": 3100, "valid_targets_mean": 6670.1, "valid_targets_min": 4869 }, { "epoch": 4.3245125348189415, "grad_norm": 0.42003992455965294, "learning_rate": 1.5327378161582697e-05, "loss": 0.1685, "loss_nan_ranks": 0, "loss_rank_avg": 0.07713023573160172, "step": 3105, "valid_targets_mean": 6088.4, "valid_targets_min": 4946 }, { "epoch": 4.3314763231197775, "grad_norm": 0.4216278012962236, "learning_rate": 1.5259870547008647e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.08279541879892349, "step": 3110, "valid_targets_mean": 6228.4, "valid_targets_min": 4856 }, { "epoch": 4.338440111420613, "grad_norm": 0.44787796967160803, "learning_rate": 1.5192420103507765e-05, "loss": 0.1769, "loss_nan_ranks": 0, "loss_rank_avg": 0.08231884241104126, "step": 3115, "valid_targets_mean": 5376.6, "valid_targets_min": 4145 }, { "epoch": 4.345403899721449, "grad_norm": 0.4676976765001585, "learning_rate": 1.5125027644605143e-05, "loss": 0.1369, "loss_nan_ranks": 0, "loss_rank_avg": 0.08625025302171707, "step": 3120, "valid_targets_mean": 6309.2, "valid_targets_min": 5305 }, { "epoch": 4.352367688022284, "grad_norm": 0.4889513820698066, "learning_rate": 1.50576939831265e-05, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.08322583138942719, "step": 3125, "valid_targets_mean": 6221.5, "valid_targets_min": 4636 }, { "epoch": 4.35933147632312, "grad_norm": 0.4369115623225211, "learning_rate": 1.4990419931188425e-05, "loss": 0.1698, "loss_nan_ranks": 0, "loss_rank_avg": 0.09070675075054169, "step": 3130, "valid_targets_mean": 6831.5, "valid_targets_min": 5668 }, { "epoch": 4.366295264623956, "grad_norm": 0.42542268683362244, "learning_rate": 1.4923206300188522e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.09038935601711273, "step": 3135, "valid_targets_mean": 6437.1, "valid_targets_min": 5004 }, { "epoch": 4.373259052924791, "grad_norm": 0.5378332721568458, "learning_rate": 1.4856053900795682e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.08066794276237488, "step": 3140, "valid_targets_mean": 6205.8, "valid_targets_min": 5341 }, { "epoch": 4.380222841225627, "grad_norm": 0.4295836677794995, "learning_rate": 1.4788963542940251e-05, "loss": 0.1698, "loss_nan_ranks": 0, "loss_rank_avg": 0.09073355048894882, "step": 3145, "valid_targets_mean": 6748.0, "valid_targets_min": 5363 }, { "epoch": 4.387186629526463, "grad_norm": 0.4850027247112984, "learning_rate": 1.4721936035804307e-05, "loss": 0.1686, "loss_nan_ranks": 0, "loss_rank_avg": 0.07909142971038818, "step": 3150, "valid_targets_mean": 5210.5, "valid_targets_min": 791 }, { "epoch": 4.394150417827298, "grad_norm": 0.7383337146665891, "learning_rate": 1.4654972187811858e-05, "loss": 0.1717, "loss_nan_ranks": 0, "loss_rank_avg": 0.06561724841594696, "step": 3155, "valid_targets_mean": 1279.5, "valid_targets_min": 746 }, { "epoch": 4.401114206128134, "grad_norm": 0.8310596897559344, "learning_rate": 1.4588072806619135e-05, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.08013515174388885, "step": 3160, "valid_targets_mean": 1635.8, "valid_targets_min": 661 }, { "epoch": 4.408077994428969, "grad_norm": 0.8516771248517533, "learning_rate": 1.4521238699104828e-05, "loss": 0.1453, "loss_nan_ranks": 0, "loss_rank_avg": 0.07185165584087372, "step": 3165, "valid_targets_mean": 1420.2, "valid_targets_min": 826 }, { "epoch": 4.415041782729805, "grad_norm": 0.825781158854519, "learning_rate": 1.4454470671360337e-05, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.06541028618812561, "step": 3170, "valid_targets_mean": 1399.9, "valid_targets_min": 742 }, { "epoch": 4.422005571030641, "grad_norm": 0.8548496982709529, "learning_rate": 1.4387769528680098e-05, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.060420047491788864, "step": 3175, "valid_targets_mean": 1309.9, "valid_targets_min": 718 }, { "epoch": 4.428969359331476, "grad_norm": 0.8030341275951788, "learning_rate": 1.4321136075551816e-05, "loss": 0.1479, "loss_nan_ranks": 0, "loss_rank_avg": 0.08500155806541443, "step": 3180, "valid_targets_mean": 1729.4, "valid_targets_min": 764 }, { "epoch": 4.435933147632312, "grad_norm": 0.7574670919758995, "learning_rate": 1.4254571115646795e-05, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.06925354897975922, "step": 3185, "valid_targets_mean": 1651.4, "valid_targets_min": 814 }, { "epoch": 4.442896935933147, "grad_norm": 0.8399886623759784, "learning_rate": 1.4188075451810238e-05, "loss": 0.1509, "loss_nan_ranks": 0, "loss_rank_avg": 0.05408865213394165, "step": 3190, "valid_targets_mean": 1192.0, "valid_targets_min": 610 }, { "epoch": 4.449860724233983, "grad_norm": 0.8256278183381764, "learning_rate": 1.4121649886051567e-05, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.07870268821716309, "step": 3195, "valid_targets_mean": 1879.0, "valid_targets_min": 817 }, { "epoch": 4.456824512534819, "grad_norm": 0.7713275384072368, "learning_rate": 1.4055295219534735e-05, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.06405435502529144, "step": 3200, "valid_targets_mean": 1500.4, "valid_targets_min": 837 }, { "epoch": 4.463788300835654, "grad_norm": 0.9706438394826296, "learning_rate": 1.3989012252568596e-05, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.09357143938541412, "step": 3205, "valid_targets_mean": 1661.8, "valid_targets_min": 593 }, { "epoch": 4.47075208913649, "grad_norm": 0.7845778542370729, "learning_rate": 1.3922801784597191e-05, "loss": 0.1384, "loss_nan_ranks": 0, "loss_rank_avg": 0.06827139109373093, "step": 3210, "valid_targets_mean": 1537.8, "valid_targets_min": 704 }, { "epoch": 4.477715877437326, "grad_norm": 0.7759659105769868, "learning_rate": 1.3856664614190186e-05, "loss": 0.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.0502796433866024, "step": 3215, "valid_targets_mean": 1227.0, "valid_targets_min": 722 }, { "epoch": 4.484679665738161, "grad_norm": 0.8287147960258013, "learning_rate": 1.3790601539033168e-05, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.06461460888385773, "step": 3220, "valid_targets_mean": 1364.5, "valid_targets_min": 642 }, { "epoch": 4.491643454038997, "grad_norm": 0.8589525229582935, "learning_rate": 1.3724613355918077e-05, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.06513009965419769, "step": 3225, "valid_targets_mean": 1358.5, "valid_targets_min": 518 }, { "epoch": 4.498607242339833, "grad_norm": 0.8202013278047937, "learning_rate": 1.3658700860733566e-05, "loss": 0.1419, "loss_nan_ranks": 0, "loss_rank_avg": 0.07893405854701996, "step": 3230, "valid_targets_mean": 1590.6, "valid_targets_min": 728 }, { "epoch": 4.505571030640668, "grad_norm": 0.7966714906034105, "learning_rate": 1.3592864848455415e-05, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.0855114758014679, "step": 3235, "valid_targets_mean": 1791.4, "valid_targets_min": 820 }, { "epoch": 4.512534818941504, "grad_norm": 0.8234446947551594, "learning_rate": 1.3527106113136915e-05, "loss": 0.1422, "loss_nan_ranks": 0, "loss_rank_avg": 0.07350599765777588, "step": 3240, "valid_targets_mean": 1470.8, "valid_targets_min": 818 }, { "epoch": 4.5194986072423395, "grad_norm": 0.909954505776544, "learning_rate": 1.3461425447899345e-05, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.05728901922702789, "step": 3245, "valid_targets_mean": 1278.6, "valid_targets_min": 625 }, { "epoch": 4.5264623955431755, "grad_norm": 0.7815284768559326, "learning_rate": 1.3395823644922357e-05, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.08874043077230453, "step": 3250, "valid_targets_mean": 2313.5, "valid_targets_min": 790 }, { "epoch": 4.5334261838440115, "grad_norm": 0.8603759963719848, "learning_rate": 1.3330301495434439e-05, "loss": 0.1415, "loss_nan_ranks": 0, "loss_rank_avg": 0.09591110795736313, "step": 3255, "valid_targets_mean": 2231.9, "valid_targets_min": 1335 }, { "epoch": 4.540389972144847, "grad_norm": 0.758467847298457, "learning_rate": 1.3264859789703391e-05, "loss": 0.1334, "loss_nan_ranks": 0, "loss_rank_avg": 0.07577726244926453, "step": 3260, "valid_targets_mean": 1729.5, "valid_targets_min": 719 }, { "epoch": 4.547353760445683, "grad_norm": 0.8154388753592663, "learning_rate": 1.3199499317026741e-05, "loss": 0.1302, "loss_nan_ranks": 0, "loss_rank_avg": 0.052854329347610474, "step": 3265, "valid_targets_mean": 1222.9, "valid_targets_min": 697 }, { "epoch": 4.554317548746518, "grad_norm": 0.8552854445354738, "learning_rate": 1.3134220865722282e-05, "loss": 0.1289, "loss_nan_ranks": 0, "loss_rank_avg": 0.07314737141132355, "step": 3270, "valid_targets_mean": 1521.1, "valid_targets_min": 998 }, { "epoch": 4.561281337047354, "grad_norm": 0.7820786112177985, "learning_rate": 1.3069025223118539e-05, "loss": 0.133, "loss_nan_ranks": 0, "loss_rank_avg": 0.06754308938980103, "step": 3275, "valid_targets_mean": 1693.9, "valid_targets_min": 629 }, { "epoch": 4.56824512534819, "grad_norm": 0.8755511497986203, "learning_rate": 1.3003913175545271e-05, "loss": 0.134, "loss_nan_ranks": 0, "loss_rank_avg": 0.07453906536102295, "step": 3280, "valid_targets_mean": 1630.2, "valid_targets_min": 1078 }, { "epoch": 4.575208913649025, "grad_norm": 0.7758564032420037, "learning_rate": 1.2938885508323989e-05, "loss": 0.1376, "loss_nan_ranks": 0, "loss_rank_avg": 0.06837262213230133, "step": 3285, "valid_targets_mean": 1843.0, "valid_targets_min": 1075 }, { "epoch": 4.582172701949861, "grad_norm": 0.7809622207382767, "learning_rate": 1.28739430057585e-05, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.07848972082138062, "step": 3290, "valid_targets_mean": 1848.2, "valid_targets_min": 1317 }, { "epoch": 4.589136490250697, "grad_norm": 0.7816839323875953, "learning_rate": 1.2809086451125402e-05, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.07772564888000488, "step": 3295, "valid_targets_mean": 1727.4, "valid_targets_min": 957 }, { "epoch": 4.596100278551532, "grad_norm": 0.9203545388755756, "learning_rate": 1.2744316626664702e-05, "loss": 0.1361, "loss_nan_ranks": 0, "loss_rank_avg": 0.060780055820941925, "step": 3300, "valid_targets_mean": 1115.4, "valid_targets_min": 643 }, { "epoch": 4.603064066852368, "grad_norm": 0.896065872644034, "learning_rate": 1.2679634313570324e-05, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.07272806763648987, "step": 3305, "valid_targets_mean": 1547.2, "valid_targets_min": 1111 }, { "epoch": 4.610027855153203, "grad_norm": 0.7733642462901773, "learning_rate": 1.2615040291980729e-05, "loss": 0.1273, "loss_nan_ranks": 0, "loss_rank_avg": 0.061603400856256485, "step": 3310, "valid_targets_mean": 1450.0, "valid_targets_min": 705 }, { "epoch": 4.616991643454039, "grad_norm": 0.8143367409475855, "learning_rate": 1.2550535340969483e-05, "loss": 0.1305, "loss_nan_ranks": 0, "loss_rank_avg": 0.07132863998413086, "step": 3315, "valid_targets_mean": 1539.0, "valid_targets_min": 1288 }, { "epoch": 4.623955431754875, "grad_norm": 0.8553022073322677, "learning_rate": 1.2486120238535845e-05, "loss": 0.1224, "loss_nan_ranks": 0, "loss_rank_avg": 0.06410254538059235, "step": 3320, "valid_targets_mean": 1321.2, "valid_targets_min": 753 }, { "epoch": 4.63091922005571, "grad_norm": 0.8567062695633868, "learning_rate": 1.2421795761595424e-05, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.0614665150642395, "step": 3325, "valid_targets_mean": 1480.0, "valid_targets_min": 817 }, { "epoch": 4.637883008356546, "grad_norm": 0.8755257408477221, "learning_rate": 1.2357562685970787e-05, "loss": 0.1262, "loss_nan_ranks": 0, "loss_rank_avg": 0.05426248908042908, "step": 3330, "valid_targets_mean": 1293.9, "valid_targets_min": 974 }, { "epoch": 4.644846796657381, "grad_norm": 0.9722123694394161, "learning_rate": 1.2293421786382094e-05, "loss": 0.1333, "loss_nan_ranks": 0, "loss_rank_avg": 0.07091125100851059, "step": 3335, "valid_targets_mean": 1529.2, "valid_targets_min": 657 }, { "epoch": 4.651810584958217, "grad_norm": 0.9541829768814589, "learning_rate": 1.2229373836437764e-05, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.07790433615446091, "step": 3340, "valid_targets_mean": 1678.0, "valid_targets_min": 880 }, { "epoch": 4.658774373259053, "grad_norm": 0.8576485652747621, "learning_rate": 1.2165419608625157e-05, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.07814347743988037, "step": 3345, "valid_targets_mean": 1609.4, "valid_targets_min": 1050 }, { "epoch": 4.665738161559888, "grad_norm": 0.8917597302101115, "learning_rate": 1.2101559874301217e-05, "loss": 0.1247, "loss_nan_ranks": 0, "loss_rank_avg": 0.05816866457462311, "step": 3350, "valid_targets_mean": 1449.0, "valid_targets_min": 682 }, { "epoch": 4.672701949860724, "grad_norm": 0.832501950400249, "learning_rate": 1.2037795403683212e-05, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.06002386286854744, "step": 3355, "valid_targets_mean": 1344.0, "valid_targets_min": 703 }, { "epoch": 4.67966573816156, "grad_norm": 0.8308585092709525, "learning_rate": 1.1974126965839434e-05, "loss": 0.1385, "loss_nan_ranks": 0, "loss_rank_avg": 0.06484422087669373, "step": 3360, "valid_targets_mean": 1469.4, "valid_targets_min": 934 }, { "epoch": 4.686629526462395, "grad_norm": 0.8444644777001103, "learning_rate": 1.1910555328679896e-05, "loss": 0.1413, "loss_nan_ranks": 0, "loss_rank_avg": 0.1002117171883583, "step": 3365, "valid_targets_mean": 1829.1, "valid_targets_min": 734 }, { "epoch": 4.693593314763231, "grad_norm": 0.7838276598240631, "learning_rate": 1.18470812589471e-05, "loss": 0.1276, "loss_nan_ranks": 0, "loss_rank_avg": 0.08434125781059265, "step": 3370, "valid_targets_mean": 2010.8, "valid_targets_min": 1437 }, { "epoch": 4.7005571030640665, "grad_norm": 0.8121696038208687, "learning_rate": 1.1783705522206794e-05, "loss": 0.1248, "loss_nan_ranks": 0, "loss_rank_avg": 0.05047055333852768, "step": 3375, "valid_targets_mean": 1405.2, "valid_targets_min": 551 }, { "epoch": 4.7075208913649025, "grad_norm": 0.9702607731512856, "learning_rate": 1.1720428882838694e-05, "loss": 0.1335, "loss_nan_ranks": 0, "loss_rank_avg": 0.08291260153055191, "step": 3380, "valid_targets_mean": 1817.6, "valid_targets_min": 931 }, { "epoch": 4.7144846796657385, "grad_norm": 0.820699694440321, "learning_rate": 1.1657252104027314e-05, "loss": 0.1277, "loss_nan_ranks": 0, "loss_rank_avg": 0.06308387219905853, "step": 3385, "valid_targets_mean": 1599.1, "valid_targets_min": 904 }, { "epoch": 4.721448467966574, "grad_norm": 0.829670605394756, "learning_rate": 1.1594175947752749e-05, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.07266199588775635, "step": 3390, "valid_targets_mean": 1774.8, "valid_targets_min": 1158 }, { "epoch": 4.72841225626741, "grad_norm": 0.8896710009000609, "learning_rate": 1.1531201174781459e-05, "loss": 0.1211, "loss_nan_ranks": 0, "loss_rank_avg": 0.05510660260915756, "step": 3395, "valid_targets_mean": 1229.2, "valid_targets_min": 756 }, { "epoch": 4.735376044568245, "grad_norm": 1.1555963653569135, "learning_rate": 1.1468328544657132e-05, "loss": 0.1392, "loss_nan_ranks": 0, "loss_rank_avg": 0.08370531350374222, "step": 3400, "valid_targets_mean": 1536.9, "valid_targets_min": 854 }, { "epoch": 4.742339832869081, "grad_norm": 0.8354454053066505, "learning_rate": 1.1405558815691466e-05, "loss": 0.1324, "loss_nan_ranks": 0, "loss_rank_avg": 0.07298648357391357, "step": 3405, "valid_targets_mean": 1739.5, "valid_targets_min": 1462 }, { "epoch": 4.749303621169917, "grad_norm": 0.8260820753810716, "learning_rate": 1.1342892744955112e-05, "loss": 0.1282, "loss_nan_ranks": 0, "loss_rank_avg": 0.05890219286084175, "step": 3410, "valid_targets_mean": 1475.9, "valid_targets_min": 944 }, { "epoch": 4.756267409470752, "grad_norm": 0.8016656660345047, "learning_rate": 1.1280331088268452e-05, "loss": 0.1269, "loss_nan_ranks": 0, "loss_rank_avg": 0.060654304921627045, "step": 3415, "valid_targets_mean": 1482.6, "valid_targets_min": 1227 }, { "epoch": 4.763231197771588, "grad_norm": 0.7864044513954926, "learning_rate": 1.1217874600192542e-05, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.051892273128032684, "step": 3420, "valid_targets_mean": 1276.5, "valid_targets_min": 740 }, { "epoch": 4.770194986072424, "grad_norm": 0.774017966732346, "learning_rate": 1.1155524034019981e-05, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.07892292737960815, "step": 3425, "valid_targets_mean": 2024.8, "valid_targets_min": 881 }, { "epoch": 4.777158774373259, "grad_norm": 0.8962743138721668, "learning_rate": 1.1093280141765837e-05, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.06519632786512375, "step": 3430, "valid_targets_mean": 1288.6, "valid_targets_min": 636 }, { "epoch": 4.784122562674095, "grad_norm": 0.8008310946938783, "learning_rate": 1.103114367415858e-05, "loss": 0.1255, "loss_nan_ranks": 0, "loss_rank_avg": 0.04663780331611633, "step": 3435, "valid_targets_mean": 1103.9, "valid_targets_min": 814 }, { "epoch": 4.791086350974931, "grad_norm": 0.857674350118069, "learning_rate": 1.0969115380631015e-05, "loss": 0.1212, "loss_nan_ranks": 0, "loss_rank_avg": 0.061598315834999084, "step": 3440, "valid_targets_mean": 1392.9, "valid_targets_min": 820 }, { "epoch": 4.798050139275766, "grad_norm": 0.8096519542290342, "learning_rate": 1.090719600931126e-05, "loss": 0.129, "loss_nan_ranks": 0, "loss_rank_avg": 0.057360272854566574, "step": 3445, "valid_targets_mean": 1392.4, "valid_targets_min": 661 }, { "epoch": 4.805013927576602, "grad_norm": 0.8515212322986098, "learning_rate": 1.0845386307013703e-05, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.06106788292527199, "step": 3450, "valid_targets_mean": 1441.8, "valid_targets_min": 728 }, { "epoch": 4.811977715877437, "grad_norm": 0.8509639251731652, "learning_rate": 1.078368701923003e-05, "loss": 0.1248, "loss_nan_ranks": 0, "loss_rank_avg": 0.060364048928022385, "step": 3455, "valid_targets_mean": 1413.5, "valid_targets_min": 692 }, { "epoch": 4.818941504178273, "grad_norm": 0.8405241655525482, "learning_rate": 1.0722098890120176e-05, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.06148139387369156, "step": 3460, "valid_targets_mean": 1323.5, "valid_targets_min": 840 }, { "epoch": 4.825905292479108, "grad_norm": 0.9119451778532717, "learning_rate": 1.0660622662503389e-05, "loss": 0.1347, "loss_nan_ranks": 0, "loss_rank_avg": 0.06766475737094879, "step": 3465, "valid_targets_mean": 1488.4, "valid_targets_min": 950 }, { "epoch": 4.832869080779944, "grad_norm": 0.7915913493434501, "learning_rate": 1.0599259077849294e-05, "loss": 0.1269, "loss_nan_ranks": 0, "loss_rank_avg": 0.07292820513248444, "step": 3470, "valid_targets_mean": 1935.9, "valid_targets_min": 878 }, { "epoch": 4.83983286908078, "grad_norm": 0.8489205471637494, "learning_rate": 1.0538008876268887e-05, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.06822683662176132, "step": 3475, "valid_targets_mean": 1502.1, "valid_targets_min": 836 }, { "epoch": 4.846796657381615, "grad_norm": 0.8786148894939648, "learning_rate": 1.0476872796505658e-05, "loss": 0.1264, "loss_nan_ranks": 0, "loss_rank_avg": 0.07060012221336365, "step": 3480, "valid_targets_mean": 1535.1, "valid_targets_min": 1013 }, { "epoch": 4.853760445682451, "grad_norm": 0.8959033919138696, "learning_rate": 1.0415851575926656e-05, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.05586308240890503, "step": 3485, "valid_targets_mean": 1346.4, "valid_targets_min": 748 }, { "epoch": 4.860724233983287, "grad_norm": 0.9017231573931604, "learning_rate": 1.035494595051361e-05, "loss": 0.1294, "loss_nan_ranks": 0, "loss_rank_avg": 0.06896314024925232, "step": 3490, "valid_targets_mean": 1543.9, "valid_targets_min": 729 }, { "epoch": 4.867688022284122, "grad_norm": 0.8540161387269878, "learning_rate": 1.0294156654854053e-05, "loss": 0.1372, "loss_nan_ranks": 0, "loss_rank_avg": 0.058618832379579544, "step": 3495, "valid_targets_mean": 1541.9, "valid_targets_min": 1219 }, { "epoch": 4.874651810584958, "grad_norm": 0.8673351138138804, "learning_rate": 1.023348442213244e-05, "loss": 0.1298, "loss_nan_ranks": 0, "loss_rank_avg": 0.06518058478832245, "step": 3500, "valid_targets_mean": 1632.8, "valid_targets_min": 916 }, { "epoch": 4.881615598885794, "grad_norm": 0.8662755506535637, "learning_rate": 1.0172929984121333e-05, "loss": 0.1292, "loss_nan_ranks": 0, "loss_rank_avg": 0.0599341094493866, "step": 3505, "valid_targets_mean": 1349.9, "valid_targets_min": 646 }, { "epoch": 4.888579387186629, "grad_norm": 0.8789665027258394, "learning_rate": 1.0112494071172549e-05, "loss": 0.1254, "loss_nan_ranks": 0, "loss_rank_avg": 0.06385256350040436, "step": 3510, "valid_targets_mean": 1383.0, "valid_targets_min": 906 }, { "epoch": 4.895543175487465, "grad_norm": 0.8475866768723133, "learning_rate": 1.0052177412208401e-05, "loss": 0.1225, "loss_nan_ranks": 0, "loss_rank_avg": 0.059585411101579666, "step": 3515, "valid_targets_mean": 1577.5, "valid_targets_min": 848 }, { "epoch": 4.9025069637883005, "grad_norm": 0.9212057570976543, "learning_rate": 9.991980734712821e-06, "loss": 0.1326, "loss_nan_ranks": 0, "loss_rank_avg": 0.06198536604642868, "step": 3520, "valid_targets_mean": 1183.5, "valid_targets_min": 692 }, { "epoch": 4.9094707520891365, "grad_norm": 0.8950552623059923, "learning_rate": 9.931904764722661e-06, "loss": 0.123, "loss_nan_ranks": 0, "loss_rank_avg": 0.058858513832092285, "step": 3525, "valid_targets_mean": 1373.9, "valid_targets_min": 821 }, { "epoch": 4.9164345403899725, "grad_norm": 0.7942490619902811, "learning_rate": 9.871950226818907e-06, "loss": 0.1202, "loss_nan_ranks": 0, "loss_rank_avg": 0.05587601661682129, "step": 3530, "valid_targets_mean": 1428.1, "valid_targets_min": 1013 }, { "epoch": 4.923398328690808, "grad_norm": 0.7959315882544532, "learning_rate": 9.812117844117955e-06, "loss": 0.1243, "loss_nan_ranks": 0, "loss_rank_avg": 0.06044112890958786, "step": 3535, "valid_targets_mean": 1420.9, "valid_targets_min": 781 }, { "epoch": 4.930362116991644, "grad_norm": 0.9261429168716236, "learning_rate": 9.752408338262864e-06, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.06673343479633331, "step": 3540, "valid_targets_mean": 1255.1, "valid_targets_min": 548 }, { "epoch": 4.937325905292479, "grad_norm": 0.7859825717323234, "learning_rate": 9.692822429414657e-06, "loss": 0.1246, "loss_nan_ranks": 0, "loss_rank_avg": 0.0637277364730835, "step": 3545, "valid_targets_mean": 1411.0, "valid_targets_min": 694 }, { "epoch": 4.944289693593315, "grad_norm": 0.8542974067863182, "learning_rate": 9.633360836243656e-06, "loss": 0.1335, "loss_nan_ranks": 0, "loss_rank_avg": 0.08179077506065369, "step": 3550, "valid_targets_mean": 1973.8, "valid_targets_min": 1030 }, { "epoch": 4.951253481894151, "grad_norm": 0.7455850946114743, "learning_rate": 9.57402427592081e-06, "loss": 0.1209, "loss_nan_ranks": 0, "loss_rank_avg": 0.05281627178192139, "step": 3555, "valid_targets_mean": 1580.2, "valid_targets_min": 682 }, { "epoch": 4.958217270194986, "grad_norm": 0.8918246113696654, "learning_rate": 9.514813464109023e-06, "loss": 0.1229, "loss_nan_ranks": 0, "loss_rank_avg": 0.06317047029733658, "step": 3560, "valid_targets_mean": 1425.4, "valid_targets_min": 990 }, { "epoch": 4.965181058495822, "grad_norm": 0.8206588096352696, "learning_rate": 9.455729114954542e-06, "loss": 0.128, "loss_nan_ranks": 0, "loss_rank_avg": 0.04826410859823227, "step": 3565, "valid_targets_mean": 1299.6, "valid_targets_min": 639 }, { "epoch": 4.972144846796658, "grad_norm": 0.8215144309267559, "learning_rate": 9.396771941078335e-06, "loss": 0.1254, "loss_nan_ranks": 0, "loss_rank_avg": 0.053259532898664474, "step": 3570, "valid_targets_mean": 1458.8, "valid_targets_min": 721 }, { "epoch": 4.979108635097493, "grad_norm": 0.8423487434531587, "learning_rate": 9.337942653567504e-06, "loss": 0.1361, "loss_nan_ranks": 0, "loss_rank_avg": 0.05987967178225517, "step": 3575, "valid_targets_mean": 1329.8, "valid_targets_min": 874 }, { "epoch": 4.986072423398329, "grad_norm": 0.7786328247052688, "learning_rate": 9.279241961966698e-06, "loss": 0.1307, "loss_nan_ranks": 0, "loss_rank_avg": 0.0674387663602829, "step": 3580, "valid_targets_mean": 1559.9, "valid_targets_min": 686 }, { "epoch": 4.993036211699164, "grad_norm": 0.8885857987523331, "learning_rate": 9.220670574269564e-06, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.07278092205524445, "step": 3585, "valid_targets_mean": 1392.5, "valid_targets_min": 713 }, { "epoch": 5.0, "grad_norm": 0.9810812179546335, "learning_rate": 9.162229196910201e-06, "loss": 0.1311, "loss_nan_ranks": 0, "loss_rank_avg": 0.09730862826108932, "step": 3590, "valid_targets_mean": 6130.4, "valid_targets_min": 920 }, { "epoch": 5.006963788300836, "grad_norm": 0.7395884420407827, "learning_rate": 9.103918534754648e-06, "loss": 0.19, "loss_nan_ranks": 0, "loss_rank_avg": 0.09225118160247803, "step": 3595, "valid_targets_mean": 7389.0, "valid_targets_min": 5627 }, { "epoch": 5.013927576601671, "grad_norm": 0.7448900926657113, "learning_rate": 9.045739291092377e-06, "loss": 0.1886, "loss_nan_ranks": 0, "loss_rank_avg": 0.05141618102788925, "step": 3600, "valid_targets_mean": 1294.8, "valid_targets_min": 422 }, { "epoch": 5.020891364902507, "grad_norm": 0.43737029497845903, "learning_rate": 8.987692167627807e-06, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.09226194024085999, "step": 3605, "valid_targets_mean": 8539.9, "valid_targets_min": 6761 }, { "epoch": 5.027855153203342, "grad_norm": 0.40244324306844387, "learning_rate": 8.929777864471847e-06, "loss": 0.1705, "loss_nan_ranks": 0, "loss_rank_avg": 0.0802266001701355, "step": 3610, "valid_targets_mean": 7579.0, "valid_targets_min": 6174 }, { "epoch": 5.034818941504178, "grad_norm": 0.3948157476493201, "learning_rate": 8.871997080133446e-06, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.07746812701225281, "step": 3615, "valid_targets_mean": 7328.2, "valid_targets_min": 4839 }, { "epoch": 5.041782729805014, "grad_norm": 0.42318640045066125, "learning_rate": 8.814350511511187e-06, "loss": 0.1823, "loss_nan_ranks": 0, "loss_rank_avg": 0.09257575869560242, "step": 3620, "valid_targets_mean": 6838.2, "valid_targets_min": 5034 }, { "epoch": 5.048746518105849, "grad_norm": 0.4452897616046545, "learning_rate": 8.756838853884862e-06, "loss": 0.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.09431345760822296, "step": 3625, "valid_targets_mean": 7248.2, "valid_targets_min": 5567 }, { "epoch": 5.055710306406685, "grad_norm": 0.4113841425843344, "learning_rate": 8.699462800907063e-06, "loss": 0.1687, "loss_nan_ranks": 0, "loss_rank_avg": 0.07702521979808807, "step": 3630, "valid_targets_mean": 6234.0, "valid_targets_min": 5603 }, { "epoch": 5.062674094707521, "grad_norm": 0.6816435531080544, "learning_rate": 8.642223044594873e-06, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.023794259876012802, "step": 3635, "valid_targets_mean": 602.0, "valid_targets_min": 152 }, { "epoch": 5.069637883008356, "grad_norm": 0.40935977827091236, "learning_rate": 8.585120275321493e-06, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.08000779151916504, "step": 3640, "valid_targets_mean": 7299.9, "valid_targets_min": 6158 }, { "epoch": 5.076601671309192, "grad_norm": 0.41147638157549343, "learning_rate": 8.528155181807895e-06, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.08062512427568436, "step": 3645, "valid_targets_mean": 6140.0, "valid_targets_min": 4648 }, { "epoch": 5.0835654596100275, "grad_norm": 0.44547329868476815, "learning_rate": 8.471328451114545e-06, "loss": 0.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.08527650684118271, "step": 3650, "valid_targets_mean": 6603.0, "valid_targets_min": 4882 }, { "epoch": 5.0905292479108635, "grad_norm": 0.40170578080263875, "learning_rate": 8.414640768633096e-06, "loss": 0.1656, "loss_nan_ranks": 0, "loss_rank_avg": 0.0836111456155777, "step": 3655, "valid_targets_mean": 8015.0, "valid_targets_min": 6344 }, { "epoch": 5.0974930362116995, "grad_norm": 0.41169416175196893, "learning_rate": 8.358092818078133e-06, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.07325682044029236, "step": 3660, "valid_targets_mean": 6305.2, "valid_targets_min": 4622 }, { "epoch": 5.104456824512535, "grad_norm": 0.40731776029002104, "learning_rate": 8.301685281478923e-06, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.089007668197155, "step": 3665, "valid_targets_mean": 7890.8, "valid_targets_min": 5485 }, { "epoch": 5.111420612813371, "grad_norm": 0.4776234320230322, "learning_rate": 8.24541883917119e-06, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.07598386704921722, "step": 3670, "valid_targets_mean": 7016.6, "valid_targets_min": 4960 }, { "epoch": 5.118384401114207, "grad_norm": 0.41863282757191406, "learning_rate": 8.189294169788913e-06, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.07902969419956207, "step": 3675, "valid_targets_mean": 6527.1, "valid_targets_min": 5399 }, { "epoch": 5.125348189415042, "grad_norm": 0.47406483603656724, "learning_rate": 8.133311950256127e-06, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.08029402792453766, "step": 3680, "valid_targets_mean": 4995.0, "valid_targets_min": 618 }, { "epoch": 5.132311977715878, "grad_norm": 0.4225431739550544, "learning_rate": 8.077472855778774e-06, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.09067791700363159, "step": 3685, "valid_targets_mean": 7219.4, "valid_targets_min": 5764 }, { "epoch": 5.139275766016713, "grad_norm": 0.4015096498481741, "learning_rate": 8.021777559836554e-06, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.08319695293903351, "step": 3690, "valid_targets_mean": 7998.5, "valid_targets_min": 5902 }, { "epoch": 5.146239554317549, "grad_norm": 0.38710682418396525, "learning_rate": 7.966226734174799e-06, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.06552509218454361, "step": 3695, "valid_targets_mean": 7377.4, "valid_targets_min": 5015 }, { "epoch": 5.153203342618385, "grad_norm": 0.3983605888889487, "learning_rate": 7.910821048796368e-06, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.06865357607603073, "step": 3700, "valid_targets_mean": 6794.0, "valid_targets_min": 5283 }, { "epoch": 5.16016713091922, "grad_norm": 0.44045948176479105, "learning_rate": 7.855561171953594e-06, "loss": 0.1685, "loss_nan_ranks": 0, "loss_rank_avg": 0.09348156303167343, "step": 3705, "valid_targets_mean": 6656.4, "valid_targets_min": 4364 }, { "epoch": 5.167130919220056, "grad_norm": 0.43728173137315074, "learning_rate": 7.800447770140185e-06, "loss": 0.1677, "loss_nan_ranks": 0, "loss_rank_avg": 0.07885047048330307, "step": 3710, "valid_targets_mean": 7178.4, "valid_targets_min": 4448 }, { "epoch": 5.174094707520891, "grad_norm": 0.4411940412213923, "learning_rate": 7.74548150808319e-06, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.09826900064945221, "step": 3715, "valid_targets_mean": 7619.8, "valid_targets_min": 5737 }, { "epoch": 5.181058495821727, "grad_norm": 0.3963098926707128, "learning_rate": 7.690663048735009e-06, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.06886550784111023, "step": 3720, "valid_targets_mean": 8754.4, "valid_targets_min": 5752 }, { "epoch": 5.188022284122563, "grad_norm": 0.4431165807502115, "learning_rate": 7.635993053265391e-06, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.07675637304782867, "step": 3725, "valid_targets_mean": 6341.0, "valid_targets_min": 4543 }, { "epoch": 5.194986072423398, "grad_norm": 0.4239858813074235, "learning_rate": 7.581472181053435e-06, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.08128580451011658, "step": 3730, "valid_targets_mean": 7181.9, "valid_targets_min": 4563 }, { "epoch": 5.201949860724234, "grad_norm": 0.7649649723811223, "learning_rate": 7.527101089679658e-06, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.051468294113874435, "step": 3735, "valid_targets_mean": 1104.4, "valid_targets_min": 161 }, { "epoch": 5.20891364902507, "grad_norm": 0.41405913060333405, "learning_rate": 7.4728804349180575e-06, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.07386703789234161, "step": 3740, "valid_targets_mean": 7018.2, "valid_targets_min": 5424 }, { "epoch": 5.215877437325905, "grad_norm": 0.45338644264188654, "learning_rate": 7.418810870728203e-06, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.08742383122444153, "step": 3745, "valid_targets_mean": 7738.4, "valid_targets_min": 5329 }, { "epoch": 5.222841225626741, "grad_norm": 0.4466036832294684, "learning_rate": 7.364893049247351e-06, "loss": 0.1758, "loss_nan_ranks": 0, "loss_rank_avg": 0.0829770565032959, "step": 3750, "valid_targets_mean": 6426.6, "valid_targets_min": 5560 }, { "epoch": 5.229805013927576, "grad_norm": 0.48777116575319945, "learning_rate": 7.311127620782575e-06, "loss": 0.1702, "loss_nan_ranks": 0, "loss_rank_avg": 0.08484528213739395, "step": 3755, "valid_targets_mean": 6169.9, "valid_targets_min": 3446 }, { "epoch": 5.236768802228412, "grad_norm": 0.4147145687544805, "learning_rate": 7.2575152338029255e-06, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.08592289686203003, "step": 3760, "valid_targets_mean": 7204.6, "valid_targets_min": 5381 }, { "epoch": 5.243732590529248, "grad_norm": 0.4338983913748669, "learning_rate": 7.204056534931607e-06, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.08771762251853943, "step": 3765, "valid_targets_mean": 7600.4, "valid_targets_min": 5241 }, { "epoch": 5.250696378830083, "grad_norm": 0.41445196900515596, "learning_rate": 7.150752168938182e-06, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.08908963948488235, "step": 3770, "valid_targets_mean": 7098.5, "valid_targets_min": 5607 }, { "epoch": 5.257660167130919, "grad_norm": 0.463052253966403, "learning_rate": 7.097602778730788e-06, "loss": 0.1687, "loss_nan_ranks": 0, "loss_rank_avg": 0.08907216787338257, "step": 3775, "valid_targets_mean": 6955.1, "valid_targets_min": 5530 }, { "epoch": 5.264623955431755, "grad_norm": 0.4364902349015762, "learning_rate": 7.044609005348389e-06, "loss": 0.1681, "loss_nan_ranks": 0, "loss_rank_avg": 0.08470651507377625, "step": 3780, "valid_targets_mean": 6748.1, "valid_targets_min": 5364 }, { "epoch": 5.27158774373259, "grad_norm": 0.4667194728842975, "learning_rate": 6.991771487953036e-06, "loss": 0.1681, "loss_nan_ranks": 0, "loss_rank_avg": 0.08043470978736877, "step": 3785, "valid_targets_mean": 6273.9, "valid_targets_min": 5438 }, { "epoch": 5.278551532033426, "grad_norm": 0.42521567334703014, "learning_rate": 6.939090863822188e-06, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.07761454582214355, "step": 3790, "valid_targets_mean": 6419.5, "valid_targets_min": 4879 }, { "epoch": 5.2855153203342615, "grad_norm": 0.43932142773608807, "learning_rate": 6.8865677683409835e-06, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.07779448479413986, "step": 3795, "valid_targets_mean": 6483.4, "valid_targets_min": 4309 }, { "epoch": 5.2924791086350975, "grad_norm": 0.47079517415735234, "learning_rate": 6.834202834994581e-06, "loss": 0.1334, "loss_nan_ranks": 0, "loss_rank_avg": 0.09646376967430115, "step": 3800, "valid_targets_mean": 6825.0, "valid_targets_min": 5205 }, { "epoch": 5.2994428969359335, "grad_norm": 0.46289740146196456, "learning_rate": 6.781996695360553e-06, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.07646790146827698, "step": 3805, "valid_targets_mean": 6729.4, "valid_targets_min": 5200 }, { "epoch": 5.306406685236769, "grad_norm": 0.44246422147197345, "learning_rate": 6.729949979101256e-06, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.07880687713623047, "step": 3810, "valid_targets_mean": 6094.0, "valid_targets_min": 5302 }, { "epoch": 5.313370473537605, "grad_norm": 0.4386645916488665, "learning_rate": 6.678063313956211e-06, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.0853356197476387, "step": 3815, "valid_targets_mean": 7140.0, "valid_targets_min": 5270 }, { "epoch": 5.32033426183844, "grad_norm": 0.3896192941415339, "learning_rate": 6.626337325734564e-06, "loss": 0.159, "loss_nan_ranks": 0, "loss_rank_avg": 0.07671719789505005, "step": 3820, "valid_targets_mean": 7425.0, "valid_targets_min": 5281 }, { "epoch": 5.327298050139276, "grad_norm": 0.43882210400710403, "learning_rate": 6.574772638307496e-06, "loss": 0.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.10439842939376831, "step": 3825, "valid_targets_mean": 7063.4, "valid_targets_min": 5386 }, { "epoch": 5.334261838440112, "grad_norm": 0.4328294638391199, "learning_rate": 6.523369873600767e-06, "loss": 0.1672, "loss_nan_ranks": 0, "loss_rank_avg": 0.08555565774440765, "step": 3830, "valid_targets_mean": 6827.0, "valid_targets_min": 4547 }, { "epoch": 5.341225626740947, "grad_norm": 0.5740969553533752, "learning_rate": 6.472129651587147e-06, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.03779056295752525, "step": 3835, "valid_targets_mean": 2047.0, "valid_targets_min": 165 }, { "epoch": 5.348189415041783, "grad_norm": 0.4535247047853864, "learning_rate": 6.421052590278976e-06, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.07807661592960358, "step": 3840, "valid_targets_mean": 6754.1, "valid_targets_min": 5196 }, { "epoch": 5.355153203342619, "grad_norm": 0.4691124981565333, "learning_rate": 6.370139305720693e-06, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.07937394082546234, "step": 3845, "valid_targets_mean": 5985.6, "valid_targets_min": 5028 }, { "epoch": 5.362116991643454, "grad_norm": 0.4621292650890354, "learning_rate": 6.319390411981421e-06, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.07576687633991241, "step": 3850, "valid_targets_mean": 5963.9, "valid_targets_min": 5237 }, { "epoch": 5.36908077994429, "grad_norm": 0.47453529144859713, "learning_rate": 6.268806521147546e-06, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.08445766568183899, "step": 3855, "valid_targets_mean": 6319.0, "valid_targets_min": 5412 }, { "epoch": 5.376044568245125, "grad_norm": 0.41147646717777764, "learning_rate": 6.218388243315343e-06, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.06716381013393402, "step": 3860, "valid_targets_mean": 7125.8, "valid_targets_min": 5080 }, { "epoch": 5.383008356545961, "grad_norm": 0.43779798115412527, "learning_rate": 6.168136186583615e-06, "loss": 0.1621, "loss_nan_ranks": 0, "loss_rank_avg": 0.07958684861660004, "step": 3865, "valid_targets_mean": 6123.5, "valid_targets_min": 4521 }, { "epoch": 5.389972144846797, "grad_norm": 0.966196621555397, "learning_rate": 6.118050957046358e-06, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.09092744439840317, "step": 3870, "valid_targets_mean": 1886.0, "valid_targets_min": 1111 }, { "epoch": 5.396935933147632, "grad_norm": 0.8077855185739582, "learning_rate": 6.068133158785463e-06, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.07527165114879608, "step": 3875, "valid_targets_mean": 1497.6, "valid_targets_min": 893 }, { "epoch": 5.403899721448468, "grad_norm": 0.7144983965195878, "learning_rate": 6.018383393863412e-06, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.049098506569862366, "step": 3880, "valid_targets_mean": 1356.0, "valid_targets_min": 914 }, { "epoch": 5.410863509749303, "grad_norm": 0.8109690813075966, "learning_rate": 5.968802262316009e-06, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.054713502526283264, "step": 3885, "valid_targets_mean": 1324.5, "valid_targets_min": 680 }, { "epoch": 5.417827298050139, "grad_norm": 0.8096672959801836, "learning_rate": 5.919390362145172e-06, "loss": 0.1336, "loss_nan_ranks": 0, "loss_rank_avg": 0.06651387363672256, "step": 3890, "valid_targets_mean": 1931.8, "valid_targets_min": 876 }, { "epoch": 5.424791086350975, "grad_norm": 0.9084117209145378, "learning_rate": 5.870148289311719e-06, "loss": 0.1281, "loss_nan_ranks": 0, "loss_rank_avg": 0.05635681003332138, "step": 3895, "valid_targets_mean": 1292.2, "valid_targets_min": 734 }, { "epoch": 5.43175487465181, "grad_norm": 0.8234461561242756, "learning_rate": 5.8210766377281425e-06, "loss": 0.1376, "loss_nan_ranks": 0, "loss_rank_avg": 0.05349376052618027, "step": 3900, "valid_targets_mean": 1469.6, "valid_targets_min": 655 }, { "epoch": 5.438718662952646, "grad_norm": 0.8349797022317297, "learning_rate": 5.7721759992514835e-06, "loss": 0.1165, "loss_nan_ranks": 0, "loss_rank_avg": 0.06947162747383118, "step": 3905, "valid_targets_mean": 1548.4, "valid_targets_min": 737 }, { "epoch": 5.445682451253482, "grad_norm": 0.8357949779321237, "learning_rate": 5.7234469636761825e-06, "loss": 0.1376, "loss_nan_ranks": 0, "loss_rank_avg": 0.05619405210018158, "step": 3910, "valid_targets_mean": 1316.5, "valid_targets_min": 759 }, { "epoch": 5.452646239554317, "grad_norm": 0.8320721049373022, "learning_rate": 5.674890118726955e-06, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.048418521881103516, "step": 3915, "valid_targets_mean": 1249.6, "valid_targets_min": 753 }, { "epoch": 5.459610027855153, "grad_norm": 0.8918073241547342, "learning_rate": 5.626506050051716e-06, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.07567094266414642, "step": 3920, "valid_targets_mean": 1833.0, "valid_targets_min": 927 }, { "epoch": 5.4665738161559885, "grad_norm": 0.864812696220783, "learning_rate": 5.578295341214519e-06, "loss": 0.1259, "loss_nan_ranks": 0, "loss_rank_avg": 0.06043354421854019, "step": 3925, "valid_targets_mean": 1338.4, "valid_targets_min": 679 }, { "epoch": 5.4735376044568245, "grad_norm": 0.854189693756131, "learning_rate": 5.530258573688496e-06, "loss": 0.124, "loss_nan_ranks": 0, "loss_rank_avg": 0.05904326215386391, "step": 3930, "valid_targets_mean": 1244.6, "valid_targets_min": 771 }, { "epoch": 5.4805013927576605, "grad_norm": 0.7843808631480862, "learning_rate": 5.482396326848884e-06, "loss": 0.1125, "loss_nan_ranks": 0, "loss_rank_avg": 0.058021124452352524, "step": 3935, "valid_targets_mean": 1732.5, "valid_targets_min": 986 }, { "epoch": 5.487465181058496, "grad_norm": 0.9558429957238452, "learning_rate": 5.434709177965982e-06, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.05305638536810875, "step": 3940, "valid_targets_mean": 1389.9, "valid_targets_min": 1103 }, { "epoch": 5.494428969359332, "grad_norm": 0.8557141687664696, "learning_rate": 5.387197702198239e-06, "loss": 0.1195, "loss_nan_ranks": 0, "loss_rank_avg": 0.0624840185046196, "step": 3945, "valid_targets_mean": 1593.2, "valid_targets_min": 675 }, { "epoch": 5.501392757660167, "grad_norm": 0.8442709657389822, "learning_rate": 5.339862472585284e-06, "loss": 0.1221, "loss_nan_ranks": 0, "loss_rank_avg": 0.07162931561470032, "step": 3950, "valid_targets_mean": 1926.6, "valid_targets_min": 974 }, { "epoch": 5.508356545961003, "grad_norm": 0.8922738009156526, "learning_rate": 5.292704060041047e-06, "loss": 0.1228, "loss_nan_ranks": 0, "loss_rank_avg": 0.07262811809778214, "step": 3955, "valid_targets_mean": 1953.1, "valid_targets_min": 869 }, { "epoch": 5.515320334261839, "grad_norm": 0.8628907763362105, "learning_rate": 5.245723033346841e-06, "loss": 0.1226, "loss_nan_ranks": 0, "loss_rank_avg": 0.05248372256755829, "step": 3960, "valid_targets_mean": 1327.2, "valid_targets_min": 1023 }, { "epoch": 5.522284122562674, "grad_norm": 1.0689981634779093, "learning_rate": 5.198919959144504e-06, "loss": 0.1263, "loss_nan_ranks": 0, "loss_rank_avg": 0.06385475397109985, "step": 3965, "valid_targets_mean": 1717.9, "valid_targets_min": 709 }, { "epoch": 5.52924791086351, "grad_norm": 0.8507547339269755, "learning_rate": 5.152295401929581e-06, "loss": 0.1222, "loss_nan_ranks": 0, "loss_rank_avg": 0.04907778650522232, "step": 3970, "valid_targets_mean": 1139.9, "valid_targets_min": 658 }, { "epoch": 5.536211699164346, "grad_norm": 0.8352935218223749, "learning_rate": 5.10584992404453e-06, "loss": 0.1204, "loss_nan_ranks": 0, "loss_rank_avg": 0.05608684569597244, "step": 3975, "valid_targets_mean": 1444.8, "valid_targets_min": 662 }, { "epoch": 5.543175487465181, "grad_norm": 0.8360060925828016, "learning_rate": 5.059584085671896e-06, "loss": 0.1211, "loss_nan_ranks": 0, "loss_rank_avg": 0.04403482377529144, "step": 3980, "valid_targets_mean": 1242.2, "valid_targets_min": 859 }, { "epoch": 5.550139275766017, "grad_norm": 0.8557031879654616, "learning_rate": 5.0134984448275844e-06, "loss": 0.11, "loss_nan_ranks": 0, "loss_rank_avg": 0.06525018811225891, "step": 3985, "valid_targets_mean": 1569.2, "valid_targets_min": 950 }, { "epoch": 5.557103064066853, "grad_norm": 0.8940987834631933, "learning_rate": 4.967593557354125e-06, "loss": 0.1175, "loss_nan_ranks": 0, "loss_rank_avg": 0.057968899607658386, "step": 3990, "valid_targets_mean": 1539.8, "valid_targets_min": 686 }, { "epoch": 5.564066852367688, "grad_norm": 0.8803812608953893, "learning_rate": 4.921869976913964e-06, "loss": 0.1187, "loss_nan_ranks": 0, "loss_rank_avg": 0.06881322711706161, "step": 3995, "valid_targets_mean": 1610.6, "valid_targets_min": 702 }, { "epoch": 5.571030640668524, "grad_norm": 0.8857750625346741, "learning_rate": 4.876328254982796e-06, "loss": 0.1188, "loss_nan_ranks": 0, "loss_rank_avg": 0.043028295040130615, "step": 4000, "valid_targets_mean": 1190.4, "valid_targets_min": 779 }, { "epoch": 5.577994428969359, "grad_norm": 0.8537850227769329, "learning_rate": 4.8309689408429015e-06, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.06296706199645996, "step": 4005, "valid_targets_mean": 1467.1, "valid_targets_min": 822 }, { "epoch": 5.584958217270195, "grad_norm": 0.8285166830028964, "learning_rate": 4.785792581576523e-06, "loss": 0.1172, "loss_nan_ranks": 0, "loss_rank_avg": 0.05445345491170883, "step": 4010, "valid_targets_mean": 1350.5, "valid_targets_min": 868 }, { "epoch": 5.591922005571031, "grad_norm": 0.8667031190956394, "learning_rate": 4.740799722059269e-06, "loss": 0.1196, "loss_nan_ranks": 0, "loss_rank_avg": 0.04850904271006584, "step": 4015, "valid_targets_mean": 1283.5, "valid_targets_min": 781 }, { "epoch": 5.598885793871866, "grad_norm": 0.8366685664142771, "learning_rate": 4.6959909049535665e-06, "loss": 0.1198, "loss_nan_ranks": 0, "loss_rank_avg": 0.05181458219885826, "step": 4020, "valid_targets_mean": 1303.2, "valid_targets_min": 793 }, { "epoch": 5.605849582172702, "grad_norm": 0.7495096178648898, "learning_rate": 4.651366670702054e-06, "loss": 0.1211, "loss_nan_ranks": 0, "loss_rank_avg": 0.047033414244651794, "step": 4025, "valid_targets_mean": 1309.1, "valid_targets_min": 806 }, { "epoch": 5.612813370473537, "grad_norm": 0.811123052386617, "learning_rate": 4.606927557521128e-06, "loss": 0.117, "loss_nan_ranks": 0, "loss_rank_avg": 0.04835967719554901, "step": 4030, "valid_targets_mean": 1397.6, "valid_targets_min": 803 }, { "epoch": 5.619777158774373, "grad_norm": 0.851744557513053, "learning_rate": 4.562674101394413e-06, "loss": 0.1157, "loss_nan_ranks": 0, "loss_rank_avg": 0.04473861679434776, "step": 4035, "valid_targets_mean": 1187.8, "valid_targets_min": 660 }, { "epoch": 5.626740947075209, "grad_norm": 0.8083228291949228, "learning_rate": 4.518606836066328e-06, "loss": 0.107, "loss_nan_ranks": 0, "loss_rank_avg": 0.05075952038168907, "step": 4040, "valid_targets_mean": 1547.0, "valid_targets_min": 853 }, { "epoch": 5.633704735376044, "grad_norm": 0.924317112722506, "learning_rate": 4.474726293035614e-06, "loss": 0.1172, "loss_nan_ranks": 0, "loss_rank_avg": 0.0637693852186203, "step": 4045, "valid_targets_mean": 1704.2, "valid_targets_min": 719 }, { "epoch": 5.64066852367688, "grad_norm": 0.8765664950505369, "learning_rate": 4.43103300154893e-06, "loss": 0.1161, "loss_nan_ranks": 0, "loss_rank_avg": 0.044058702886104584, "step": 4050, "valid_targets_mean": 1255.0, "valid_targets_min": 765 }, { "epoch": 5.647632311977716, "grad_norm": 0.8847967785711801, "learning_rate": 4.3875274885944965e-06, "loss": 0.1184, "loss_nan_ranks": 0, "loss_rank_avg": 0.06218354403972626, "step": 4055, "valid_targets_mean": 1550.8, "valid_targets_min": 875 }, { "epoch": 5.654596100278551, "grad_norm": 0.8774671561905153, "learning_rate": 4.344210278895729e-06, "loss": 0.1121, "loss_nan_ranks": 0, "loss_rank_avg": 0.0588260255753994, "step": 4060, "valid_targets_mean": 1362.0, "valid_targets_min": 739 }, { "epoch": 5.661559888579387, "grad_norm": 0.8793053210734343, "learning_rate": 4.301081894904882e-06, "loss": 0.117, "loss_nan_ranks": 0, "loss_rank_avg": 0.06402565538883209, "step": 4065, "valid_targets_mean": 1666.8, "valid_targets_min": 760 }, { "epoch": 5.6685236768802225, "grad_norm": 0.8736445128719057, "learning_rate": 4.258142856796779e-06, "loss": 0.111, "loss_nan_ranks": 0, "loss_rank_avg": 0.04810625687241554, "step": 4070, "valid_targets_mean": 1319.6, "valid_targets_min": 1046 }, { "epoch": 5.6754874651810585, "grad_norm": 0.9146961523812506, "learning_rate": 4.21539368246253e-06, "loss": 0.1235, "loss_nan_ranks": 0, "loss_rank_avg": 0.06791988015174866, "step": 4075, "valid_targets_mean": 1727.9, "valid_targets_min": 851 }, { "epoch": 5.6824512534818945, "grad_norm": 0.8950204260314059, "learning_rate": 4.172834887503277e-06, "loss": 0.1226, "loss_nan_ranks": 0, "loss_rank_avg": 0.06217281520366669, "step": 4080, "valid_targets_mean": 1643.2, "valid_targets_min": 907 }, { "epoch": 5.68941504178273, "grad_norm": 0.8625659343005182, "learning_rate": 4.1304669852239865e-06, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.052721407264471054, "step": 4085, "valid_targets_mean": 1478.5, "valid_targets_min": 764 }, { "epoch": 5.696378830083566, "grad_norm": 0.8423037084637137, "learning_rate": 4.088290486627249e-06, "loss": 0.1117, "loss_nan_ranks": 0, "loss_rank_avg": 0.051760852336883545, "step": 4090, "valid_targets_mean": 1522.6, "valid_targets_min": 822 }, { "epoch": 5.703342618384401, "grad_norm": 0.7986133696863431, "learning_rate": 4.046305900407123e-06, "loss": 0.1089, "loss_nan_ranks": 0, "loss_rank_avg": 0.05744687840342522, "step": 4095, "valid_targets_mean": 1589.0, "valid_targets_min": 982 }, { "epoch": 5.710306406685237, "grad_norm": 0.8247019511544061, "learning_rate": 4.004513732943001e-06, "loss": 0.1217, "loss_nan_ranks": 0, "loss_rank_avg": 0.05563589930534363, "step": 4100, "valid_targets_mean": 1574.8, "valid_targets_min": 816 }, { "epoch": 5.717270194986073, "grad_norm": 0.8220162581325487, "learning_rate": 3.962914488293487e-06, "loss": 0.1119, "loss_nan_ranks": 0, "loss_rank_avg": 0.05360320955514908, "step": 4105, "valid_targets_mean": 1422.0, "valid_targets_min": 721 }, { "epoch": 5.724233983286908, "grad_norm": 0.8640387086170787, "learning_rate": 3.921508668190337e-06, "loss": 0.1102, "loss_nan_ranks": 0, "loss_rank_avg": 0.04421108961105347, "step": 4110, "valid_targets_mean": 1150.6, "valid_targets_min": 741 }, { "epoch": 5.731197771587744, "grad_norm": 0.9963080986309333, "learning_rate": 3.8802967720323944e-06, "loss": 0.116, "loss_nan_ranks": 0, "loss_rank_avg": 0.0667385682463646, "step": 4115, "valid_targets_mean": 1684.2, "valid_targets_min": 734 }, { "epoch": 5.73816155988858, "grad_norm": 0.9033327920465504, "learning_rate": 3.839279296879566e-06, "loss": 0.122, "loss_nan_ranks": 0, "loss_rank_avg": 0.07596944272518158, "step": 4120, "valid_targets_mean": 1937.1, "valid_targets_min": 744 }, { "epoch": 5.745125348189415, "grad_norm": 0.9201337682269749, "learning_rate": 3.7984567374468495e-06, "loss": 0.1182, "loss_nan_ranks": 0, "loss_rank_avg": 0.06649009138345718, "step": 4125, "valid_targets_mean": 1842.2, "valid_targets_min": 620 }, { "epoch": 5.752089136490251, "grad_norm": 0.8638321399247245, "learning_rate": 3.757829586098334e-06, "loss": 0.1111, "loss_nan_ranks": 0, "loss_rank_avg": 0.06432803720235825, "step": 4130, "valid_targets_mean": 1637.6, "valid_targets_min": 785 }, { "epoch": 5.759052924791086, "grad_norm": 0.8229387884326227, "learning_rate": 3.717398332841269e-06, "loss": 0.1196, "loss_nan_ranks": 0, "loss_rank_avg": 0.06425435841083527, "step": 4135, "valid_targets_mean": 1969.9, "valid_targets_min": 740 }, { "epoch": 5.766016713091922, "grad_norm": 0.9669615015698776, "learning_rate": 3.6771634653201726e-06, "loss": 0.1116, "loss_nan_ranks": 0, "loss_rank_avg": 0.054495103657245636, "step": 4140, "valid_targets_mean": 1432.1, "valid_targets_min": 711 }, { "epoch": 5.772980501392758, "grad_norm": 0.7975239579352195, "learning_rate": 3.6371254688109493e-06, "loss": 0.1163, "loss_nan_ranks": 0, "loss_rank_avg": 0.06108352169394493, "step": 4145, "valid_targets_mean": 1695.6, "valid_targets_min": 1122 }, { "epoch": 5.779944289693593, "grad_norm": 0.8324320935247468, "learning_rate": 3.5972848262150084e-06, "loss": 0.1145, "loss_nan_ranks": 0, "loss_rank_avg": 0.06076567620038986, "step": 4150, "valid_targets_mean": 1524.5, "valid_targets_min": 722 }, { "epoch": 5.786908077994429, "grad_norm": 0.8295223085601157, "learning_rate": 3.5576420180534666e-06, "loss": 0.1109, "loss_nan_ranks": 0, "loss_rank_avg": 0.052539028227329254, "step": 4155, "valid_targets_mean": 1289.2, "valid_targets_min": 661 }, { "epoch": 5.793871866295264, "grad_norm": 0.8688174214233373, "learning_rate": 3.518197522461344e-06, "loss": 0.1093, "loss_nan_ranks": 0, "loss_rank_avg": 0.05658646672964096, "step": 4160, "valid_targets_mean": 1519.5, "valid_targets_min": 1011 }, { "epoch": 5.8008356545961, "grad_norm": 0.8560277889635767, "learning_rate": 3.4789518151817926e-06, "loss": 0.1182, "loss_nan_ranks": 0, "loss_rank_avg": 0.0627206489443779, "step": 4165, "valid_targets_mean": 1731.4, "valid_targets_min": 1277 }, { "epoch": 5.807799442896936, "grad_norm": 0.8221705464226036, "learning_rate": 3.43990536956037e-06, "loss": 0.1132, "loss_nan_ranks": 0, "loss_rank_avg": 0.05920272320508957, "step": 4170, "valid_targets_mean": 1486.1, "valid_targets_min": 807 }, { "epoch": 5.814763231197771, "grad_norm": 0.8332753209312879, "learning_rate": 3.4010586565393176e-06, "loss": 0.1139, "loss_nan_ranks": 0, "loss_rank_avg": 0.057332780212163925, "step": 4175, "valid_targets_mean": 1549.9, "valid_targets_min": 679 }, { "epoch": 5.821727019498607, "grad_norm": 0.8619887271447355, "learning_rate": 3.36241214465189e-06, "loss": 0.116, "loss_nan_ranks": 0, "loss_rank_avg": 0.05862189084291458, "step": 4180, "valid_targets_mean": 1656.0, "valid_targets_min": 1294 }, { "epoch": 5.828690807799443, "grad_norm": 0.8103161574226729, "learning_rate": 3.323966300016699e-06, "loss": 0.1199, "loss_nan_ranks": 0, "loss_rank_avg": 0.053418777883052826, "step": 4185, "valid_targets_mean": 1368.8, "valid_targets_min": 790 }, { "epoch": 5.835654596100278, "grad_norm": 0.8465138226795567, "learning_rate": 3.285721586332089e-06, "loss": 0.1161, "loss_nan_ranks": 0, "loss_rank_avg": 0.06450681388378143, "step": 4190, "valid_targets_mean": 1765.8, "valid_targets_min": 592 }, { "epoch": 5.842618384401114, "grad_norm": 0.8341389356508091, "learning_rate": 3.247678464870556e-06, "loss": 0.1161, "loss_nan_ranks": 0, "loss_rank_avg": 0.0624236986041069, "step": 4195, "valid_targets_mean": 1586.8, "valid_targets_min": 662 }, { "epoch": 5.84958217270195, "grad_norm": 0.9648828608657739, "learning_rate": 3.2098373944731696e-06, "loss": 0.114, "loss_nan_ranks": 0, "loss_rank_avg": 0.05213096737861633, "step": 4200, "valid_targets_mean": 1336.9, "valid_targets_min": 622 }, { "epoch": 5.8565459610027855, "grad_norm": 0.8693836846048845, "learning_rate": 3.1721988315440467e-06, "loss": 0.113, "loss_nan_ranks": 0, "loss_rank_avg": 0.03882891684770584, "step": 4205, "valid_targets_mean": 1097.1, "valid_targets_min": 625 }, { "epoch": 5.8635097493036215, "grad_norm": 0.8889935458275575, "learning_rate": 3.1347632300448528e-06, "loss": 0.1223, "loss_nan_ranks": 0, "loss_rank_avg": 0.05130942910909653, "step": 4210, "valid_targets_mean": 1484.9, "valid_targets_min": 888 }, { "epoch": 5.870473537604457, "grad_norm": 0.8950418860834436, "learning_rate": 3.0975310414893147e-06, "loss": 0.1216, "loss_nan_ranks": 0, "loss_rank_avg": 0.06308726966381073, "step": 4215, "valid_targets_mean": 1757.0, "valid_targets_min": 635 }, { "epoch": 5.8774373259052926, "grad_norm": 0.9448517682773246, "learning_rate": 3.060502714937772e-06, "loss": 0.116, "loss_nan_ranks": 0, "loss_rank_avg": 0.06284761428833008, "step": 4220, "valid_targets_mean": 1476.1, "valid_targets_min": 522 }, { "epoch": 5.884401114206128, "grad_norm": 0.8513582848638479, "learning_rate": 3.023678696991774e-06, "loss": 0.1155, "loss_nan_ranks": 0, "loss_rank_avg": 0.04917547106742859, "step": 4225, "valid_targets_mean": 1230.9, "valid_targets_min": 697 }, { "epoch": 5.891364902506964, "grad_norm": 0.8380241944756079, "learning_rate": 2.9870594317887012e-06, "loss": 0.109, "loss_nan_ranks": 0, "loss_rank_avg": 0.060824502259492874, "step": 4230, "valid_targets_mean": 1671.0, "valid_targets_min": 1010 }, { "epoch": 5.8983286908078, "grad_norm": 0.9611502718725131, "learning_rate": 2.950645360996378e-06, "loss": 0.111, "loss_nan_ranks": 0, "loss_rank_avg": 0.05260036140680313, "step": 4235, "valid_targets_mean": 1411.0, "valid_targets_min": 769 }, { "epoch": 5.905292479108635, "grad_norm": 0.8900339205155612, "learning_rate": 2.914436923807773e-06, "loss": 0.115, "loss_nan_ranks": 0, "loss_rank_avg": 0.04677753150463104, "step": 4240, "valid_targets_mean": 1298.6, "valid_targets_min": 745 }, { "epoch": 5.912256267409471, "grad_norm": 0.8870011470624816, "learning_rate": 2.878434556935672e-06, "loss": 0.1108, "loss_nan_ranks": 0, "loss_rank_avg": 0.042783405631780624, "step": 4245, "valid_targets_mean": 1118.9, "valid_targets_min": 680 }, { "epoch": 5.919220055710307, "grad_norm": 0.8118186588287939, "learning_rate": 2.8426386946074625e-06, "loss": 0.1112, "loss_nan_ranks": 0, "loss_rank_avg": 0.07259643822908401, "step": 4250, "valid_targets_mean": 1905.9, "valid_targets_min": 1347 }, { "epoch": 5.926183844011142, "grad_norm": 0.9846435636971836, "learning_rate": 2.807049768559844e-06, "loss": 0.1197, "loss_nan_ranks": 0, "loss_rank_avg": 0.08297774195671082, "step": 4255, "valid_targets_mean": 1636.0, "valid_targets_min": 851 }, { "epoch": 5.933147632311978, "grad_norm": 0.89306065477576, "learning_rate": 2.771668208033642e-06, "loss": 0.1139, "loss_nan_ranks": 0, "loss_rank_avg": 0.05090225487947464, "step": 4260, "valid_targets_mean": 1457.2, "valid_targets_min": 903 }, { "epoch": 5.940111420612814, "grad_norm": 0.8381846762533809, "learning_rate": 2.7364944397686356e-06, "loss": 0.1146, "loss_nan_ranks": 0, "loss_rank_avg": 0.05966182425618172, "step": 4265, "valid_targets_mean": 1674.4, "valid_targets_min": 1240 }, { "epoch": 5.947075208913649, "grad_norm": 0.6975382895103197, "learning_rate": 2.7015288879984013e-06, "loss": 0.1174, "loss_nan_ranks": 0, "loss_rank_avg": 0.05049895867705345, "step": 4270, "valid_targets_mean": 1697.1, "valid_targets_min": 917 }, { "epoch": 5.954038997214485, "grad_norm": 0.8183978547191294, "learning_rate": 2.6667719744452037e-06, "loss": 0.1058, "loss_nan_ranks": 0, "loss_rank_avg": 0.05475775897502899, "step": 4275, "valid_targets_mean": 1580.9, "valid_targets_min": 930 }, { "epoch": 5.96100278551532, "grad_norm": 0.8177442897301394, "learning_rate": 2.6322241183149057e-06, "loss": 0.1153, "loss_nan_ranks": 0, "loss_rank_avg": 0.059341538697481155, "step": 4280, "valid_targets_mean": 1655.1, "valid_targets_min": 1227 }, { "epoch": 5.967966573816156, "grad_norm": 0.8272238546293612, "learning_rate": 2.5978857362919054e-06, "loss": 0.1135, "loss_nan_ranks": 0, "loss_rank_avg": 0.05763782560825348, "step": 4285, "valid_targets_mean": 1565.8, "valid_targets_min": 870 }, { "epoch": 5.974930362116992, "grad_norm": 0.9573734999330009, "learning_rate": 2.5637572425341174e-06, "loss": 0.122, "loss_nan_ranks": 0, "loss_rank_avg": 0.06584827601909637, "step": 4290, "valid_targets_mean": 1564.6, "valid_targets_min": 822 }, { "epoch": 5.981894150417827, "grad_norm": 1.1210065324101028, "learning_rate": 2.529839048667997e-06, "loss": 0.1222, "loss_nan_ranks": 0, "loss_rank_avg": 0.05611727386713028, "step": 4295, "valid_targets_mean": 1540.5, "valid_targets_min": 1214 }, { "epoch": 5.988857938718663, "grad_norm": 0.8877917752913989, "learning_rate": 2.4961315637835346e-06, "loss": 0.1124, "loss_nan_ranks": 0, "loss_rank_avg": 0.05314347892999649, "step": 4300, "valid_targets_mean": 1268.6, "valid_targets_min": 591 }, { "epoch": 5.995821727019498, "grad_norm": 0.9062573425634036, "learning_rate": 2.4626351944293435e-06, "loss": 0.1205, "loss_nan_ranks": 0, "loss_rank_avg": 0.04725968837738037, "step": 4305, "valid_targets_mean": 1232.5, "valid_targets_min": 646 }, { "epoch": 6.002785515320334, "grad_norm": 0.9480677409493633, "learning_rate": 2.4293503446077638e-06, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.08825192600488663, "step": 4310, "valid_targets_mean": 8514.0, "valid_targets_min": 6788 }, { "epoch": 6.00974930362117, "grad_norm": 0.8792429695725503, "learning_rate": 2.3962774157699853e-06, "loss": 0.1906, "loss_nan_ranks": 0, "loss_rank_avg": 0.09347966313362122, "step": 4315, "valid_targets_mean": 6668.0, "valid_targets_min": 5933 }, { "epoch": 6.016713091922005, "grad_norm": 0.7256186554172626, "learning_rate": 2.363416806811196e-06, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.07888566702604294, "step": 4320, "valid_targets_mean": 4107.0, "valid_targets_min": 161 }, { "epoch": 6.023676880222841, "grad_norm": 0.5337563605817399, "learning_rate": 2.3307689140657796e-06, "loss": 0.1768, "loss_nan_ranks": 0, "loss_rank_avg": 0.07886291295289993, "step": 4325, "valid_targets_mean": 7946.0, "valid_targets_min": 5596 }, { "epoch": 6.030640668523677, "grad_norm": 0.5250064440886613, "learning_rate": 2.29833413130252e-06, "loss": 0.167, "loss_nan_ranks": 0, "loss_rank_avg": 0.08924835920333862, "step": 4330, "valid_targets_mean": 7392.8, "valid_targets_min": 5629 }, { "epoch": 6.037604456824512, "grad_norm": 1.706269156371303, "learning_rate": 2.2661128497198905e-06, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.08858384191989899, "step": 4335, "valid_targets_mean": 6879.6, "valid_targets_min": 5113 }, { "epoch": 6.044568245125348, "grad_norm": 0.4944795196550045, "learning_rate": 2.234105457941289e-06, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.08616100996732712, "step": 4340, "valid_targets_mean": 6919.5, "valid_targets_min": 5080 }, { "epoch": 6.0515320334261835, "grad_norm": 0.46269857441542933, "learning_rate": 2.202312342010382e-06, "loss": 0.1734, "loss_nan_ranks": 0, "loss_rank_avg": 0.0758790597319603, "step": 4345, "valid_targets_mean": 6377.0, "valid_targets_min": 3939 }, { "epoch": 6.0584958217270195, "grad_norm": 0.46714693312176175, "learning_rate": 2.170733885386431e-06, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.08216223120689392, "step": 4350, "valid_targets_mean": 6392.2, "valid_targets_min": 4355 }, { "epoch": 6.0654596100278555, "grad_norm": 0.6249782828216601, "learning_rate": 2.1393704689396812e-06, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.08479143679141998, "step": 4355, "valid_targets_mean": 5196.5, "valid_targets_min": 137 }, { "epoch": 6.072423398328691, "grad_norm": 0.43679042233173293, "learning_rate": 2.108222470946757e-06, "loss": 0.1624, "loss_nan_ranks": 0, "loss_rank_avg": 0.07390058040618896, "step": 4360, "valid_targets_mean": 7344.4, "valid_targets_min": 5244 }, { "epoch": 6.079387186629527, "grad_norm": 0.43303393100622734, "learning_rate": 2.077290267086105e-06, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.06864619255065918, "step": 4365, "valid_targets_mean": 7921.0, "valid_targets_min": 5311 }, { "epoch": 6.086350974930362, "grad_norm": 0.4246006529195599, "learning_rate": 2.04657423043346e-06, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.08542105555534363, "step": 4370, "valid_targets_mean": 7931.2, "valid_targets_min": 6015 }, { "epoch": 6.093314763231198, "grad_norm": 0.4106570417894629, "learning_rate": 2.016074731457356e-06, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.07517217099666595, "step": 4375, "valid_targets_mean": 7640.8, "valid_targets_min": 5248 }, { "epoch": 6.100278551532034, "grad_norm": 0.4148098516880654, "learning_rate": 1.9857921380146462e-06, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.07737202942371368, "step": 4380, "valid_targets_mean": 7249.6, "valid_targets_min": 5217 }, { "epoch": 6.107242339832869, "grad_norm": 0.4436920181563948, "learning_rate": 1.955726815346053e-06, "loss": 0.1622, "loss_nan_ranks": 0, "loss_rank_avg": 0.08977077901363373, "step": 4385, "valid_targets_mean": 7619.9, "valid_targets_min": 5094 }, { "epoch": 6.114206128133705, "grad_norm": 0.40942198769595695, "learning_rate": 1.9258791260717944e-06, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.07487683743238449, "step": 4390, "valid_targets_mean": 7732.8, "valid_targets_min": 5842 }, { "epoch": 6.121169916434541, "grad_norm": 0.4096948039067667, "learning_rate": 1.896249430187198e-06, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.08216005563735962, "step": 4395, "valid_targets_mean": 7952.9, "valid_targets_min": 5494 }, { "epoch": 6.128133704735376, "grad_norm": 0.5382913217347769, "learning_rate": 1.866838085058349e-06, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.08534446358680725, "step": 4400, "valid_targets_mean": 8001.0, "valid_targets_min": 5454 }, { "epoch": 6.135097493036212, "grad_norm": 0.4993178623034378, "learning_rate": 1.837645445417786e-06, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.05737616866827011, "step": 4405, "valid_targets_mean": 2985.1, "valid_targets_min": 1896 }, { "epoch": 6.142061281337047, "grad_norm": 0.5514824724986366, "learning_rate": 1.8086718633602252e-06, "loss": 0.1294, "loss_nan_ranks": 0, "loss_rank_avg": 0.07018405199050903, "step": 4410, "valid_targets_mean": 6714.6, "valid_targets_min": 4917 }, { "epoch": 6.149025069637883, "grad_norm": 0.4252531390576798, "learning_rate": 1.7799176883383152e-06, "loss": 0.1564, "loss_nan_ranks": 0, "loss_rank_avg": 0.08560578525066376, "step": 4415, "valid_targets_mean": 7595.2, "valid_targets_min": 5488 }, { "epoch": 6.155988857938719, "grad_norm": 0.5092771217817552, "learning_rate": 1.751383267158413e-06, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.08620335161685944, "step": 4420, "valid_targets_mean": 7046.1, "valid_targets_min": 5579 }, { "epoch": 6.162952646239554, "grad_norm": 0.4716862438880787, "learning_rate": 1.7230689439764136e-06, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.07925520837306976, "step": 4425, "valid_targets_mean": 7108.0, "valid_targets_min": 4963 }, { "epoch": 6.16991643454039, "grad_norm": 0.45619274881293254, "learning_rate": 1.694975060293591e-06, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.08042465150356293, "step": 4430, "valid_targets_mean": 6810.1, "valid_targets_min": 5666 }, { "epoch": 6.176880222841225, "grad_norm": 0.3901334892783887, "learning_rate": 1.6671019549524724e-06, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.07437565922737122, "step": 4435, "valid_targets_mean": 8068.5, "valid_targets_min": 5524 }, { "epoch": 6.183844011142061, "grad_norm": 0.40732855082482716, "learning_rate": 1.63944996413278e-06, "loss": 0.1391, "loss_nan_ranks": 0, "loss_rank_avg": 0.06510244309902191, "step": 4440, "valid_targets_mean": 6553.8, "valid_targets_min": 3621 }, { "epoch": 6.190807799442897, "grad_norm": 0.42124118933928567, "learning_rate": 1.612019421347335e-06, "loss": 0.1427, "loss_nan_ranks": 0, "loss_rank_avg": 0.07448364794254303, "step": 4445, "valid_targets_mean": 6762.5, "valid_targets_min": 4968 }, { "epoch": 6.197771587743732, "grad_norm": 0.4383555593223217, "learning_rate": 1.5848106574380694e-06, "loss": 0.1528, "loss_nan_ranks": 0, "loss_rank_avg": 0.07571583241224289, "step": 4450, "valid_targets_mean": 6143.9, "valid_targets_min": 4917 }, { "epoch": 6.204735376044568, "grad_norm": 0.5466494230157721, "learning_rate": 1.5578240005720147e-06, "loss": 0.1383, "loss_nan_ranks": 0, "loss_rank_avg": 0.10035134851932526, "step": 4455, "valid_targets_mean": 4583.8, "valid_targets_min": 215 }, { "epoch": 6.211699164345404, "grad_norm": 0.4040453396697649, "learning_rate": 1.5310597762373624e-06, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.08089716732501984, "step": 4460, "valid_targets_mean": 7317.1, "valid_targets_min": 4948 }, { "epoch": 6.218662952646239, "grad_norm": 0.4727586903795262, "learning_rate": 1.504518307239522e-06, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.08399631083011627, "step": 4465, "valid_targets_mean": 6437.6, "valid_targets_min": 4510 }, { "epoch": 6.225626740947075, "grad_norm": 0.47933738314929225, "learning_rate": 1.478199913697227e-06, "loss": 0.1672, "loss_nan_ranks": 0, "loss_rank_avg": 0.09280038625001907, "step": 4470, "valid_targets_mean": 7707.9, "valid_targets_min": 5796 }, { "epoch": 6.2325905292479105, "grad_norm": 0.41595542358539167, "learning_rate": 1.4521049130386854e-06, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.07995796948671341, "step": 4475, "valid_targets_mean": 7900.9, "valid_targets_min": 5643 }, { "epoch": 6.2395543175487465, "grad_norm": 0.4778381922849063, "learning_rate": 1.4262336199977545e-06, "loss": 0.1614, "loss_nan_ranks": 0, "loss_rank_avg": 0.08848213404417038, "step": 4480, "valid_targets_mean": 7627.2, "valid_targets_min": 5742 }, { "epoch": 6.2465181058495824, "grad_norm": 0.4136225741751865, "learning_rate": 1.4005863466101265e-06, "loss": 0.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.09422549605369568, "step": 4485, "valid_targets_mean": 8725.6, "valid_targets_min": 5141 }, { "epoch": 6.2534818941504176, "grad_norm": 0.5089693736225027, "learning_rate": 1.375163402209576e-06, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.09053859859704971, "step": 4490, "valid_targets_mean": 6967.8, "valid_targets_min": 6088 }, { "epoch": 6.2604456824512535, "grad_norm": 0.4130639739472889, "learning_rate": 1.3499650934242325e-06, "loss": 0.1637, "loss_nan_ranks": 0, "loss_rank_avg": 0.07545335590839386, "step": 4495, "valid_targets_mean": 7140.1, "valid_targets_min": 4834 }, { "epoch": 6.2674094707520895, "grad_norm": 0.43000993148245376, "learning_rate": 1.3249917241728704e-06, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.07579700648784637, "step": 4500, "valid_targets_mean": 6706.9, "valid_targets_min": 5108 }, { "epoch": 6.274373259052925, "grad_norm": 0.5160601513181945, "learning_rate": 1.3002435956612614e-06, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.08105462789535522, "step": 4505, "valid_targets_mean": 5931.4, "valid_targets_min": 4708 }, { "epoch": 6.281337047353761, "grad_norm": 0.44759379754062206, "learning_rate": 1.2757210063785186e-06, "loss": 0.1581, "loss_nan_ranks": 0, "loss_rank_avg": 0.07396161556243896, "step": 4510, "valid_targets_mean": 7145.6, "valid_targets_min": 5280 }, { "epoch": 6.288300835654596, "grad_norm": 0.7344682406855992, "learning_rate": 1.2514242520935182e-06, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.04381747171282768, "step": 4515, "valid_targets_mean": 1554.9, "valid_targets_min": 592 }, { "epoch": 6.295264623955432, "grad_norm": 0.46744454281739256, "learning_rate": 1.2273536258513174e-06, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.09317928552627563, "step": 4520, "valid_targets_mean": 7069.5, "valid_targets_min": 4765 }, { "epoch": 6.302228412256268, "grad_norm": 0.44624650053434495, "learning_rate": 1.2035094179696305e-06, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.08074669539928436, "step": 4525, "valid_targets_mean": 6193.4, "valid_targets_min": 5587 }, { "epoch": 6.309192200557103, "grad_norm": 0.45433035530886273, "learning_rate": 1.1798919160353183e-06, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.0842660665512085, "step": 4530, "valid_targets_mean": 6612.2, "valid_targets_min": 4894 }, { "epoch": 6.316155988857939, "grad_norm": 0.4219263161331273, "learning_rate": 1.1565014049009227e-06, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.07519182562828064, "step": 4535, "valid_targets_mean": 6605.9, "valid_targets_min": 3795 }, { "epoch": 6.323119777158775, "grad_norm": 0.428099298209557, "learning_rate": 1.1333381666812326e-06, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.08015845715999603, "step": 4540, "valid_targets_mean": 7186.8, "valid_targets_min": 4890 }, { "epoch": 6.33008356545961, "grad_norm": 0.5405733766441226, "learning_rate": 1.110402480749886e-06, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.08327323198318481, "step": 4545, "valid_targets_mean": 6544.4, "valid_targets_min": 4615 }, { "epoch": 6.337047353760446, "grad_norm": 0.48862459251110824, "learning_rate": 1.0876946237359887e-06, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.0856969878077507, "step": 4550, "valid_targets_mean": 6339.2, "valid_targets_min": 4798 }, { "epoch": 6.344011142061281, "grad_norm": 0.5591305131293233, "learning_rate": 1.0652148695207809e-06, "loss": 0.1176, "loss_nan_ranks": 0, "loss_rank_avg": 0.08373311161994934, "step": 4555, "valid_targets_mean": 4558.8, "valid_targets_min": 148 }, { "epoch": 6.350974930362117, "grad_norm": 0.4694300456582176, "learning_rate": 1.042963489234341e-06, "loss": 0.159, "loss_nan_ranks": 0, "loss_rank_avg": 0.08754730969667435, "step": 4560, "valid_targets_mean": 6807.9, "valid_targets_min": 5164 }, { "epoch": 6.357938718662953, "grad_norm": 0.4564231493271595, "learning_rate": 1.0209407512523194e-06, "loss": 0.1522, "loss_nan_ranks": 0, "loss_rank_avg": 0.07847484946250916, "step": 4565, "valid_targets_mean": 7011.8, "valid_targets_min": 4974 }, { "epoch": 6.364902506963788, "grad_norm": 0.44585558276766535, "learning_rate": 9.99146921192682e-07, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.07176651060581207, "step": 4570, "valid_targets_mean": 5794.2, "valid_targets_min": 4809 }, { "epoch": 6.371866295264624, "grad_norm": 0.4586375643278151, "learning_rate": 9.775822619125242e-07, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.06948361545801163, "step": 4575, "valid_targets_mean": 6401.8, "valid_targets_min": 4842 }, { "epoch": 6.378830083565459, "grad_norm": 0.4501958201734831, "learning_rate": 9.562470335048912e-07, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.07945942133665085, "step": 4580, "valid_targets_mean": 6182.1, "valid_targets_min": 5116 }, { "epoch": 6.385793871866295, "grad_norm": 0.4327240600935404, "learning_rate": 9.351414932956482e-07, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.0714079886674881, "step": 4585, "valid_targets_mean": 6165.1, "valid_targets_min": 5764 }, { "epoch": 6.392757660167131, "grad_norm": 0.8047252344536302, "learning_rate": 9.142658958403694e-07, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.05607593059539795, "step": 4590, "valid_targets_mean": 1428.2, "valid_targets_min": 1062 }, { "epoch": 6.399721448467966, "grad_norm": 0.8195753374003149, "learning_rate": 8.936204929212766e-07, "loss": 0.1329, "loss_nan_ranks": 0, "loss_rank_avg": 0.06777313351631165, "step": 4595, "valid_targets_mean": 1663.0, "valid_targets_min": 960 }, { "epoch": 6.406685236768802, "grad_norm": 0.833685966360577, "learning_rate": 8.732055335441902e-07, "loss": 0.1253, "loss_nan_ranks": 0, "loss_rank_avg": 0.06374421715736389, "step": 4600, "valid_targets_mean": 1476.5, "valid_targets_min": 933 }, { "epoch": 6.413649025069638, "grad_norm": 0.780358085772891, "learning_rate": 8.530212639355384e-07, "loss": 0.1247, "loss_nan_ranks": 0, "loss_rank_avg": 0.06148510053753853, "step": 4605, "valid_targets_mean": 1478.1, "valid_targets_min": 881 }, { "epoch": 6.420612813370473, "grad_norm": 0.890308955107473, "learning_rate": 8.330679275393816e-07, "loss": 0.1272, "loss_nan_ranks": 0, "loss_rank_avg": 0.07429173588752747, "step": 4610, "valid_targets_mean": 1640.6, "valid_targets_min": 869 }, { "epoch": 6.427576601671309, "grad_norm": 0.9489952322841751, "learning_rate": 8.133457650144705e-07, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.06858045607805252, "step": 4615, "valid_targets_mean": 1709.0, "valid_targets_min": 1090 }, { "epoch": 6.4345403899721445, "grad_norm": 0.8409646954850704, "learning_rate": 7.938550142313594e-07, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.046157389879226685, "step": 4620, "valid_targets_mean": 1157.9, "valid_targets_min": 761 }, { "epoch": 6.4415041782729805, "grad_norm": 0.7487722194005665, "learning_rate": 7.7459591026952e-07, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.05890098214149475, "step": 4625, "valid_targets_mean": 1553.6, "valid_targets_min": 1241 }, { "epoch": 6.4484679665738165, "grad_norm": 0.7904874191930988, "learning_rate": 7.555686854145184e-07, "loss": 0.117, "loss_nan_ranks": 0, "loss_rank_avg": 0.05734875053167343, "step": 4630, "valid_targets_mean": 1538.1, "valid_targets_min": 733 }, { "epoch": 6.455431754874652, "grad_norm": 0.792386346804611, "learning_rate": 7.367735691552047e-07, "loss": 0.1231, "loss_nan_ranks": 0, "loss_rank_avg": 0.03880469501018524, "step": 4635, "valid_targets_mean": 1250.6, "valid_targets_min": 835 }, { "epoch": 6.462395543175488, "grad_norm": 0.860965341679149, "learning_rate": 7.182107881809486e-07, "loss": 0.1115, "loss_nan_ranks": 0, "loss_rank_avg": 0.06356509774923325, "step": 4640, "valid_targets_mean": 1596.2, "valid_targets_min": 1046 }, { "epoch": 6.469359331476323, "grad_norm": 0.8718675926426537, "learning_rate": 6.998805663789077e-07, "loss": 0.1212, "loss_nan_ranks": 0, "loss_rank_avg": 0.05807361379265785, "step": 4645, "valid_targets_mean": 1646.5, "valid_targets_min": 797 }, { "epoch": 6.476323119777159, "grad_norm": 0.8164546555462905, "learning_rate": 6.817831248313279e-07, "loss": 0.1123, "loss_nan_ranks": 0, "loss_rank_avg": 0.05345907807350159, "step": 4650, "valid_targets_mean": 1448.9, "valid_targets_min": 570 }, { "epoch": 6.483286908077995, "grad_norm": 0.7688143714918261, "learning_rate": 6.639186818128696e-07, "loss": 0.1069, "loss_nan_ranks": 0, "loss_rank_avg": 0.04237380996346474, "step": 4655, "valid_targets_mean": 1164.1, "valid_targets_min": 548 }, { "epoch": 6.49025069637883, "grad_norm": 0.8494248149460677, "learning_rate": 6.462874527879859e-07, "loss": 0.108, "loss_nan_ranks": 0, "loss_rank_avg": 0.05192333832383156, "step": 4660, "valid_targets_mean": 1338.0, "valid_targets_min": 682 }, { "epoch": 6.497214484679666, "grad_norm": 0.9725150847641078, "learning_rate": 6.288896504083019e-07, "loss": 0.1176, "loss_nan_ranks": 0, "loss_rank_avg": 0.06402169167995453, "step": 4665, "valid_targets_mean": 1632.8, "valid_targets_min": 896 }, { "epoch": 6.504178272980502, "grad_norm": 0.8615786174263845, "learning_rate": 6.117254845100884e-07, "loss": 0.115, "loss_nan_ranks": 0, "loss_rank_avg": 0.0654836893081665, "step": 4670, "valid_targets_mean": 1806.5, "valid_targets_min": 597 }, { "epoch": 6.511142061281337, "grad_norm": 0.8339197139282923, "learning_rate": 5.947951621116899e-07, "loss": 0.1197, "loss_nan_ranks": 0, "loss_rank_avg": 0.049058057367801666, "step": 4675, "valid_targets_mean": 1289.9, "valid_targets_min": 706 }, { "epoch": 6.518105849582173, "grad_norm": 0.7968481465627608, "learning_rate": 5.78098887411056e-07, "loss": 0.1137, "loss_nan_ranks": 0, "loss_rank_avg": 0.04030627757310867, "step": 4680, "valid_targets_mean": 1354.1, "valid_targets_min": 754 }, { "epoch": 6.525069637883008, "grad_norm": 0.7476070454913744, "learning_rate": 5.616368617832657e-07, "loss": 0.1139, "loss_nan_ranks": 0, "loss_rank_avg": 0.049573637545108795, "step": 4685, "valid_targets_mean": 1461.9, "valid_targets_min": 819 }, { "epoch": 6.532033426183844, "grad_norm": 1.0053730974789308, "learning_rate": 5.454092837781e-07, "loss": 0.1164, "loss_nan_ranks": 0, "loss_rank_avg": 0.041574910283088684, "step": 4690, "valid_targets_mean": 1225.5, "valid_targets_min": 684 }, { "epoch": 6.53899721448468, "grad_norm": 0.9520563364369184, "learning_rate": 5.294163491176507e-07, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.05617387592792511, "step": 4695, "valid_targets_mean": 1282.2, "valid_targets_min": 711 }, { "epoch": 6.545961002785515, "grad_norm": 1.2484349046028755, "learning_rate": 5.136582506939558e-07, "loss": 0.1108, "loss_nan_ranks": 0, "loss_rank_avg": 0.06170322746038437, "step": 4700, "valid_targets_mean": 1634.8, "valid_targets_min": 1190 }, { "epoch": 6.552924791086351, "grad_norm": 0.8277215108085088, "learning_rate": 4.981351785666788e-07, "loss": 0.1073, "loss_nan_ranks": 0, "loss_rank_avg": 0.05962364748120308, "step": 4705, "valid_targets_mean": 1615.9, "valid_targets_min": 774 }, { "epoch": 6.559888579387186, "grad_norm": 1.256443333024305, "learning_rate": 4.828473199608086e-07, "loss": 0.1114, "loss_nan_ranks": 0, "loss_rank_avg": 0.062144938856363297, "step": 4710, "valid_targets_mean": 1848.4, "valid_targets_min": 734 }, { "epoch": 6.566852367688022, "grad_norm": 0.8519945991274293, "learning_rate": 4.6779485926440994e-07, "loss": 0.1102, "loss_nan_ranks": 0, "loss_rank_avg": 0.06112103536725044, "step": 4715, "valid_targets_mean": 1570.6, "valid_targets_min": 1011 }, { "epoch": 6.573816155988858, "grad_norm": 0.8867015908107557, "learning_rate": 4.529779780263899e-07, "loss": 0.1188, "loss_nan_ranks": 0, "loss_rank_avg": 0.06696411967277527, "step": 4720, "valid_targets_mean": 1697.0, "valid_targets_min": 803 }, { "epoch": 6.580779944289693, "grad_norm": 0.8971331539026275, "learning_rate": 4.3839685495431494e-07, "loss": 0.1156, "loss_nan_ranks": 0, "loss_rank_avg": 0.05167017877101898, "step": 4725, "valid_targets_mean": 1307.1, "valid_targets_min": 782 }, { "epoch": 6.587743732590529, "grad_norm": 0.8240677573070857, "learning_rate": 4.240516659122529e-07, "loss": 0.1112, "loss_nan_ranks": 0, "loss_rank_avg": 0.05892687290906906, "step": 4730, "valid_targets_mean": 1596.6, "valid_targets_min": 646 }, { "epoch": 6.594707520891365, "grad_norm": 0.8777230504903879, "learning_rate": 4.099425839186588e-07, "loss": 0.1169, "loss_nan_ranks": 0, "loss_rank_avg": 0.07540211081504822, "step": 4735, "valid_targets_mean": 1817.5, "valid_targets_min": 922 }, { "epoch": 6.6016713091922, "grad_norm": 0.9233129928932025, "learning_rate": 3.960697791442725e-07, "loss": 0.1185, "loss_nan_ranks": 0, "loss_rank_avg": 0.06853315234184265, "step": 4740, "valid_targets_mean": 1822.2, "valid_targets_min": 796 }, { "epoch": 6.608635097493036, "grad_norm": 0.8365359905989758, "learning_rate": 3.824334189100864e-07, "loss": 0.1067, "loss_nan_ranks": 0, "loss_rank_avg": 0.05597367510199547, "step": 4745, "valid_targets_mean": 1542.4, "valid_targets_min": 903 }, { "epoch": 6.615598885793872, "grad_norm": 0.8653881395676635, "learning_rate": 3.6903366768530347e-07, "loss": 0.1093, "loss_nan_ranks": 0, "loss_rank_avg": 0.059465356171131134, "step": 4750, "valid_targets_mean": 1459.5, "valid_targets_min": 780 }, { "epoch": 6.6225626740947074, "grad_norm": 1.0220209875020088, "learning_rate": 3.558706870853801e-07, "loss": 0.1059, "loss_nan_ranks": 0, "loss_rank_avg": 0.05482107773423195, "step": 4755, "valid_targets_mean": 1581.1, "valid_targets_min": 783 }, { "epoch": 6.629526462395543, "grad_norm": 0.8895541017805985, "learning_rate": 3.42944635870055e-07, "loss": 0.1085, "loss_nan_ranks": 0, "loss_rank_avg": 0.04831491783261299, "step": 4760, "valid_targets_mean": 1342.1, "valid_targets_min": 662 }, { "epoch": 6.6364902506963785, "grad_norm": 0.85022678615267, "learning_rate": 3.302556699414461e-07, "loss": 0.1065, "loss_nan_ranks": 0, "loss_rank_avg": 0.04755166172981262, "step": 4765, "valid_targets_mean": 1269.1, "valid_targets_min": 724 }, { "epoch": 6.6434540389972145, "grad_norm": 0.9159333691892194, "learning_rate": 3.178039423421675e-07, "loss": 0.1092, "loss_nan_ranks": 0, "loss_rank_avg": 0.05955637991428375, "step": 4770, "valid_targets_mean": 1510.1, "valid_targets_min": 966 }, { "epoch": 6.65041782729805, "grad_norm": 0.8794943394432526, "learning_rate": 3.055896032534844e-07, "loss": 0.1116, "loss_nan_ranks": 0, "loss_rank_avg": 0.04700024425983429, "step": 4775, "valid_targets_mean": 1327.8, "valid_targets_min": 773 }, { "epoch": 6.657381615598886, "grad_norm": 1.0648559373125812, "learning_rate": 2.9361279999349456e-07, "loss": 0.1072, "loss_nan_ranks": 0, "loss_rank_avg": 0.0473455972969532, "step": 4780, "valid_targets_mean": 1353.2, "valid_targets_min": 807 }, { "epoch": 6.664345403899722, "grad_norm": 0.8462867733368669, "learning_rate": 2.8187367701536514e-07, "loss": 0.1106, "loss_nan_ranks": 0, "loss_rank_avg": 0.0411439947783947, "step": 4785, "valid_targets_mean": 1142.5, "valid_targets_min": 782 }, { "epoch": 6.671309192200557, "grad_norm": 0.8759881208699287, "learning_rate": 2.7037237590557874e-07, "loss": 0.1082, "loss_nan_ranks": 0, "loss_rank_avg": 0.06818887591362, "step": 4790, "valid_targets_mean": 1849.9, "valid_targets_min": 634 }, { "epoch": 6.678272980501393, "grad_norm": 0.8652916414354441, "learning_rate": 2.591090353822279e-07, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.05813930183649063, "step": 4795, "valid_targets_mean": 1599.6, "valid_targets_min": 573 }, { "epoch": 6.685236768802229, "grad_norm": 0.8289668185741821, "learning_rate": 2.480837912933476e-07, "loss": 0.1141, "loss_nan_ranks": 0, "loss_rank_avg": 0.06298094987869263, "step": 4800, "valid_targets_mean": 1994.9, "valid_targets_min": 1102 }, { "epoch": 6.692200557103064, "grad_norm": 0.8437774991054501, "learning_rate": 2.372967766152745e-07, "loss": 0.1149, "loss_nan_ranks": 0, "loss_rank_avg": 0.04422305151820183, "step": 4805, "valid_targets_mean": 1239.2, "valid_targets_min": 841 }, { "epoch": 6.6991643454039, "grad_norm": 0.8335016224230695, "learning_rate": 2.2674812145103253e-07, "loss": 0.1059, "loss_nan_ranks": 0, "loss_rank_avg": 0.04819972813129425, "step": 4810, "valid_targets_mean": 1467.5, "valid_targets_min": 956 }, { "epoch": 6.706128133704736, "grad_norm": 0.9023177270948384, "learning_rate": 2.16437953028783e-07, "loss": 0.1115, "loss_nan_ranks": 0, "loss_rank_avg": 0.05732536315917969, "step": 4815, "valid_targets_mean": 1300.9, "valid_targets_min": 857 }, { "epoch": 6.713091922005571, "grad_norm": 0.8464182537507942, "learning_rate": 2.0636639570027706e-07, "loss": 0.1107, "loss_nan_ranks": 0, "loss_rank_avg": 0.054763518273830414, "step": 4820, "valid_targets_mean": 1389.8, "valid_targets_min": 808 }, { "epoch": 6.720055710306407, "grad_norm": 0.8724602751899221, "learning_rate": 1.9653357093935677e-07, "loss": 0.1042, "loss_nan_ranks": 0, "loss_rank_avg": 0.05148616060614586, "step": 4825, "valid_targets_mean": 1303.8, "valid_targets_min": 677 }, { "epoch": 6.727019498607242, "grad_norm": 0.892862606177971, "learning_rate": 1.8693959734049194e-07, "loss": 0.1064, "loss_nan_ranks": 0, "loss_rank_avg": 0.04439748823642731, "step": 4830, "valid_targets_mean": 1220.1, "valid_targets_min": 727 }, { "epoch": 6.733983286908078, "grad_norm": 0.8006054734140239, "learning_rate": 1.7758459061735235e-07, "loss": 0.1099, "loss_nan_ranks": 0, "loss_rank_avg": 0.04145853966474533, "step": 4835, "valid_targets_mean": 1262.0, "valid_targets_min": 726 }, { "epoch": 6.740947075208914, "grad_norm": 0.9012716233194072, "learning_rate": 1.6846866360140434e-07, "loss": 0.118, "loss_nan_ranks": 0, "loss_rank_avg": 0.06492114067077637, "step": 4840, "valid_targets_mean": 1615.0, "valid_targets_min": 669 }, { "epoch": 6.747910863509749, "grad_norm": 0.8349181470475844, "learning_rate": 1.595919262405632e-07, "loss": 0.1111, "loss_nan_ranks": 0, "loss_rank_avg": 0.05895448848605156, "step": 4845, "valid_targets_mean": 1806.5, "valid_targets_min": 792 }, { "epoch": 6.754874651810585, "grad_norm": 0.8116954418998069, "learning_rate": 1.5095448559785176e-07, "loss": 0.1073, "loss_nan_ranks": 0, "loss_rank_avg": 0.05427628010511398, "step": 4850, "valid_targets_mean": 1627.6, "valid_targets_min": 736 }, { "epoch": 6.76183844011142, "grad_norm": 0.8820001141515799, "learning_rate": 1.425564458501194e-07, "loss": 0.1152, "loss_nan_ranks": 0, "loss_rank_avg": 0.07305572926998138, "step": 4855, "valid_targets_mean": 1822.9, "valid_targets_min": 694 }, { "epoch": 6.768802228412256, "grad_norm": 0.8785588698821919, "learning_rate": 1.3439790828678523e-07, "loss": 0.1075, "loss_nan_ranks": 0, "loss_rank_avg": 0.06912118941545486, "step": 4860, "valid_targets_mean": 1848.9, "valid_targets_min": 1437 }, { "epoch": 6.775766016713092, "grad_norm": 0.8363864610673993, "learning_rate": 1.2647897130860566e-07, "loss": 0.1113, "loss_nan_ranks": 0, "loss_rank_avg": 0.06591206789016724, "step": 4865, "valid_targets_mean": 1852.4, "valid_targets_min": 809 }, { "epoch": 6.782729805013927, "grad_norm": 0.8474827648363192, "learning_rate": 1.187997304265065e-07, "loss": 0.108, "loss_nan_ranks": 0, "loss_rank_avg": 0.05124801769852638, "step": 4870, "valid_targets_mean": 1375.5, "valid_targets_min": 790 }, { "epoch": 6.789693593314763, "grad_norm": 0.8696793467523222, "learning_rate": 1.1136027826040841e-07, "loss": 0.102, "loss_nan_ranks": 0, "loss_rank_avg": 0.048445772379636765, "step": 4875, "valid_targets_mean": 1338.8, "valid_targets_min": 750 }, { "epoch": 6.796657381615599, "grad_norm": 0.9202757557686742, "learning_rate": 1.041607045381321e-07, "loss": 0.1109, "loss_nan_ranks": 0, "loss_rank_avg": 0.06679531186819077, "step": 4880, "valid_targets_mean": 1778.8, "valid_targets_min": 826 }, { "epoch": 6.803621169916434, "grad_norm": 0.8516595011162112, "learning_rate": 9.720109609429928e-08, "loss": 0.1121, "loss_nan_ranks": 0, "loss_rank_avg": 0.05206713080406189, "step": 4885, "valid_targets_mean": 1600.8, "valid_targets_min": 907 }, { "epoch": 6.81058495821727, "grad_norm": 0.8400966183501765, "learning_rate": 9.04815368692935e-08, "loss": 0.1044, "loss_nan_ranks": 0, "loss_rank_avg": 0.05995471403002739, "step": 4890, "valid_targets_mean": 1474.5, "valid_targets_min": 1093 }, { "epoch": 6.8175487465181055, "grad_norm": 0.8562520722201993, "learning_rate": 8.400210790824536e-08, "loss": 0.109, "loss_nan_ranks": 0, "loss_rank_avg": 0.06154263764619827, "step": 4895, "valid_targets_mean": 1577.2, "valid_targets_min": 1119 }, { "epoch": 6.8245125348189415, "grad_norm": 0.8814865307617711, "learning_rate": 7.776288736005776e-08, "loss": 0.1132, "loss_nan_ranks": 0, "loss_rank_avg": 0.06116368994116783, "step": 4900, "valid_targets_mean": 1512.1, "valid_targets_min": 700 }, { "epoch": 6.8314763231197775, "grad_norm": 0.816015444670367, "learning_rate": 7.176395047645557e-08, "loss": 0.11, "loss_nan_ranks": 0, "loss_rank_avg": 0.0455644354224205, "step": 4905, "valid_targets_mean": 1288.2, "valid_targets_min": 810 }, { "epoch": 6.838440111420613, "grad_norm": 0.9432317625659447, "learning_rate": 6.600536961109072e-08, "loss": 0.1136, "loss_nan_ranks": 0, "loss_rank_avg": 0.052437908947467804, "step": 4910, "valid_targets_mean": 1328.9, "valid_targets_min": 635 }, { "epoch": 6.845403899721449, "grad_norm": 0.8794044449829441, "learning_rate": 6.048721421865633e-08, "loss": 0.1057, "loss_nan_ranks": 0, "loss_rank_avg": 0.059289056807756424, "step": 4915, "valid_targets_mean": 1542.5, "valid_targets_min": 673 }, { "epoch": 6.852367688022284, "grad_norm": 0.9326004661735458, "learning_rate": 5.5209550854058435e-08, "loss": 0.1152, "loss_nan_ranks": 0, "loss_rank_avg": 0.06115001440048218, "step": 4920, "valid_targets_mean": 1215.6, "valid_targets_min": 641 }, { "epoch": 6.85933147632312, "grad_norm": 0.8767540104775717, "learning_rate": 5.017244317160997e-08, "loss": 0.1056, "loss_nan_ranks": 0, "loss_rank_avg": 0.04882102459669113, "step": 4925, "valid_targets_mean": 1222.6, "valid_targets_min": 701 }, { "epoch": 6.866295264623956, "grad_norm": 0.8971771361885165, "learning_rate": 4.537595192425803e-08, "loss": 0.1211, "loss_nan_ranks": 0, "loss_rank_avg": 0.0595490038394928, "step": 4930, "valid_targets_mean": 1850.6, "valid_targets_min": 1202 }, { "epoch": 6.873259052924791, "grad_norm": 0.8299434208974764, "learning_rate": 4.0820134962864525e-08, "loss": 0.1095, "loss_nan_ranks": 0, "loss_rank_avg": 0.044841837137937546, "step": 4935, "valid_targets_mean": 1265.5, "valid_targets_min": 657 }, { "epoch": 6.880222841225627, "grad_norm": 0.901095866607732, "learning_rate": 3.650504723549109e-08, "loss": 0.1125, "loss_nan_ranks": 0, "loss_rank_avg": 0.05367933213710785, "step": 4940, "valid_targets_mean": 1388.0, "valid_targets_min": 672 }, { "epoch": 6.887186629526463, "grad_norm": 0.8315063396628217, "learning_rate": 3.243074078675301e-08, "loss": 0.1088, "loss_nan_ranks": 0, "loss_rank_avg": 0.06695376336574554, "step": 4945, "valid_targets_mean": 1813.6, "valid_targets_min": 1019 }, { "epoch": 6.894150417827298, "grad_norm": 0.8625526799833706, "learning_rate": 2.85972647571775e-08, "loss": 0.1029, "loss_nan_ranks": 0, "loss_rank_avg": 0.044332314282655716, "step": 4950, "valid_targets_mean": 1114.6, "valid_targets_min": 732 }, { "epoch": 6.901114206128134, "grad_norm": 1.0040487494315289, "learning_rate": 2.5004665382619698e-08, "loss": 0.1126, "loss_nan_ranks": 0, "loss_rank_avg": 0.0398283377289772, "step": 4955, "valid_targets_mean": 1194.5, "valid_targets_min": 634 }, { "epoch": 6.908077994428969, "grad_norm": 0.8569836647676721, "learning_rate": 2.1652985993705355e-08, "loss": 0.1055, "loss_nan_ranks": 0, "loss_rank_avg": 0.0556265227496624, "step": 4960, "valid_targets_mean": 1756.5, "valid_targets_min": 905 }, { "epoch": 6.915041782729805, "grad_norm": 0.8794612149843942, "learning_rate": 1.8542267015297932e-08, "loss": 0.1044, "loss_nan_ranks": 0, "loss_rank_avg": 0.06186116486787796, "step": 4965, "valid_targets_mean": 1554.9, "valid_targets_min": 596 }, { "epoch": 6.922005571030641, "grad_norm": 0.8682797357172517, "learning_rate": 1.5672545966025633e-08, "loss": 0.105, "loss_nan_ranks": 0, "loss_rank_avg": 0.0438067801296711, "step": 4970, "valid_targets_mean": 1214.6, "valid_targets_min": 687 }, { "epoch": 6.928969359331476, "grad_norm": 0.8529938938679981, "learning_rate": 1.3043857457819553e-08, "loss": 0.1169, "loss_nan_ranks": 0, "loss_rank_avg": 0.06511755287647247, "step": 4975, "valid_targets_mean": 1955.1, "valid_targets_min": 1199 }, { "epoch": 6.935933147632312, "grad_norm": 0.8325142431206025, "learning_rate": 1.0656233195498466e-08, "loss": 0.1088, "loss_nan_ranks": 0, "loss_rank_avg": 0.059841353446245193, "step": 4980, "valid_targets_mean": 1758.6, "valid_targets_min": 1214 }, { "epoch": 6.942896935933147, "grad_norm": 0.8532395148660459, "learning_rate": 8.509701976382456e-09, "loss": 0.1079, "loss_nan_ranks": 0, "loss_rank_avg": 0.06080895662307739, "step": 4985, "valid_targets_mean": 1711.5, "valid_targets_min": 1122 }, { "epoch": 6.949860724233983, "grad_norm": 0.8576769303500783, "learning_rate": 6.6042896899576324e-09, "loss": 0.1106, "loss_nan_ranks": 0, "loss_rank_avg": 0.051803942769765854, "step": 4990, "valid_targets_mean": 1489.6, "valid_targets_min": 850 }, { "epoch": 6.956824512534819, "grad_norm": 0.7839478511204715, "learning_rate": 4.940019317547506e-09, "loss": 0.0999, "loss_nan_ranks": 0, "loss_rank_avg": 0.049742192029953, "step": 4995, "valid_targets_mean": 1572.4, "valid_targets_min": 1318 }, { "epoch": 6.963788300835654, "grad_norm": 0.8785812149835993, "learning_rate": 3.516910932048756e-09, "loss": 0.1116, "loss_nan_ranks": 0, "loss_rank_avg": 0.060333505272865295, "step": 5000, "valid_targets_mean": 1500.0, "valid_targets_min": 1043 }, { "epoch": 6.97075208913649, "grad_norm": 0.8822603333113546, "learning_rate": 2.3349816976825367e-09, "loss": 0.1113, "loss_nan_ranks": 0, "loss_rank_avg": 0.06858158856630325, "step": 5005, "valid_targets_mean": 1774.9, "valid_targets_min": 920 }, { "epoch": 6.977715877437326, "grad_norm": 0.8367535436815119, "learning_rate": 1.3942458697924211e-09, "loss": 0.118, "loss_nan_ranks": 0, "loss_rank_avg": 0.05870440602302551, "step": 5010, "valid_targets_mean": 1547.1, "valid_targets_min": 847 }, { "epoch": 6.984679665738161, "grad_norm": 0.7917458458759404, "learning_rate": 6.947147946645416e-10, "loss": 0.1116, "loss_nan_ranks": 0, "loss_rank_avg": 0.05920833349227905, "step": 5015, "valid_targets_mean": 1769.4, "valid_targets_min": 738 }, { "epoch": 6.991643454038997, "grad_norm": 0.9106170116332665, "learning_rate": 2.3639690939880613e-10, "loss": 0.1124, "loss_nan_ranks": 0, "loss_rank_avg": 0.06107974797487259, "step": 5020, "valid_targets_mean": 1540.1, "valid_targets_min": 594 }, { "epoch": 6.998607242339833, "grad_norm": 1.1797464944725595, "learning_rate": 1.929774180231547e-11, "loss": 0.1135, "loss_nan_ranks": 0, "loss_rank_avg": 0.06046333163976669, "step": 5025, "valid_targets_mean": 2228.6, "valid_targets_min": 1393 }, { "epoch": 7.0, "step": 5026, "total_flos": 1.6519984675532308e+18, "train_loss": 0.0, "train_runtime": 1.7845, "train_samples_per_second": 45043.632, "train_steps_per_second": 2816.453 } ], "logging_steps": 5, "max_steps": 5026, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 200, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1.6519984675532308e+18, "train_batch_size": 1, "trial_name": null, "trial_params": null }