{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 8169, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.004284490145672665, "grad_norm": 13.494672426000244, "learning_rate": 1.9583843329253365e-07, "loss": 0.6876, "loss_nan_ranks": 0, "loss_rank_avg": 0.3388299345970154, "step": 5, "valid_targets_mean": 4748.4, "valid_targets_min": 2097 }, { "epoch": 0.00856898029134533, "grad_norm": 13.627970120064575, "learning_rate": 4.406364749082008e-07, "loss": 0.6849, "loss_nan_ranks": 0, "loss_rank_avg": 0.3521880507469177, "step": 10, "valid_targets_mean": 5171.9, "valid_targets_min": 2306 }, { "epoch": 0.012853470437017995, "grad_norm": 13.0750137558056, "learning_rate": 6.854345165238678e-07, "loss": 0.6856, "loss_nan_ranks": 0, "loss_rank_avg": 0.37566128373146057, "step": 15, "valid_targets_mean": 5947.0, "valid_targets_min": 4169 }, { "epoch": 0.01713796058269066, "grad_norm": 11.347303801767657, "learning_rate": 9.30232558139535e-07, "loss": 0.6682, "loss_nan_ranks": 0, "loss_rank_avg": 0.30158156156539917, "step": 20, "valid_targets_mean": 5885.1, "valid_targets_min": 3731 }, { "epoch": 0.021422450728363324, "grad_norm": 8.458288031130037, "learning_rate": 1.175030599755202e-06, "loss": 0.6535, "loss_nan_ranks": 0, "loss_rank_avg": 0.3375881314277649, "step": 25, "valid_targets_mean": 5465.9, "valid_targets_min": 2991 }, { "epoch": 0.02570694087403599, "grad_norm": 6.174217503581587, "learning_rate": 1.4198286413708693e-06, "loss": 0.6146, "loss_nan_ranks": 0, "loss_rank_avg": 0.2947828769683838, "step": 30, "valid_targets_mean": 6386.5, "valid_targets_min": 4563 }, { "epoch": 0.029991431019708654, "grad_norm": 5.113168458961102, "learning_rate": 1.6646266829865362e-06, "loss": 0.5942, "loss_nan_ranks": 0, "loss_rank_avg": 0.28605085611343384, "step": 35, "valid_targets_mean": 4906.0, "valid_targets_min": 2785 }, { "epoch": 0.03427592116538132, "grad_norm": 4.466096345198193, "learning_rate": 1.9094247246022034e-06, "loss": 0.5779, "loss_nan_ranks": 0, "loss_rank_avg": 0.28148600459098816, "step": 40, "valid_targets_mean": 4122.8, "valid_targets_min": 2077 }, { "epoch": 0.038560411311053984, "grad_norm": 4.4102843948797235, "learning_rate": 2.1542227662178707e-06, "loss": 0.5303, "loss_nan_ranks": 0, "loss_rank_avg": 0.24403318762779236, "step": 45, "valid_targets_mean": 5068.8, "valid_targets_min": 1885 }, { "epoch": 0.04284490145672665, "grad_norm": 2.5838635468953304, "learning_rate": 2.3990208078335376e-06, "loss": 0.4715, "loss_nan_ranks": 0, "loss_rank_avg": 0.24094364047050476, "step": 50, "valid_targets_mean": 5781.5, "valid_targets_min": 1360 }, { "epoch": 0.04712939160239932, "grad_norm": 1.66427395007336, "learning_rate": 2.6438188494492045e-06, "loss": 0.466, "loss_nan_ranks": 0, "loss_rank_avg": 0.24363049864768982, "step": 55, "valid_targets_mean": 5561.0, "valid_targets_min": 2994 }, { "epoch": 0.05141388174807198, "grad_norm": 1.2843484071788496, "learning_rate": 2.8886168910648714e-06, "loss": 0.4702, "loss_nan_ranks": 0, "loss_rank_avg": 0.18553395569324493, "step": 60, "valid_targets_mean": 4436.9, "valid_targets_min": 2411 }, { "epoch": 0.055698371893744644, "grad_norm": 1.1208170150705083, "learning_rate": 3.1334149326805383e-06, "loss": 0.4611, "loss_nan_ranks": 0, "loss_rank_avg": 0.20919764041900635, "step": 65, "valid_targets_mean": 4674.6, "valid_targets_min": 2789 }, { "epoch": 0.05998286203941731, "grad_norm": 0.8862735321798944, "learning_rate": 3.378212974296206e-06, "loss": 0.4505, "loss_nan_ranks": 0, "loss_rank_avg": 0.17865021526813507, "step": 70, "valid_targets_mean": 4583.2, "valid_targets_min": 1330 }, { "epoch": 0.06426735218508997, "grad_norm": 0.8100500072395349, "learning_rate": 3.623011015911873e-06, "loss": 0.4574, "loss_nan_ranks": 0, "loss_rank_avg": 0.20401369035243988, "step": 75, "valid_targets_mean": 5121.2, "valid_targets_min": 1862 }, { "epoch": 0.06855184233076264, "grad_norm": 0.7408478984723242, "learning_rate": 3.86780905752754e-06, "loss": 0.4241, "loss_nan_ranks": 0, "loss_rank_avg": 0.22882798314094543, "step": 80, "valid_targets_mean": 5859.9, "valid_targets_min": 2694 }, { "epoch": 0.0728363324764353, "grad_norm": 0.6980932774784856, "learning_rate": 4.112607099143207e-06, "loss": 0.415, "loss_nan_ranks": 0, "loss_rank_avg": 0.2240135371685028, "step": 85, "valid_targets_mean": 4830.5, "valid_targets_min": 1794 }, { "epoch": 0.07712082262210797, "grad_norm": 0.5915927033833656, "learning_rate": 4.357405140758874e-06, "loss": 0.4105, "loss_nan_ranks": 0, "loss_rank_avg": 0.2051009237766266, "step": 90, "valid_targets_mean": 6430.6, "valid_targets_min": 4764 }, { "epoch": 0.08140531276778064, "grad_norm": 0.5894205300368119, "learning_rate": 4.6022031823745415e-06, "loss": 0.3988, "loss_nan_ranks": 0, "loss_rank_avg": 0.21032562851905823, "step": 95, "valid_targets_mean": 6892.0, "valid_targets_min": 4453 }, { "epoch": 0.0856898029134533, "grad_norm": 0.6598571392919448, "learning_rate": 4.847001223990209e-06, "loss": 0.3942, "loss_nan_ranks": 0, "loss_rank_avg": 0.21012765169143677, "step": 100, "valid_targets_mean": 4862.1, "valid_targets_min": 1875 }, { "epoch": 0.08997429305912596, "grad_norm": 0.7406760827901361, "learning_rate": 5.091799265605875e-06, "loss": 0.3795, "loss_nan_ranks": 0, "loss_rank_avg": 0.21197551488876343, "step": 105, "valid_targets_mean": 5108.5, "valid_targets_min": 2767 }, { "epoch": 0.09425878320479864, "grad_norm": 0.6224090599201313, "learning_rate": 5.336597307221543e-06, "loss": 0.3819, "loss_nan_ranks": 0, "loss_rank_avg": 0.139212965965271, "step": 110, "valid_targets_mean": 3294.1, "valid_targets_min": 1668 }, { "epoch": 0.09854327335047129, "grad_norm": 0.5436817831194202, "learning_rate": 5.58139534883721e-06, "loss": 0.3826, "loss_nan_ranks": 0, "loss_rank_avg": 0.16008134186267853, "step": 115, "valid_targets_mean": 4258.8, "valid_targets_min": 1850 }, { "epoch": 0.10282776349614396, "grad_norm": 0.527086505076333, "learning_rate": 5.8261933904528765e-06, "loss": 0.3991, "loss_nan_ranks": 0, "loss_rank_avg": 0.20387375354766846, "step": 120, "valid_targets_mean": 5987.6, "valid_targets_min": 4164 }, { "epoch": 0.10711225364181662, "grad_norm": 0.5288720994634073, "learning_rate": 6.070991432068544e-06, "loss": 0.3599, "loss_nan_ranks": 0, "loss_rank_avg": 0.16154056787490845, "step": 125, "valid_targets_mean": 5076.4, "valid_targets_min": 1265 }, { "epoch": 0.11139674378748929, "grad_norm": 0.5757742789735052, "learning_rate": 6.31578947368421e-06, "loss": 0.3566, "loss_nan_ranks": 0, "loss_rank_avg": 0.19382911920547485, "step": 130, "valid_targets_mean": 4982.8, "valid_targets_min": 2004 }, { "epoch": 0.11568123393316196, "grad_norm": 0.4866632046001885, "learning_rate": 6.560587515299878e-06, "loss": 0.3591, "loss_nan_ranks": 0, "loss_rank_avg": 0.1747215837240219, "step": 135, "valid_targets_mean": 6455.6, "valid_targets_min": 2291 }, { "epoch": 0.11996572407883462, "grad_norm": 0.5502088562401298, "learning_rate": 6.805385556915545e-06, "loss": 0.3531, "loss_nan_ranks": 0, "loss_rank_avg": 0.17451369762420654, "step": 140, "valid_targets_mean": 5308.2, "valid_targets_min": 1552 }, { "epoch": 0.12425021422450729, "grad_norm": 0.566485704846439, "learning_rate": 7.050183598531213e-06, "loss": 0.354, "loss_nan_ranks": 0, "loss_rank_avg": 0.18449868261814117, "step": 145, "valid_targets_mean": 4460.1, "valid_targets_min": 1410 }, { "epoch": 0.12853470437017994, "grad_norm": 0.6014576667932432, "learning_rate": 7.29498164014688e-06, "loss": 0.3503, "loss_nan_ranks": 0, "loss_rank_avg": 0.16550466418266296, "step": 150, "valid_targets_mean": 4723.2, "valid_targets_min": 2563 }, { "epoch": 0.1328191945158526, "grad_norm": 0.5678765320233051, "learning_rate": 7.539779681762547e-06, "loss": 0.35, "loss_nan_ranks": 0, "loss_rank_avg": 0.20662416517734528, "step": 155, "valid_targets_mean": 6524.4, "valid_targets_min": 4442 }, { "epoch": 0.13710368466152528, "grad_norm": 0.5209904193861675, "learning_rate": 7.784577723378214e-06, "loss": 0.3441, "loss_nan_ranks": 0, "loss_rank_avg": 0.17364206910133362, "step": 160, "valid_targets_mean": 5728.1, "valid_targets_min": 3117 }, { "epoch": 0.14138817480719795, "grad_norm": 0.5495554877332163, "learning_rate": 8.02937576499388e-06, "loss": 0.3406, "loss_nan_ranks": 0, "loss_rank_avg": 0.19940133392810822, "step": 165, "valid_targets_mean": 5301.6, "valid_targets_min": 2457 }, { "epoch": 0.1456726649528706, "grad_norm": 0.6721459306059137, "learning_rate": 8.274173806609547e-06, "loss": 0.3484, "loss_nan_ranks": 0, "loss_rank_avg": 0.15087860822677612, "step": 170, "valid_targets_mean": 3913.6, "valid_targets_min": 1133 }, { "epoch": 0.14995715509854327, "grad_norm": 0.5139212368391745, "learning_rate": 8.518971848225216e-06, "loss": 0.3418, "loss_nan_ranks": 0, "loss_rank_avg": 0.1852315366268158, "step": 175, "valid_targets_mean": 6394.9, "valid_targets_min": 2348 }, { "epoch": 0.15424164524421594, "grad_norm": 0.6080406124848964, "learning_rate": 8.763769889840882e-06, "loss": 0.3439, "loss_nan_ranks": 0, "loss_rank_avg": 0.2070283591747284, "step": 180, "valid_targets_mean": 5282.9, "valid_targets_min": 501 }, { "epoch": 0.1585261353898886, "grad_norm": 0.5434520776028683, "learning_rate": 9.008567931456548e-06, "loss": 0.3407, "loss_nan_ranks": 0, "loss_rank_avg": 0.13234570622444153, "step": 185, "valid_targets_mean": 3877.6, "valid_targets_min": 988 }, { "epoch": 0.16281062553556128, "grad_norm": 0.5084708583445311, "learning_rate": 9.253365973072217e-06, "loss": 0.3367, "loss_nan_ranks": 0, "loss_rank_avg": 0.18342074751853943, "step": 190, "valid_targets_mean": 6325.2, "valid_targets_min": 4092 }, { "epoch": 0.16709511568123395, "grad_norm": 0.5710666319007862, "learning_rate": 9.498164014687883e-06, "loss": 0.3376, "loss_nan_ranks": 0, "loss_rank_avg": 0.1878889948129654, "step": 195, "valid_targets_mean": 5223.2, "valid_targets_min": 1916 }, { "epoch": 0.1713796058269066, "grad_norm": 0.6479959072854039, "learning_rate": 9.74296205630355e-06, "loss": 0.3622, "loss_nan_ranks": 0, "loss_rank_avg": 0.16445878148078918, "step": 200, "valid_targets_mean": 3273.6, "valid_targets_min": 815 }, { "epoch": 0.17566409597257926, "grad_norm": 0.5202221871171575, "learning_rate": 9.987760097919218e-06, "loss": 0.3173, "loss_nan_ranks": 0, "loss_rank_avg": 0.16284489631652832, "step": 205, "valid_targets_mean": 5055.8, "valid_targets_min": 2305 }, { "epoch": 0.17994858611825193, "grad_norm": 0.5524924025549904, "learning_rate": 1.0232558139534884e-05, "loss": 0.3382, "loss_nan_ranks": 0, "loss_rank_avg": 0.19672557711601257, "step": 210, "valid_targets_mean": 5106.8, "valid_targets_min": 997 }, { "epoch": 0.1842330762639246, "grad_norm": 1.0223498715512376, "learning_rate": 1.047735618115055e-05, "loss": 0.3263, "loss_nan_ranks": 0, "loss_rank_avg": 0.19318395853042603, "step": 215, "valid_targets_mean": 5064.0, "valid_targets_min": 2027 }, { "epoch": 0.18851756640959727, "grad_norm": 0.5211527369329275, "learning_rate": 1.0722154222766219e-05, "loss": 0.3221, "loss_nan_ranks": 0, "loss_rank_avg": 0.17607557773590088, "step": 220, "valid_targets_mean": 6074.5, "valid_targets_min": 2335 }, { "epoch": 0.1928020565552699, "grad_norm": 0.5123127191188075, "learning_rate": 1.0966952264381885e-05, "loss": 0.3233, "loss_nan_ranks": 0, "loss_rank_avg": 0.15591086447238922, "step": 225, "valid_targets_mean": 6394.2, "valid_targets_min": 1530 }, { "epoch": 0.19708654670094258, "grad_norm": 0.5191104747458265, "learning_rate": 1.1211750305997554e-05, "loss": 0.3338, "loss_nan_ranks": 0, "loss_rank_avg": 0.14223499596118927, "step": 230, "valid_targets_mean": 4574.8, "valid_targets_min": 1339 }, { "epoch": 0.20137103684661525, "grad_norm": 0.5699877811233731, "learning_rate": 1.1456548347613222e-05, "loss": 0.3153, "loss_nan_ranks": 0, "loss_rank_avg": 0.17597973346710205, "step": 235, "valid_targets_mean": 6795.1, "valid_targets_min": 4224 }, { "epoch": 0.20565552699228792, "grad_norm": 0.5970363797480456, "learning_rate": 1.1701346389228887e-05, "loss": 0.3228, "loss_nan_ranks": 0, "loss_rank_avg": 0.1517130434513092, "step": 240, "valid_targets_mean": 5152.9, "valid_targets_min": 2470 }, { "epoch": 0.2099400171379606, "grad_norm": 0.5127097301248218, "learning_rate": 1.1946144430844555e-05, "loss": 0.3194, "loss_nan_ranks": 0, "loss_rank_avg": 0.159349724650383, "step": 245, "valid_targets_mean": 5716.4, "valid_targets_min": 1947 }, { "epoch": 0.21422450728363324, "grad_norm": 0.584380958903832, "learning_rate": 1.2190942472460221e-05, "loss": 0.3276, "loss_nan_ranks": 0, "loss_rank_avg": 0.17096039652824402, "step": 250, "valid_targets_mean": 5353.8, "valid_targets_min": 2263 }, { "epoch": 0.2185089974293059, "grad_norm": 0.531304528969124, "learning_rate": 1.243574051407589e-05, "loss": 0.3189, "loss_nan_ranks": 0, "loss_rank_avg": 0.176926851272583, "step": 255, "valid_targets_mean": 5375.8, "valid_targets_min": 2384 }, { "epoch": 0.22279348757497858, "grad_norm": 0.5610210920466541, "learning_rate": 1.2680538555691554e-05, "loss": 0.3162, "loss_nan_ranks": 0, "loss_rank_avg": 0.15306371450424194, "step": 260, "valid_targets_mean": 4906.6, "valid_targets_min": 1320 }, { "epoch": 0.22707797772065125, "grad_norm": 0.6099494807045799, "learning_rate": 1.2925336597307222e-05, "loss": 0.3233, "loss_nan_ranks": 0, "loss_rank_avg": 0.17797164618968964, "step": 265, "valid_targets_mean": 6262.9, "valid_targets_min": 1200 }, { "epoch": 0.23136246786632392, "grad_norm": 0.5584816599275492, "learning_rate": 1.3170134638922889e-05, "loss": 0.317, "loss_nan_ranks": 0, "loss_rank_avg": 0.14984680712223053, "step": 270, "valid_targets_mean": 5216.5, "valid_targets_min": 3918 }, { "epoch": 0.23564695801199656, "grad_norm": 0.5581317615102905, "learning_rate": 1.3414932680538557e-05, "loss": 0.3113, "loss_nan_ranks": 0, "loss_rank_avg": 0.1488761305809021, "step": 275, "valid_targets_mean": 5854.2, "valid_targets_min": 3345 }, { "epoch": 0.23993144815766923, "grad_norm": 0.7063875640569396, "learning_rate": 1.3659730722154224e-05, "loss": 0.3183, "loss_nan_ranks": 0, "loss_rank_avg": 0.1853543519973755, "step": 280, "valid_targets_mean": 3949.1, "valid_targets_min": 1876 }, { "epoch": 0.2442159383033419, "grad_norm": 0.53488254992811, "learning_rate": 1.3904528763769892e-05, "loss": 0.321, "loss_nan_ranks": 0, "loss_rank_avg": 0.14736245572566986, "step": 285, "valid_targets_mean": 4980.2, "valid_targets_min": 1308 }, { "epoch": 0.24850042844901457, "grad_norm": 0.5414391694510241, "learning_rate": 1.4149326805385557e-05, "loss": 0.3221, "loss_nan_ranks": 0, "loss_rank_avg": 0.12899701297283173, "step": 290, "valid_targets_mean": 4972.6, "valid_targets_min": 1062 }, { "epoch": 0.2527849185946872, "grad_norm": 0.6054725196706271, "learning_rate": 1.4394124847001225e-05, "loss": 0.31, "loss_nan_ranks": 0, "loss_rank_avg": 0.13913224637508392, "step": 295, "valid_targets_mean": 4399.9, "valid_targets_min": 1640 }, { "epoch": 0.2570694087403599, "grad_norm": 0.5637355859677816, "learning_rate": 1.4638922888616893e-05, "loss": 0.3193, "loss_nan_ranks": 0, "loss_rank_avg": 0.1314675658941269, "step": 300, "valid_targets_mean": 4433.2, "valid_targets_min": 863 }, { "epoch": 0.26135389888603255, "grad_norm": 0.5867368931627099, "learning_rate": 1.488372093023256e-05, "loss": 0.3138, "loss_nan_ranks": 0, "loss_rank_avg": 0.16789467632770538, "step": 305, "valid_targets_mean": 4875.8, "valid_targets_min": 3050 }, { "epoch": 0.2656383890317052, "grad_norm": 0.8512860966478079, "learning_rate": 1.5128518971848228e-05, "loss": 0.3146, "loss_nan_ranks": 0, "loss_rank_avg": 0.17016926407814026, "step": 310, "valid_targets_mean": 5136.0, "valid_targets_min": 1296 }, { "epoch": 0.2699228791773779, "grad_norm": 0.5870192100135584, "learning_rate": 1.5373317013463894e-05, "loss": 0.2978, "loss_nan_ranks": 0, "loss_rank_avg": 0.17785808444023132, "step": 315, "valid_targets_mean": 4783.2, "valid_targets_min": 814 }, { "epoch": 0.27420736932305056, "grad_norm": 0.5658522055114601, "learning_rate": 1.561811505507956e-05, "loss": 0.2904, "loss_nan_ranks": 0, "loss_rank_avg": 0.134462371468544, "step": 320, "valid_targets_mean": 4842.8, "valid_targets_min": 1679 }, { "epoch": 0.27849185946872324, "grad_norm": 0.6039759670188529, "learning_rate": 1.5862913096695227e-05, "loss": 0.309, "loss_nan_ranks": 0, "loss_rank_avg": 0.1433200240135193, "step": 325, "valid_targets_mean": 4665.6, "valid_targets_min": 2454 }, { "epoch": 0.2827763496143959, "grad_norm": 0.6039885202347223, "learning_rate": 1.6107711138310894e-05, "loss": 0.2999, "loss_nan_ranks": 0, "loss_rank_avg": 0.13930335640907288, "step": 330, "valid_targets_mean": 3988.1, "valid_targets_min": 2263 }, { "epoch": 0.2870608397600686, "grad_norm": 0.5444104462871615, "learning_rate": 1.635250917992656e-05, "loss": 0.2902, "loss_nan_ranks": 0, "loss_rank_avg": 0.1417446732521057, "step": 335, "valid_targets_mean": 4539.2, "valid_targets_min": 2819 }, { "epoch": 0.2913453299057412, "grad_norm": 0.50219258851867, "learning_rate": 1.659730722154223e-05, "loss": 0.2904, "loss_nan_ranks": 0, "loss_rank_avg": 0.12210437655448914, "step": 340, "valid_targets_mean": 5315.8, "valid_targets_min": 2531 }, { "epoch": 0.29562982005141386, "grad_norm": 0.6297237494404057, "learning_rate": 1.6842105263157896e-05, "loss": 0.3063, "loss_nan_ranks": 0, "loss_rank_avg": 0.15295211970806122, "step": 345, "valid_targets_mean": 3552.4, "valid_targets_min": 1152 }, { "epoch": 0.29991431019708653, "grad_norm": 0.5297704310792776, "learning_rate": 1.7086903304773563e-05, "loss": 0.2893, "loss_nan_ranks": 0, "loss_rank_avg": 0.15931358933448792, "step": 350, "valid_targets_mean": 5920.4, "valid_targets_min": 2610 }, { "epoch": 0.3041988003427592, "grad_norm": 0.5703340645186171, "learning_rate": 1.7331701346389233e-05, "loss": 0.3127, "loss_nan_ranks": 0, "loss_rank_avg": 0.15025386214256287, "step": 355, "valid_targets_mean": 5074.5, "valid_targets_min": 2473 }, { "epoch": 0.30848329048843187, "grad_norm": 0.4830147558403847, "learning_rate": 1.7576499388004896e-05, "loss": 0.2917, "loss_nan_ranks": 0, "loss_rank_avg": 0.1271696537733078, "step": 360, "valid_targets_mean": 5975.8, "valid_targets_min": 2878 }, { "epoch": 0.31276778063410454, "grad_norm": 0.6325322902133472, "learning_rate": 1.7821297429620566e-05, "loss": 0.3037, "loss_nan_ranks": 0, "loss_rank_avg": 0.13799910247325897, "step": 365, "valid_targets_mean": 6035.0, "valid_targets_min": 2353 }, { "epoch": 0.3170522707797772, "grad_norm": 0.5287748967291697, "learning_rate": 1.8066095471236232e-05, "loss": 0.3053, "loss_nan_ranks": 0, "loss_rank_avg": 0.14968207478523254, "step": 370, "valid_targets_mean": 5034.8, "valid_targets_min": 1135 }, { "epoch": 0.3213367609254499, "grad_norm": 0.669848870896634, "learning_rate": 1.83108935128519e-05, "loss": 0.3068, "loss_nan_ranks": 0, "loss_rank_avg": 0.12943169474601746, "step": 375, "valid_targets_mean": 3075.2, "valid_targets_min": 1410 }, { "epoch": 0.32562125107112255, "grad_norm": 0.5893188910141677, "learning_rate": 1.8555691554467565e-05, "loss": 0.2976, "loss_nan_ranks": 0, "loss_rank_avg": 0.1718309074640274, "step": 380, "valid_targets_mean": 4813.2, "valid_targets_min": 2649 }, { "epoch": 0.3299057412167952, "grad_norm": 0.6019329357724723, "learning_rate": 1.8800489596083232e-05, "loss": 0.2917, "loss_nan_ranks": 0, "loss_rank_avg": 0.15909942984580994, "step": 385, "valid_targets_mean": 4439.0, "valid_targets_min": 1582 }, { "epoch": 0.3341902313624679, "grad_norm": 0.6064248819899891, "learning_rate": 1.9045287637698898e-05, "loss": 0.295, "loss_nan_ranks": 0, "loss_rank_avg": 0.12156758457422256, "step": 390, "valid_targets_mean": 3861.8, "valid_targets_min": 1737 }, { "epoch": 0.3384747215081405, "grad_norm": 0.5842534367398564, "learning_rate": 1.9290085679314568e-05, "loss": 0.2994, "loss_nan_ranks": 0, "loss_rank_avg": 0.160810187458992, "step": 395, "valid_targets_mean": 4659.6, "valid_targets_min": 1685 }, { "epoch": 0.3427592116538132, "grad_norm": 0.5268467691843103, "learning_rate": 1.9534883720930235e-05, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.15826356410980225, "step": 400, "valid_targets_mean": 5544.1, "valid_targets_min": 1661 }, { "epoch": 0.34704370179948585, "grad_norm": 0.6958394661491231, "learning_rate": 1.97796817625459e-05, "loss": 0.2911, "loss_nan_ranks": 0, "loss_rank_avg": 0.16895712912082672, "step": 405, "valid_targets_mean": 5782.8, "valid_targets_min": 2263 }, { "epoch": 0.3513281919451585, "grad_norm": 0.5948462583056694, "learning_rate": 2.002447980416157e-05, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.16228261590003967, "step": 410, "valid_targets_mean": 5028.5, "valid_targets_min": 3210 }, { "epoch": 0.3556126820908312, "grad_norm": 0.5420726443350751, "learning_rate": 2.0269277845777234e-05, "loss": 0.2815, "loss_nan_ranks": 0, "loss_rank_avg": 0.13688191771507263, "step": 415, "valid_targets_mean": 5821.4, "valid_targets_min": 1708 }, { "epoch": 0.35989717223650386, "grad_norm": 0.6388615140705679, "learning_rate": 2.05140758873929e-05, "loss": 0.306, "loss_nan_ranks": 0, "loss_rank_avg": 0.14519023895263672, "step": 420, "valid_targets_mean": 4266.8, "valid_targets_min": 1438 }, { "epoch": 0.36418166238217653, "grad_norm": 0.5663922132128151, "learning_rate": 2.075887392900857e-05, "loss": 0.2924, "loss_nan_ranks": 0, "loss_rank_avg": 0.1524307131767273, "step": 425, "valid_targets_mean": 4807.2, "valid_targets_min": 1665 }, { "epoch": 0.3684661525278492, "grad_norm": 0.5688733222055533, "learning_rate": 2.1003671970624237e-05, "loss": 0.2998, "loss_nan_ranks": 0, "loss_rank_avg": 0.11472992599010468, "step": 430, "valid_targets_mean": 3932.0, "valid_targets_min": 618 }, { "epoch": 0.37275064267352187, "grad_norm": 0.6223142453975377, "learning_rate": 2.1248470012239903e-05, "loss": 0.2998, "loss_nan_ranks": 0, "loss_rank_avg": 0.15172141790390015, "step": 435, "valid_targets_mean": 3571.1, "valid_targets_min": 1021 }, { "epoch": 0.37703513281919454, "grad_norm": 0.5609083997959252, "learning_rate": 2.149326805385557e-05, "loss": 0.2785, "loss_nan_ranks": 0, "loss_rank_avg": 0.14583829045295715, "step": 440, "valid_targets_mean": 5311.2, "valid_targets_min": 1171 }, { "epoch": 0.38131962296486716, "grad_norm": 0.5460504697544348, "learning_rate": 2.173806609547124e-05, "loss": 0.2705, "loss_nan_ranks": 0, "loss_rank_avg": 0.13169243931770325, "step": 445, "valid_targets_mean": 5064.8, "valid_targets_min": 2680 }, { "epoch": 0.3856041131105398, "grad_norm": 0.5770188612901637, "learning_rate": 2.1982864137086906e-05, "loss": 0.2788, "loss_nan_ranks": 0, "loss_rank_avg": 0.12129063904285431, "step": 450, "valid_targets_mean": 5601.2, "valid_targets_min": 1197 }, { "epoch": 0.3898886032562125, "grad_norm": 0.5993535554284934, "learning_rate": 2.2227662178702573e-05, "loss": 0.2864, "loss_nan_ranks": 0, "loss_rank_avg": 0.15587423741817474, "step": 455, "valid_targets_mean": 6190.5, "valid_targets_min": 2977 }, { "epoch": 0.39417309340188517, "grad_norm": 0.5386585493381317, "learning_rate": 2.2472460220318236e-05, "loss": 0.2968, "loss_nan_ranks": 0, "loss_rank_avg": 0.14170946180820465, "step": 460, "valid_targets_mean": 4982.9, "valid_targets_min": 2205 }, { "epoch": 0.39845758354755784, "grad_norm": 0.6195415175294577, "learning_rate": 2.271725826193391e-05, "loss": 0.3146, "loss_nan_ranks": 0, "loss_rank_avg": 0.13214179873466492, "step": 465, "valid_targets_mean": 4013.9, "valid_targets_min": 1611 }, { "epoch": 0.4027420736932305, "grad_norm": 0.5519123387328592, "learning_rate": 2.2962056303549572e-05, "loss": 0.2896, "loss_nan_ranks": 0, "loss_rank_avg": 0.13508766889572144, "step": 470, "valid_targets_mean": 5249.9, "valid_targets_min": 3133 }, { "epoch": 0.4070265638389032, "grad_norm": 0.5009869019667028, "learning_rate": 2.320685434516524e-05, "loss": 0.277, "loss_nan_ranks": 0, "loss_rank_avg": 0.14315488934516907, "step": 475, "valid_targets_mean": 5515.5, "valid_targets_min": 3758 }, { "epoch": 0.41131105398457585, "grad_norm": 0.5626625359580815, "learning_rate": 2.345165238678091e-05, "loss": 0.2841, "loss_nan_ranks": 0, "loss_rank_avg": 0.16055189073085785, "step": 480, "valid_targets_mean": 5776.0, "valid_targets_min": 2353 }, { "epoch": 0.4155955441302485, "grad_norm": 0.5449390116780272, "learning_rate": 2.3696450428396575e-05, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.1312532126903534, "step": 485, "valid_targets_mean": 5009.4, "valid_targets_min": 637 }, { "epoch": 0.4198800342759212, "grad_norm": 0.5779586892568972, "learning_rate": 2.394124847001224e-05, "loss": 0.2904, "loss_nan_ranks": 0, "loss_rank_avg": 0.14948180317878723, "step": 490, "valid_targets_mean": 5899.0, "valid_targets_min": 2260 }, { "epoch": 0.4241645244215938, "grad_norm": 0.6200627622851805, "learning_rate": 2.4186046511627908e-05, "loss": 0.2763, "loss_nan_ranks": 0, "loss_rank_avg": 0.13663563132286072, "step": 495, "valid_targets_mean": 4235.1, "valid_targets_min": 1282 }, { "epoch": 0.4284490145672665, "grad_norm": 0.5205400982232026, "learning_rate": 2.4430844553243578e-05, "loss": 0.2705, "loss_nan_ranks": 0, "loss_rank_avg": 0.11656229943037033, "step": 500, "valid_targets_mean": 5687.9, "valid_targets_min": 2297 }, { "epoch": 0.43273350471293914, "grad_norm": 0.47871740853032907, "learning_rate": 2.4675642594859244e-05, "loss": 0.276, "loss_nan_ranks": 0, "loss_rank_avg": 0.11609447002410889, "step": 505, "valid_targets_mean": 5404.6, "valid_targets_min": 3686 }, { "epoch": 0.4370179948586118, "grad_norm": 0.5492898934140984, "learning_rate": 2.492044063647491e-05, "loss": 0.276, "loss_nan_ranks": 0, "loss_rank_avg": 0.14045745134353638, "step": 510, "valid_targets_mean": 5541.1, "valid_targets_min": 3317 }, { "epoch": 0.4413024850042845, "grad_norm": 0.5071268634243311, "learning_rate": 2.5165238678090574e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.128058522939682, "step": 515, "valid_targets_mean": 5796.8, "valid_targets_min": 2077 }, { "epoch": 0.44558697514995715, "grad_norm": 0.5655382730838427, "learning_rate": 2.5410036719706247e-05, "loss": 0.2688, "loss_nan_ranks": 0, "loss_rank_avg": 0.11492526531219482, "step": 520, "valid_targets_mean": 4854.9, "valid_targets_min": 1338 }, { "epoch": 0.4498714652956298, "grad_norm": 0.5424893346687838, "learning_rate": 2.565483476132191e-05, "loss": 0.2814, "loss_nan_ranks": 0, "loss_rank_avg": 0.12241284549236298, "step": 525, "valid_targets_mean": 4384.1, "valid_targets_min": 1704 }, { "epoch": 0.4541559554413025, "grad_norm": 0.5448333250427129, "learning_rate": 2.5899632802937577e-05, "loss": 0.2875, "loss_nan_ranks": 0, "loss_rank_avg": 0.13487297296524048, "step": 530, "valid_targets_mean": 5340.8, "valid_targets_min": 2939 }, { "epoch": 0.45844044558697516, "grad_norm": 0.6187884073389983, "learning_rate": 2.6144430844553243e-05, "loss": 0.2807, "loss_nan_ranks": 0, "loss_rank_avg": 0.13935431838035583, "step": 535, "valid_targets_mean": 4248.1, "valid_targets_min": 1438 }, { "epoch": 0.46272493573264784, "grad_norm": 0.6001804492599332, "learning_rate": 2.6389228886168913e-05, "loss": 0.2737, "loss_nan_ranks": 0, "loss_rank_avg": 0.1647961139678955, "step": 540, "valid_targets_mean": 5800.1, "valid_targets_min": 4068 }, { "epoch": 0.4670094258783205, "grad_norm": 0.5600479101604777, "learning_rate": 2.663402692778458e-05, "loss": 0.269, "loss_nan_ranks": 0, "loss_rank_avg": 0.14143353700637817, "step": 545, "valid_targets_mean": 5761.4, "valid_targets_min": 2433 }, { "epoch": 0.4712939160239931, "grad_norm": 0.5673387034583495, "learning_rate": 2.6878824969400246e-05, "loss": 0.2839, "loss_nan_ranks": 0, "loss_rank_avg": 0.14500755071640015, "step": 550, "valid_targets_mean": 4903.9, "valid_targets_min": 1460 }, { "epoch": 0.4755784061696658, "grad_norm": 0.5691470882956529, "learning_rate": 2.7123623011015916e-05, "loss": 0.2685, "loss_nan_ranks": 0, "loss_rank_avg": 0.1349785029888153, "step": 555, "valid_targets_mean": 4998.4, "valid_targets_min": 2318 }, { "epoch": 0.47986289631533846, "grad_norm": 0.5709082137504153, "learning_rate": 2.7368421052631583e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.14183221757411957, "step": 560, "valid_targets_mean": 5866.0, "valid_targets_min": 3081 }, { "epoch": 0.48414738646101113, "grad_norm": 0.5442903898637672, "learning_rate": 2.761321909424725e-05, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.13423144817352295, "step": 565, "valid_targets_mean": 5355.0, "valid_targets_min": 2979 }, { "epoch": 0.4884318766066838, "grad_norm": 0.5145090110407444, "learning_rate": 2.7858017135862912e-05, "loss": 0.2942, "loss_nan_ranks": 0, "loss_rank_avg": 0.13521131873130798, "step": 570, "valid_targets_mean": 5537.5, "valid_targets_min": 1981 }, { "epoch": 0.49271636675235647, "grad_norm": 0.5126476525977094, "learning_rate": 2.8102815177478585e-05, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.2233107089996338, "step": 575, "valid_targets_mean": 5748.8, "valid_targets_min": 2260 }, { "epoch": 0.49700085689802914, "grad_norm": 0.49860856959951844, "learning_rate": 2.834761321909425e-05, "loss": 0.2762, "loss_nan_ranks": 0, "loss_rank_avg": 0.13818103075027466, "step": 580, "valid_targets_mean": 5683.2, "valid_targets_min": 3056 }, { "epoch": 0.5012853470437018, "grad_norm": 0.6185441022844439, "learning_rate": 2.8592411260709915e-05, "loss": 0.2882, "loss_nan_ranks": 0, "loss_rank_avg": 0.13868600130081177, "step": 585, "valid_targets_mean": 4239.5, "valid_targets_min": 1407 }, { "epoch": 0.5055698371893744, "grad_norm": 0.4868317952453862, "learning_rate": 2.883720930232558e-05, "loss": 0.266, "loss_nan_ranks": 0, "loss_rank_avg": 0.12314537912607193, "step": 590, "valid_targets_mean": 7541.9, "valid_targets_min": 4887 }, { "epoch": 0.5098543273350471, "grad_norm": 0.5956933077864743, "learning_rate": 2.908200734394125e-05, "loss": 0.2736, "loss_nan_ranks": 0, "loss_rank_avg": 0.16916868090629578, "step": 595, "valid_targets_mean": 5266.6, "valid_targets_min": 2106 }, { "epoch": 0.5141388174807198, "grad_norm": 0.5145182472434158, "learning_rate": 2.9326805385556918e-05, "loss": 0.2771, "loss_nan_ranks": 0, "loss_rank_avg": 0.12932124733924866, "step": 600, "valid_targets_mean": 5444.1, "valid_targets_min": 2584 }, { "epoch": 0.5184233076263924, "grad_norm": 0.5148978628448854, "learning_rate": 2.9571603427172584e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.10980220139026642, "step": 605, "valid_targets_mean": 4968.5, "valid_targets_min": 1153 }, { "epoch": 0.5227077977720651, "grad_norm": 0.6546541289847614, "learning_rate": 2.9816401468788254e-05, "loss": 0.2837, "loss_nan_ranks": 0, "loss_rank_avg": 0.17208120226860046, "step": 610, "valid_targets_mean": 4161.1, "valid_targets_min": 1401 }, { "epoch": 0.5269922879177378, "grad_norm": 0.5713763418705968, "learning_rate": 3.006119951040392e-05, "loss": 0.2867, "loss_nan_ranks": 0, "loss_rank_avg": 0.14918869733810425, "step": 615, "valid_targets_mean": 4642.0, "valid_targets_min": 1988 }, { "epoch": 0.5312767780634104, "grad_norm": 0.582802473484628, "learning_rate": 3.0305997552019587e-05, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.13957634568214417, "step": 620, "valid_targets_mean": 4580.8, "valid_targets_min": 671 }, { "epoch": 0.5355612682090831, "grad_norm": 0.5074017899375523, "learning_rate": 3.0550795593635254e-05, "loss": 0.2659, "loss_nan_ranks": 0, "loss_rank_avg": 0.11979982256889343, "step": 625, "valid_targets_mean": 4226.1, "valid_targets_min": 3320 }, { "epoch": 0.5398457583547558, "grad_norm": 0.7080288701071616, "learning_rate": 3.079559363525092e-05, "loss": 0.2948, "loss_nan_ranks": 0, "loss_rank_avg": 0.12488646060228348, "step": 630, "valid_targets_mean": 3806.6, "valid_targets_min": 1293 }, { "epoch": 0.5441302485004285, "grad_norm": 0.5523074527657701, "learning_rate": 3.104039167686659e-05, "loss": 0.29, "loss_nan_ranks": 0, "loss_rank_avg": 0.14442437887191772, "step": 635, "valid_targets_mean": 6145.4, "valid_targets_min": 4748 }, { "epoch": 0.5484147386461011, "grad_norm": 0.5839924266213236, "learning_rate": 3.128518971848225e-05, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.16150975227355957, "step": 640, "valid_targets_mean": 5677.8, "valid_targets_min": 2736 }, { "epoch": 0.5526992287917738, "grad_norm": 0.5513476463866779, "learning_rate": 3.152998776009792e-05, "loss": 0.2757, "loss_nan_ranks": 0, "loss_rank_avg": 0.13722610473632812, "step": 645, "valid_targets_mean": 4844.5, "valid_targets_min": 873 }, { "epoch": 0.5569837189374465, "grad_norm": 0.5616002902466735, "learning_rate": 3.177478580171359e-05, "loss": 0.2612, "loss_nan_ranks": 0, "loss_rank_avg": 0.1205633282661438, "step": 650, "valid_targets_mean": 4022.0, "valid_targets_min": 1058 }, { "epoch": 0.5612682090831191, "grad_norm": 0.5025577976134684, "learning_rate": 3.201958384332925e-05, "loss": 0.2663, "loss_nan_ranks": 0, "loss_rank_avg": 0.1423630565404892, "step": 655, "valid_targets_mean": 6668.2, "valid_targets_min": 3320 }, { "epoch": 0.5655526992287918, "grad_norm": 0.8192137076290354, "learning_rate": 3.226438188494492e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.16772106289863586, "step": 660, "valid_targets_mean": 4754.0, "valid_targets_min": 2355 }, { "epoch": 0.5698371893744645, "grad_norm": 0.5727839053126536, "learning_rate": 3.250917992656059e-05, "loss": 0.2692, "loss_nan_ranks": 0, "loss_rank_avg": 0.1537611484527588, "step": 665, "valid_targets_mean": 5351.6, "valid_targets_min": 3234 }, { "epoch": 0.5741216795201372, "grad_norm": 0.5444238697417997, "learning_rate": 3.275397796817626e-05, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.14869078993797302, "step": 670, "valid_targets_mean": 5715.8, "valid_targets_min": 3830 }, { "epoch": 0.5784061696658098, "grad_norm": 0.5836983468782506, "learning_rate": 3.2998776009791925e-05, "loss": 0.2831, "loss_nan_ranks": 0, "loss_rank_avg": 0.14694061875343323, "step": 675, "valid_targets_mean": 4126.9, "valid_targets_min": 2461 }, { "epoch": 0.5826906598114824, "grad_norm": 0.6568378900260874, "learning_rate": 3.324357405140759e-05, "loss": 0.2906, "loss_nan_ranks": 0, "loss_rank_avg": 0.15956830978393555, "step": 680, "valid_targets_mean": 4040.9, "valid_targets_min": 1980 }, { "epoch": 0.586975149957155, "grad_norm": 0.5145475286597274, "learning_rate": 3.348837209302326e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.12406280636787415, "step": 685, "valid_targets_mean": 5950.8, "valid_targets_min": 1383 }, { "epoch": 0.5912596401028277, "grad_norm": 0.5558673446263661, "learning_rate": 3.3733170134638925e-05, "loss": 0.2702, "loss_nan_ranks": 0, "loss_rank_avg": 0.12211956083774567, "step": 690, "valid_targets_mean": 6111.4, "valid_targets_min": 3072 }, { "epoch": 0.5955441302485004, "grad_norm": 0.4747838546803119, "learning_rate": 3.397796817625459e-05, "loss": 0.2591, "loss_nan_ranks": 0, "loss_rank_avg": 0.12097050994634628, "step": 695, "valid_targets_mean": 7185.4, "valid_targets_min": 1457 }, { "epoch": 0.5998286203941731, "grad_norm": 0.5194524552843034, "learning_rate": 3.422276621787026e-05, "loss": 0.2649, "loss_nan_ranks": 0, "loss_rank_avg": 0.12255051732063293, "step": 700, "valid_targets_mean": 5736.5, "valid_targets_min": 2366 }, { "epoch": 0.6041131105398457, "grad_norm": 0.5106674807425143, "learning_rate": 3.446756425948593e-05, "loss": 0.2511, "loss_nan_ranks": 0, "loss_rank_avg": 0.11906369030475616, "step": 705, "valid_targets_mean": 5204.1, "valid_targets_min": 3741 }, { "epoch": 0.6083976006855184, "grad_norm": 0.6010561442816965, "learning_rate": 3.471236230110159e-05, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.1466081142425537, "step": 710, "valid_targets_mean": 3954.8, "valid_targets_min": 1020 }, { "epoch": 0.6126820908311911, "grad_norm": 0.5256518508777503, "learning_rate": 3.495716034271726e-05, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.12180833518505096, "step": 715, "valid_targets_mean": 5649.9, "valid_targets_min": 1919 }, { "epoch": 0.6169665809768637, "grad_norm": 0.5968635555634715, "learning_rate": 3.5201958384332924e-05, "loss": 0.2769, "loss_nan_ranks": 0, "loss_rank_avg": 0.16054174304008484, "step": 720, "valid_targets_mean": 5424.4, "valid_targets_min": 2052 }, { "epoch": 0.6212510711225364, "grad_norm": 0.5087542046238016, "learning_rate": 3.54467564259486e-05, "loss": 0.2577, "loss_nan_ranks": 0, "loss_rank_avg": 0.13530471920967102, "step": 725, "valid_targets_mean": 5822.2, "valid_targets_min": 3292 }, { "epoch": 0.6255355612682091, "grad_norm": 0.5308493101137274, "learning_rate": 3.5691554467564264e-05, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.12818732857704163, "step": 730, "valid_targets_mean": 4503.0, "valid_targets_min": 1724 }, { "epoch": 0.6298200514138818, "grad_norm": 0.531906996873097, "learning_rate": 3.593635250917993e-05, "loss": 0.2751, "loss_nan_ranks": 0, "loss_rank_avg": 0.1301267445087433, "step": 735, "valid_targets_mean": 4668.6, "valid_targets_min": 2431 }, { "epoch": 0.6341045415595544, "grad_norm": 0.5963099527547568, "learning_rate": 3.6181150550795597e-05, "loss": 0.2888, "loss_nan_ranks": 0, "loss_rank_avg": 0.16435176134109497, "step": 740, "valid_targets_mean": 5506.2, "valid_targets_min": 2628 }, { "epoch": 0.6383890317052271, "grad_norm": 0.6155164579618286, "learning_rate": 3.642594859241126e-05, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.13344869017601013, "step": 745, "valid_targets_mean": 5700.5, "valid_targets_min": 3180 }, { "epoch": 0.6426735218508998, "grad_norm": 0.501126635501298, "learning_rate": 3.667074663402693e-05, "loss": 0.2715, "loss_nan_ranks": 0, "loss_rank_avg": 0.12969595193862915, "step": 750, "valid_targets_mean": 5380.1, "valid_targets_min": 2965 }, { "epoch": 0.6469580119965724, "grad_norm": 0.6452184273012488, "learning_rate": 3.6915544675642596e-05, "loss": 0.273, "loss_nan_ranks": 0, "loss_rank_avg": 0.1391134411096573, "step": 755, "valid_targets_mean": 4782.4, "valid_targets_min": 2001 }, { "epoch": 0.6512425021422451, "grad_norm": 0.5469747322011657, "learning_rate": 3.716034271725827e-05, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.12635910511016846, "step": 760, "valid_targets_mean": 4953.2, "valid_targets_min": 2284 }, { "epoch": 0.6555269922879178, "grad_norm": 0.9231721523981166, "learning_rate": 3.740514075887393e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.1526474952697754, "step": 765, "valid_targets_mean": 3834.5, "valid_targets_min": 1720 }, { "epoch": 0.6598114824335904, "grad_norm": 0.5371949962004401, "learning_rate": 3.7649938800489595e-05, "loss": 0.2708, "loss_nan_ranks": 0, "loss_rank_avg": 0.123946413397789, "step": 770, "valid_targets_mean": 3959.9, "valid_targets_min": 1194 }, { "epoch": 0.6640959725792631, "grad_norm": 0.515907944612913, "learning_rate": 3.789473684210526e-05, "loss": 0.2791, "loss_nan_ranks": 0, "loss_rank_avg": 0.11019599437713623, "step": 775, "valid_targets_mean": 5306.2, "valid_targets_min": 2080 }, { "epoch": 0.6683804627249358, "grad_norm": 0.535884454819786, "learning_rate": 3.8139534883720935e-05, "loss": 0.2665, "loss_nan_ranks": 0, "loss_rank_avg": 0.11634519696235657, "step": 780, "valid_targets_mean": 4438.4, "valid_targets_min": 2185 }, { "epoch": 0.6726649528706083, "grad_norm": 0.5779089412080396, "learning_rate": 3.83843329253366e-05, "loss": 0.2785, "loss_nan_ranks": 0, "loss_rank_avg": 0.12202630937099457, "step": 785, "valid_targets_mean": 4871.4, "valid_targets_min": 981 }, { "epoch": 0.676949443016281, "grad_norm": 0.7054778397195679, "learning_rate": 3.862913096695227e-05, "loss": 0.2747, "loss_nan_ranks": 0, "loss_rank_avg": 0.19049608707427979, "step": 790, "valid_targets_mean": 4367.0, "valid_targets_min": 1829 }, { "epoch": 0.6812339331619537, "grad_norm": 0.5847261365100348, "learning_rate": 3.8873929008567935e-05, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.13841959834098816, "step": 795, "valid_targets_mean": 4756.6, "valid_targets_min": 2879 }, { "epoch": 0.6855184233076264, "grad_norm": 0.48740615813189136, "learning_rate": 3.91187270501836e-05, "loss": 0.2772, "loss_nan_ranks": 0, "loss_rank_avg": 0.12658631801605225, "step": 800, "valid_targets_mean": 5949.4, "valid_targets_min": 2546 }, { "epoch": 0.689802913453299, "grad_norm": 0.520041364867478, "learning_rate": 3.936352509179927e-05, "loss": 0.2581, "loss_nan_ranks": 0, "loss_rank_avg": 0.1271926909685135, "step": 805, "valid_targets_mean": 4749.2, "valid_targets_min": 2381 }, { "epoch": 0.6940874035989717, "grad_norm": 0.5101189199156749, "learning_rate": 3.9608323133414934e-05, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.11503781378269196, "step": 810, "valid_targets_mean": 4865.8, "valid_targets_min": 1847 }, { "epoch": 0.6983718937446444, "grad_norm": 0.5265392292861037, "learning_rate": 3.985312117503061e-05, "loss": 0.2639, "loss_nan_ranks": 0, "loss_rank_avg": 0.12135123461484909, "step": 815, "valid_targets_mean": 6132.9, "valid_targets_min": 4072 }, { "epoch": 0.702656383890317, "grad_norm": 0.47800731568934585, "learning_rate": 3.999999269620268e-05, "loss": 0.2782, "loss_nan_ranks": 0, "loss_rank_avg": 0.12147536873817444, "step": 820, "valid_targets_mean": 6568.1, "valid_targets_min": 4664 }, { "epoch": 0.7069408740359897, "grad_norm": 0.537235188878352, "learning_rate": 3.9999910528544e-05, "loss": 0.2677, "loss_nan_ranks": 0, "loss_rank_avg": 0.104698546230793, "step": 825, "valid_targets_mean": 5815.1, "valid_targets_min": 4353 }, { "epoch": 0.7112253641816624, "grad_norm": 0.5159489954530644, "learning_rate": 3.999973706385632e-05, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.13141869008541107, "step": 830, "valid_targets_mean": 5879.0, "valid_targets_min": 1423 }, { "epoch": 0.715509854327335, "grad_norm": 0.5585389197621717, "learning_rate": 3.999947230293148e-05, "loss": 0.2781, "loss_nan_ranks": 0, "loss_rank_avg": 0.14570122957229614, "step": 835, "valid_targets_mean": 5374.4, "valid_targets_min": 3055 }, { "epoch": 0.7197943444730077, "grad_norm": 0.48092488487972956, "learning_rate": 3.999911624697808e-05, "loss": 0.269, "loss_nan_ranks": 0, "loss_rank_avg": 0.12411829084157944, "step": 840, "valid_targets_mean": 5068.4, "valid_targets_min": 2888 }, { "epoch": 0.7240788346186804, "grad_norm": 0.5805619507516684, "learning_rate": 3.9998668897621475e-05, "loss": 0.2647, "loss_nan_ranks": 0, "loss_rank_avg": 0.12677715718746185, "step": 845, "valid_targets_mean": 4666.0, "valid_targets_min": 1524 }, { "epoch": 0.7283633247643531, "grad_norm": 0.46425962080468136, "learning_rate": 3.999813025690375e-05, "loss": 0.2783, "loss_nan_ranks": 0, "loss_rank_avg": 0.14648611843585968, "step": 850, "valid_targets_mean": 6841.4, "valid_targets_min": 2339 }, { "epoch": 0.7326478149100257, "grad_norm": 0.6069969870776635, "learning_rate": 3.999750032728374e-05, "loss": 0.2666, "loss_nan_ranks": 0, "loss_rank_avg": 0.12701371312141418, "step": 855, "valid_targets_mean": 4912.1, "valid_targets_min": 1219 }, { "epoch": 0.7369323050556984, "grad_norm": 0.6481210450101693, "learning_rate": 3.999677911163699e-05, "loss": 0.2718, "loss_nan_ranks": 0, "loss_rank_avg": 0.17122164368629456, "step": 860, "valid_targets_mean": 6041.9, "valid_targets_min": 3392 }, { "epoch": 0.7412167952013711, "grad_norm": 0.527730875932154, "learning_rate": 3.9995966613255745e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.13581043481826782, "step": 865, "valid_targets_mean": 5484.5, "valid_targets_min": 3171 }, { "epoch": 0.7455012853470437, "grad_norm": 0.5952293340519983, "learning_rate": 3.999506283584897e-05, "loss": 0.2703, "loss_nan_ranks": 0, "loss_rank_avg": 0.152851864695549, "step": 870, "valid_targets_mean": 5642.9, "valid_targets_min": 3182 }, { "epoch": 0.7497857754927164, "grad_norm": 0.5850366617796318, "learning_rate": 3.999406778354229e-05, "loss": 0.2557, "loss_nan_ranks": 0, "loss_rank_avg": 0.15019948780536652, "step": 875, "valid_targets_mean": 6524.1, "valid_targets_min": 2770 }, { "epoch": 0.7540702656383891, "grad_norm": 0.575250820294863, "learning_rate": 3.999298146087799e-05, "loss": 0.2646, "loss_nan_ranks": 0, "loss_rank_avg": 0.15052559971809387, "step": 880, "valid_targets_mean": 4841.0, "valid_targets_min": 2024 }, { "epoch": 0.7583547557840618, "grad_norm": 0.5493149132399983, "learning_rate": 3.9991803872814984e-05, "loss": 0.2543, "loss_nan_ranks": 0, "loss_rank_avg": 0.13368487358093262, "step": 885, "valid_targets_mean": 5288.2, "valid_targets_min": 1295 }, { "epoch": 0.7626392459297343, "grad_norm": 0.6160371683158595, "learning_rate": 3.9990535024728834e-05, "loss": 0.2663, "loss_nan_ranks": 0, "loss_rank_avg": 0.12840642035007477, "step": 890, "valid_targets_mean": 4293.9, "valid_targets_min": 2469 }, { "epoch": 0.766923736075407, "grad_norm": 0.5101580762550667, "learning_rate": 3.9989174922411645e-05, "loss": 0.246, "loss_nan_ranks": 0, "loss_rank_avg": 0.10666569322347641, "step": 895, "valid_targets_mean": 5572.5, "valid_targets_min": 2629 }, { "epoch": 0.7712082262210797, "grad_norm": 0.5267886267732871, "learning_rate": 3.998772357207212e-05, "loss": 0.2607, "loss_nan_ranks": 0, "loss_rank_avg": 0.15602833032608032, "step": 900, "valid_targets_mean": 5127.2, "valid_targets_min": 855 }, { "epoch": 0.7754927163667523, "grad_norm": 0.6179003743095123, "learning_rate": 3.9986180980335495e-05, "loss": 0.2725, "loss_nan_ranks": 0, "loss_rank_avg": 0.11543315649032593, "step": 905, "valid_targets_mean": 4137.4, "valid_targets_min": 2362 }, { "epoch": 0.779777206512425, "grad_norm": 0.7245223925500395, "learning_rate": 3.998454715424349e-05, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.14181703329086304, "step": 910, "valid_targets_mean": 4639.0, "valid_targets_min": 2314 }, { "epoch": 0.7840616966580977, "grad_norm": 0.566536142916355, "learning_rate": 3.9982822101254325e-05, "loss": 0.2647, "loss_nan_ranks": 0, "loss_rank_avg": 0.14244404435157776, "step": 915, "valid_targets_mean": 5085.1, "valid_targets_min": 852 }, { "epoch": 0.7883461868037703, "grad_norm": 0.5345840659362985, "learning_rate": 3.998100582924263e-05, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.11293502151966095, "step": 920, "valid_targets_mean": 4794.4, "valid_targets_min": 2450 }, { "epoch": 0.792630676949443, "grad_norm": 0.5659991348613919, "learning_rate": 3.997909834649947e-05, "loss": 0.2664, "loss_nan_ranks": 0, "loss_rank_avg": 0.12308050692081451, "step": 925, "valid_targets_mean": 4838.2, "valid_targets_min": 2091 }, { "epoch": 0.7969151670951157, "grad_norm": 0.6133976264224211, "learning_rate": 3.997709966173224e-05, "loss": 0.262, "loss_nan_ranks": 0, "loss_rank_avg": 0.13634806871414185, "step": 930, "valid_targets_mean": 5017.0, "valid_targets_min": 1673 }, { "epoch": 0.8011996572407883, "grad_norm": 0.5073324638405171, "learning_rate": 3.99750097840647e-05, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.12453116476535797, "step": 935, "valid_targets_mean": 4123.8, "valid_targets_min": 2410 }, { "epoch": 0.805484147386461, "grad_norm": 0.629776260395206, "learning_rate": 3.9972828723036866e-05, "loss": 0.2635, "loss_nan_ranks": 0, "loss_rank_avg": 0.17246073484420776, "step": 940, "valid_targets_mean": 5477.5, "valid_targets_min": 2430 }, { "epoch": 0.8097686375321337, "grad_norm": 0.536197964984172, "learning_rate": 3.9970556488605005e-05, "loss": 0.2623, "loss_nan_ranks": 0, "loss_rank_avg": 0.1453799456357956, "step": 945, "valid_targets_mean": 5394.2, "valid_targets_min": 2969 }, { "epoch": 0.8140531276778064, "grad_norm": 0.519512629373522, "learning_rate": 3.996819309114157e-05, "loss": 0.2636, "loss_nan_ranks": 0, "loss_rank_avg": 0.13137950003147125, "step": 950, "valid_targets_mean": 5013.2, "valid_targets_min": 208 }, { "epoch": 0.818337617823479, "grad_norm": 0.5279654224402252, "learning_rate": 3.996573854143517e-05, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.12292104959487915, "step": 955, "valid_targets_mean": 5456.9, "valid_targets_min": 2518 }, { "epoch": 0.8226221079691517, "grad_norm": 0.530627611144268, "learning_rate": 3.9963192850690505e-05, "loss": 0.2654, "loss_nan_ranks": 0, "loss_rank_avg": 0.14889578521251678, "step": 960, "valid_targets_mean": 5652.2, "valid_targets_min": 464 }, { "epoch": 0.8269065981148244, "grad_norm": 0.5292718935261117, "learning_rate": 3.996055603052834e-05, "loss": 0.2657, "loss_nan_ranks": 0, "loss_rank_avg": 0.1426638662815094, "step": 965, "valid_targets_mean": 5372.0, "valid_targets_min": 2310 }, { "epoch": 0.831191088260497, "grad_norm": 0.49393157060692316, "learning_rate": 3.995782809298541e-05, "loss": 0.2672, "loss_nan_ranks": 0, "loss_rank_avg": 0.13456028699874878, "step": 970, "valid_targets_mean": 5692.2, "valid_targets_min": 3007 }, { "epoch": 0.8354755784061697, "grad_norm": 0.5093574922007108, "learning_rate": 3.99550090505144e-05, "loss": 0.2527, "loss_nan_ranks": 0, "loss_rank_avg": 0.11772598326206207, "step": 975, "valid_targets_mean": 4665.6, "valid_targets_min": 2811 }, { "epoch": 0.8397600685518424, "grad_norm": 0.5389340710537845, "learning_rate": 3.995209891598389e-05, "loss": 0.2629, "loss_nan_ranks": 0, "loss_rank_avg": 0.10856447368860245, "step": 980, "valid_targets_mean": 4917.9, "valid_targets_min": 2593 }, { "epoch": 0.844044558697515, "grad_norm": 0.5633173022193055, "learning_rate": 3.994909770267826e-05, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.0946207195520401, "step": 985, "valid_targets_mean": 5132.9, "valid_targets_min": 2355 }, { "epoch": 0.8483290488431876, "grad_norm": 0.5661047160597428, "learning_rate": 3.994600542429766e-05, "loss": 0.255, "loss_nan_ranks": 0, "loss_rank_avg": 0.13344813883304596, "step": 990, "valid_targets_mean": 5267.4, "valid_targets_min": 1603 }, { "epoch": 0.8526135389888603, "grad_norm": 0.4974712864932079, "learning_rate": 3.994282209495796e-05, "loss": 0.25, "loss_nan_ranks": 0, "loss_rank_avg": 0.10783732682466507, "step": 995, "valid_targets_mean": 6089.4, "valid_targets_min": 2375 }, { "epoch": 0.856898029134533, "grad_norm": 0.5203686372043815, "learning_rate": 3.9939547729190635e-05, "loss": 0.2544, "loss_nan_ranks": 0, "loss_rank_avg": 0.11107154190540314, "step": 1000, "valid_targets_mean": 4804.4, "valid_targets_min": 593 }, { "epoch": 0.8611825192802056, "grad_norm": 0.5095587249033884, "learning_rate": 3.993618234194276e-05, "loss": 0.2648, "loss_nan_ranks": 0, "loss_rank_avg": 0.12677043676376343, "step": 1005, "valid_targets_mean": 5111.6, "valid_targets_min": 1473 }, { "epoch": 0.8654670094258783, "grad_norm": 0.5583450696312183, "learning_rate": 3.993272594857688e-05, "loss": 0.2588, "loss_nan_ranks": 0, "loss_rank_avg": 0.10360285639762878, "step": 1010, "valid_targets_mean": 3846.5, "valid_targets_min": 1142 }, { "epoch": 0.869751499571551, "grad_norm": 0.52221496646814, "learning_rate": 3.9929178564871e-05, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.11834236234426498, "step": 1015, "valid_targets_mean": 4285.2, "valid_targets_min": 2182 }, { "epoch": 0.8740359897172236, "grad_norm": 0.4630768401778714, "learning_rate": 3.9925540207018476e-05, "loss": 0.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.11245059967041016, "step": 1020, "valid_targets_mean": 5297.0, "valid_targets_min": 1991 }, { "epoch": 0.8783204798628963, "grad_norm": 0.5543771552921872, "learning_rate": 3.992181089162793e-05, "loss": 0.2542, "loss_nan_ranks": 0, "loss_rank_avg": 0.11139364540576935, "step": 1025, "valid_targets_mean": 5065.1, "valid_targets_min": 2356 }, { "epoch": 0.882604970008569, "grad_norm": 0.4831163743420262, "learning_rate": 3.991799063572323e-05, "loss": 0.248, "loss_nan_ranks": 0, "loss_rank_avg": 0.1225896030664444, "step": 1030, "valid_targets_mean": 5435.6, "valid_targets_min": 2743 }, { "epoch": 0.8868894601542416, "grad_norm": 0.48868600865654355, "learning_rate": 3.991407945674333e-05, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.14089226722717285, "step": 1035, "valid_targets_mean": 4377.1, "valid_targets_min": 1227 }, { "epoch": 0.8911739502999143, "grad_norm": 0.56988270931451, "learning_rate": 3.9910077372542275e-05, "loss": 0.2612, "loss_nan_ranks": 0, "loss_rank_avg": 0.14983482658863068, "step": 1040, "valid_targets_mean": 4440.5, "valid_targets_min": 1002 }, { "epoch": 0.895458440445587, "grad_norm": 0.6135335700902131, "learning_rate": 3.990598440138906e-05, "loss": 0.238, "loss_nan_ranks": 0, "loss_rank_avg": 0.11355569958686829, "step": 1045, "valid_targets_mean": 5958.2, "valid_targets_min": 3276 }, { "epoch": 0.8997429305912596, "grad_norm": 0.5907089677929637, "learning_rate": 3.9901800561967585e-05, "loss": 0.2701, "loss_nan_ranks": 0, "loss_rank_avg": 0.142267107963562, "step": 1050, "valid_targets_mean": 5085.5, "valid_targets_min": 1497 }, { "epoch": 0.9040274207369323, "grad_norm": 0.5304317761747265, "learning_rate": 3.9897525873376536e-05, "loss": 0.2643, "loss_nan_ranks": 0, "loss_rank_avg": 0.1555720418691635, "step": 1055, "valid_targets_mean": 5944.8, "valid_targets_min": 2371 }, { "epoch": 0.908311910882605, "grad_norm": 0.5288262253537347, "learning_rate": 3.9893160355129314e-05, "loss": 0.2673, "loss_nan_ranks": 0, "loss_rank_avg": 0.10222537070512772, "step": 1060, "valid_targets_mean": 4336.6, "valid_targets_min": 1612 }, { "epoch": 0.9125964010282777, "grad_norm": 0.516164532221851, "learning_rate": 3.988870402715395e-05, "loss": 0.2348, "loss_nan_ranks": 0, "loss_rank_avg": 0.09846851974725723, "step": 1065, "valid_targets_mean": 4531.5, "valid_targets_min": 2632 }, { "epoch": 0.9168808911739503, "grad_norm": 0.5836994718154224, "learning_rate": 3.988415690979302e-05, "loss": 0.2661, "loss_nan_ranks": 0, "loss_rank_avg": 0.16352909803390503, "step": 1070, "valid_targets_mean": 5046.2, "valid_targets_min": 2063 }, { "epoch": 0.921165381319623, "grad_norm": 0.504311532246728, "learning_rate": 3.987951902380352e-05, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.1278531849384308, "step": 1075, "valid_targets_mean": 4596.0, "valid_targets_min": 1628 }, { "epoch": 0.9254498714652957, "grad_norm": 0.5683140754140763, "learning_rate": 3.987479039035681e-05, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.14287438988685608, "step": 1080, "valid_targets_mean": 3734.8, "valid_targets_min": 1460 }, { "epoch": 0.9297343616109683, "grad_norm": 0.6658402907336981, "learning_rate": 3.986997103103851e-05, "loss": 0.2519, "loss_nan_ranks": 0, "loss_rank_avg": 0.1435733586549759, "step": 1085, "valid_targets_mean": 4683.5, "valid_targets_min": 2230 }, { "epoch": 0.934018851756641, "grad_norm": 0.5336490395553605, "learning_rate": 3.986506096784835e-05, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.09944146126508713, "step": 1090, "valid_targets_mean": 5346.2, "valid_targets_min": 878 }, { "epoch": 0.9383033419023136, "grad_norm": 0.5146882277747881, "learning_rate": 3.986006022320016e-05, "loss": 0.259, "loss_nan_ranks": 0, "loss_rank_avg": 0.1226465106010437, "step": 1095, "valid_targets_mean": 5573.5, "valid_targets_min": 2145 }, { "epoch": 0.9425878320479862, "grad_norm": 0.5248136140897455, "learning_rate": 3.985496881992169e-05, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.1310267150402069, "step": 1100, "valid_targets_mean": 5006.2, "valid_targets_min": 2506 }, { "epoch": 0.9468723221936589, "grad_norm": 0.4963079106449318, "learning_rate": 3.9849786781254545e-05, "loss": 0.2584, "loss_nan_ranks": 0, "loss_rank_avg": 0.11951654404401779, "step": 1105, "valid_targets_mean": 5100.5, "valid_targets_min": 1529 }, { "epoch": 0.9511568123393316, "grad_norm": 0.5099594473574132, "learning_rate": 3.9844514130854074e-05, "loss": 0.2546, "loss_nan_ranks": 0, "loss_rank_avg": 0.16315767168998718, "step": 1110, "valid_targets_mean": 6070.2, "valid_targets_min": 2569 }, { "epoch": 0.9554413024850043, "grad_norm": 0.5985623194305978, "learning_rate": 3.9839150892789246e-05, "loss": 0.258, "loss_nan_ranks": 0, "loss_rank_avg": 0.10299926996231079, "step": 1115, "valid_targets_mean": 3485.2, "valid_targets_min": 182 }, { "epoch": 0.9597257926306769, "grad_norm": 0.4687631245915332, "learning_rate": 3.983369709154255e-05, "loss": 0.2408, "loss_nan_ranks": 0, "loss_rank_avg": 0.09602198004722595, "step": 1120, "valid_targets_mean": 4476.5, "valid_targets_min": 1512 }, { "epoch": 0.9640102827763496, "grad_norm": 0.5635958054071022, "learning_rate": 3.98281527520099e-05, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.11026757955551147, "step": 1125, "valid_targets_mean": 4010.4, "valid_targets_min": 1727 }, { "epoch": 0.9682947729220223, "grad_norm": 0.5665722329143809, "learning_rate": 3.9822517899500486e-05, "loss": 0.2675, "loss_nan_ranks": 0, "loss_rank_avg": 0.1259326934814453, "step": 1130, "valid_targets_mean": 4350.8, "valid_targets_min": 1457 }, { "epoch": 0.9725792630676949, "grad_norm": 0.5059137742295718, "learning_rate": 3.981679255973669e-05, "loss": 0.2559, "loss_nan_ranks": 0, "loss_rank_avg": 0.1195632740855217, "step": 1135, "valid_targets_mean": 5862.1, "valid_targets_min": 1916 }, { "epoch": 0.9768637532133676, "grad_norm": 0.4913048915853541, "learning_rate": 3.981097675885396e-05, "loss": 0.2537, "loss_nan_ranks": 0, "loss_rank_avg": 0.1371796727180481, "step": 1140, "valid_targets_mean": 5177.4, "valid_targets_min": 2014 }, { "epoch": 0.9811482433590403, "grad_norm": 0.5254857739233036, "learning_rate": 3.980507052340068e-05, "loss": 0.2521, "loss_nan_ranks": 0, "loss_rank_avg": 0.120770163834095, "step": 1145, "valid_targets_mean": 5489.5, "valid_targets_min": 1497 }, { "epoch": 0.9854327335047129, "grad_norm": 0.5748653058226206, "learning_rate": 3.9799073880338055e-05, "loss": 0.2425, "loss_nan_ranks": 0, "loss_rank_avg": 0.11903972923755646, "step": 1150, "valid_targets_mean": 5864.4, "valid_targets_min": 3012 }, { "epoch": 0.9897172236503856, "grad_norm": 0.47846029169056215, "learning_rate": 3.979298685703999e-05, "loss": 0.2414, "loss_nan_ranks": 0, "loss_rank_avg": 0.09142991900444031, "step": 1155, "valid_targets_mean": 4676.9, "valid_targets_min": 1133 }, { "epoch": 0.9940017137960583, "grad_norm": 0.49721265958922034, "learning_rate": 3.978680948129297e-05, "loss": 0.2673, "loss_nan_ranks": 0, "loss_rank_avg": 0.12009415030479431, "step": 1160, "valid_targets_mean": 4889.5, "valid_targets_min": 2491 }, { "epoch": 0.998286203941731, "grad_norm": 0.5997068908898251, "learning_rate": 3.978054178129593e-05, "loss": 0.2485, "loss_nan_ranks": 0, "loss_rank_avg": 0.16987952589988708, "step": 1165, "valid_targets_mean": 5021.4, "valid_targets_min": 3299 }, { "epoch": 1.0025706940874035, "grad_norm": 0.5576183640944067, "learning_rate": 3.977418378566011e-05, "loss": 0.2408, "loss_nan_ranks": 0, "loss_rank_avg": 0.12192939221858978, "step": 1170, "valid_targets_mean": 4643.8, "valid_targets_min": 1323 }, { "epoch": 1.0068551842330762, "grad_norm": 0.6035479518237012, "learning_rate": 3.976773552340894e-05, "loss": 0.2384, "loss_nan_ranks": 0, "loss_rank_avg": 0.1091715395450592, "step": 1175, "valid_targets_mean": 5468.6, "valid_targets_min": 2461 }, { "epoch": 1.0111396743787489, "grad_norm": 0.5524878515251019, "learning_rate": 3.9761197023977924e-05, "loss": 0.2555, "loss_nan_ranks": 0, "loss_rank_avg": 0.10132533311843872, "step": 1180, "valid_targets_mean": 4217.8, "valid_targets_min": 1181 }, { "epoch": 1.0154241645244215, "grad_norm": 0.5302166537716149, "learning_rate": 3.975456831721447e-05, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.12239775061607361, "step": 1185, "valid_targets_mean": 4477.5, "valid_targets_min": 1831 }, { "epoch": 1.0197086546700942, "grad_norm": 0.8143657797961059, "learning_rate": 3.974784943337776e-05, "loss": 0.2426, "loss_nan_ranks": 0, "loss_rank_avg": 0.11950390040874481, "step": 1190, "valid_targets_mean": 3528.0, "valid_targets_min": 1135 }, { "epoch": 1.0239931448157669, "grad_norm": 0.5145644173556422, "learning_rate": 3.9741040403138664e-05, "loss": 0.2275, "loss_nan_ranks": 0, "loss_rank_avg": 0.11581888794898987, "step": 1195, "valid_targets_mean": 5046.9, "valid_targets_min": 3252 }, { "epoch": 1.0282776349614395, "grad_norm": 0.5096075629051414, "learning_rate": 3.9734141257579516e-05, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.11322258412837982, "step": 1200, "valid_targets_mean": 5094.9, "valid_targets_min": 1764 }, { "epoch": 1.0325621251071122, "grad_norm": 0.5452129236572999, "learning_rate": 3.972715202819403e-05, "loss": 0.2338, "loss_nan_ranks": 0, "loss_rank_avg": 0.1197786033153534, "step": 1205, "valid_targets_mean": 4397.4, "valid_targets_min": 1365 }, { "epoch": 1.0368466152527849, "grad_norm": 0.4836356248918647, "learning_rate": 3.9720072746887154e-05, "loss": 0.2394, "loss_nan_ranks": 0, "loss_rank_avg": 0.11884791404008865, "step": 1210, "valid_targets_mean": 5713.0, "valid_targets_min": 3133 }, { "epoch": 1.0411311053984575, "grad_norm": 0.5286827396131738, "learning_rate": 3.9712903445974894e-05, "loss": 0.2391, "loss_nan_ranks": 0, "loss_rank_avg": 0.11177793145179749, "step": 1215, "valid_targets_mean": 4789.9, "valid_targets_min": 1429 }, { "epoch": 1.0454155955441302, "grad_norm": 0.44979507798907414, "learning_rate": 3.9705644158184184e-05, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.08846048265695572, "step": 1220, "valid_targets_mean": 5322.9, "valid_targets_min": 1743 }, { "epoch": 1.0497000856898029, "grad_norm": 0.48284818931206736, "learning_rate": 3.969829491665275e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.1184084340929985, "step": 1225, "valid_targets_mean": 5108.2, "valid_targets_min": 2100 }, { "epoch": 1.0539845758354756, "grad_norm": 0.5530452468519074, "learning_rate": 3.9690855754928936e-05, "loss": 0.2332, "loss_nan_ranks": 0, "loss_rank_avg": 0.10823780298233032, "step": 1230, "valid_targets_mean": 3682.9, "valid_targets_min": 1490 }, { "epoch": 1.0582690659811482, "grad_norm": 0.6477676224717895, "learning_rate": 3.968332670697157e-05, "loss": 0.2426, "loss_nan_ranks": 0, "loss_rank_avg": 0.15097667276859283, "step": 1235, "valid_targets_mean": 5090.2, "valid_targets_min": 1598 }, { "epoch": 1.062553556126821, "grad_norm": 0.4747704952236916, "learning_rate": 3.9675707807149774e-05, "loss": 0.2299, "loss_nan_ranks": 0, "loss_rank_avg": 0.11814823746681213, "step": 1240, "valid_targets_mean": 5738.4, "valid_targets_min": 3191 }, { "epoch": 1.0668380462724936, "grad_norm": 0.48119695863094186, "learning_rate": 3.966799909024286e-05, "loss": 0.2298, "loss_nan_ranks": 0, "loss_rank_avg": 0.10638413578271866, "step": 1245, "valid_targets_mean": 5727.0, "valid_targets_min": 3135 }, { "epoch": 1.0711225364181662, "grad_norm": 0.5072465021718784, "learning_rate": 3.9660200591440136e-05, "loss": 0.235, "loss_nan_ranks": 0, "loss_rank_avg": 0.09678170084953308, "step": 1250, "valid_targets_mean": 4749.6, "valid_targets_min": 1223 }, { "epoch": 1.075407026563839, "grad_norm": 0.47861655127047764, "learning_rate": 3.9652312346340746e-05, "loss": 0.2264, "loss_nan_ranks": 0, "loss_rank_avg": 0.08683246374130249, "step": 1255, "valid_targets_mean": 4310.6, "valid_targets_min": 1645 }, { "epoch": 1.0796915167095116, "grad_norm": 0.5520967853377322, "learning_rate": 3.9644334390953514e-05, "loss": 0.2417, "loss_nan_ranks": 0, "loss_rank_avg": 0.12760165333747864, "step": 1260, "valid_targets_mean": 4486.6, "valid_targets_min": 1234 }, { "epoch": 1.0839760068551842, "grad_norm": 0.5076375139897981, "learning_rate": 3.963626676169679e-05, "loss": 0.2378, "loss_nan_ranks": 0, "loss_rank_avg": 0.11930255591869354, "step": 1265, "valid_targets_mean": 4789.0, "valid_targets_min": 2907 }, { "epoch": 1.088260497000857, "grad_norm": 0.5987933195720649, "learning_rate": 3.962810949539826e-05, "loss": 0.2513, "loss_nan_ranks": 0, "loss_rank_avg": 0.12798230350017548, "step": 1270, "valid_targets_mean": 4584.6, "valid_targets_min": 2098 }, { "epoch": 1.0925449871465296, "grad_norm": 0.5516383003650653, "learning_rate": 3.961986262929481e-05, "loss": 0.2449, "loss_nan_ranks": 0, "loss_rank_avg": 0.14063888788223267, "step": 1275, "valid_targets_mean": 5532.2, "valid_targets_min": 1121 }, { "epoch": 1.0968294772922023, "grad_norm": 0.5399383782336239, "learning_rate": 3.9611526201032336e-05, "loss": 0.2375, "loss_nan_ranks": 0, "loss_rank_avg": 0.11722411215305328, "step": 1280, "valid_targets_mean": 5993.0, "valid_targets_min": 4716 }, { "epoch": 1.101113967437875, "grad_norm": 0.5164083843201357, "learning_rate": 3.9603100248665536e-05, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.13713915646076202, "step": 1285, "valid_targets_mean": 5326.6, "valid_targets_min": 1571 }, { "epoch": 1.1053984575835476, "grad_norm": 0.5589242182917155, "learning_rate": 3.959458481065782e-05, "loss": 0.2422, "loss_nan_ranks": 0, "loss_rank_avg": 0.11845184862613678, "step": 1290, "valid_targets_mean": 4219.1, "valid_targets_min": 2084 }, { "epoch": 1.1096829477292203, "grad_norm": 0.49734016852841817, "learning_rate": 3.9585979925881075e-05, "loss": 0.2349, "loss_nan_ranks": 0, "loss_rank_avg": 0.1256842315196991, "step": 1295, "valid_targets_mean": 5600.0, "valid_targets_min": 1568 }, { "epoch": 1.113967437874893, "grad_norm": 1.0796013091355239, "learning_rate": 3.9577285633615485e-05, "loss": 0.2321, "loss_nan_ranks": 0, "loss_rank_avg": 0.11703415215015411, "step": 1300, "valid_targets_mean": 4676.5, "valid_targets_min": 1971 }, { "epoch": 1.1182519280205656, "grad_norm": 0.5352032156238867, "learning_rate": 3.956850197354939e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.12584301829338074, "step": 1305, "valid_targets_mean": 4500.8, "valid_targets_min": 1902 }, { "epoch": 1.1225364181662383, "grad_norm": 0.5369977973721654, "learning_rate": 3.9559628985779075e-05, "loss": 0.2455, "loss_nan_ranks": 0, "loss_rank_avg": 0.06521826982498169, "step": 1310, "valid_targets_mean": 2152.4, "valid_targets_min": 578 }, { "epoch": 1.126820908311911, "grad_norm": 0.5394440535514909, "learning_rate": 3.955066671080858e-05, "loss": 0.2181, "loss_nan_ranks": 0, "loss_rank_avg": 0.09284225106239319, "step": 1315, "valid_targets_mean": 4841.8, "valid_targets_min": 3460 }, { "epoch": 1.1311053984575836, "grad_norm": 0.5167458668393816, "learning_rate": 3.954161518954956e-05, "loss": 0.2355, "loss_nan_ranks": 0, "loss_rank_avg": 0.13846097886562347, "step": 1320, "valid_targets_mean": 5263.6, "valid_targets_min": 2850 }, { "epoch": 1.1353898886032563, "grad_norm": 0.5249378449576371, "learning_rate": 3.9532474463321036e-05, "loss": 0.2259, "loss_nan_ranks": 0, "loss_rank_avg": 0.10796986520290375, "step": 1325, "valid_targets_mean": 5340.2, "valid_targets_min": 1381 }, { "epoch": 1.139674378748929, "grad_norm": 0.5158354334741792, "learning_rate": 3.952324457384925e-05, "loss": 0.2459, "loss_nan_ranks": 0, "loss_rank_avg": 0.13506674766540527, "step": 1330, "valid_targets_mean": 4589.1, "valid_targets_min": 2922 }, { "epoch": 1.1439588688946016, "grad_norm": 0.5350786311548035, "learning_rate": 3.951392556326747e-05, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.114400215446949, "step": 1335, "valid_targets_mean": 3964.2, "valid_targets_min": 1625 }, { "epoch": 1.1482433590402743, "grad_norm": 0.507025132940053, "learning_rate": 3.950451747411579e-05, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.14559516310691833, "step": 1340, "valid_targets_mean": 5644.9, "valid_targets_min": 807 }, { "epoch": 1.152527849185947, "grad_norm": 0.5534439903907535, "learning_rate": 3.949502034934092e-05, "loss": 0.234, "loss_nan_ranks": 0, "loss_rank_avg": 0.10887180268764496, "step": 1345, "valid_targets_mean": 5214.2, "valid_targets_min": 3494 }, { "epoch": 1.1568123393316196, "grad_norm": 0.4897888427615898, "learning_rate": 3.9485434232296034e-05, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.12154433131217957, "step": 1350, "valid_targets_mean": 6807.4, "valid_targets_min": 3141 }, { "epoch": 1.1610968294772923, "grad_norm": 0.5142647411009782, "learning_rate": 3.947575916674051e-05, "loss": 0.2465, "loss_nan_ranks": 0, "loss_rank_avg": 0.15283022820949554, "step": 1355, "valid_targets_mean": 5998.6, "valid_targets_min": 4767 }, { "epoch": 1.165381319622965, "grad_norm": 0.578472327995002, "learning_rate": 3.94659951968398e-05, "loss": 0.2452, "loss_nan_ranks": 0, "loss_rank_avg": 0.16904443502426147, "step": 1360, "valid_targets_mean": 4652.2, "valid_targets_min": 2686 }, { "epoch": 1.1696658097686377, "grad_norm": 0.5012200266051032, "learning_rate": 3.9456142367165165e-05, "loss": 0.2429, "loss_nan_ranks": 0, "loss_rank_avg": 0.13777001202106476, "step": 1365, "valid_targets_mean": 5621.0, "valid_targets_min": 2270 }, { "epoch": 1.17395029991431, "grad_norm": 0.5059125605439242, "learning_rate": 3.944620072269351e-05, "loss": 0.2418, "loss_nan_ranks": 0, "loss_rank_avg": 0.10521627962589264, "step": 1370, "valid_targets_mean": 6382.9, "valid_targets_min": 2711 }, { "epoch": 1.1782347900599828, "grad_norm": 0.5461561352834591, "learning_rate": 3.9436170308807164e-05, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.120382159948349, "step": 1375, "valid_targets_mean": 5325.1, "valid_targets_min": 3385 }, { "epoch": 1.1825192802056554, "grad_norm": 0.5037824311138134, "learning_rate": 3.94260511712937e-05, "loss": 0.238, "loss_nan_ranks": 0, "loss_rank_avg": 0.12292107194662094, "step": 1380, "valid_targets_mean": 4843.8, "valid_targets_min": 3123 }, { "epoch": 1.1868037703513281, "grad_norm": 0.5102819898803347, "learning_rate": 3.9415843356345664e-05, "loss": 0.2491, "loss_nan_ranks": 0, "loss_rank_avg": 0.10522742569446564, "step": 1385, "valid_targets_mean": 4137.6, "valid_targets_min": 1397 }, { "epoch": 1.1910882604970008, "grad_norm": 0.5069734026849441, "learning_rate": 3.940554691056043e-05, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.11096564680337906, "step": 1390, "valid_targets_mean": 4371.0, "valid_targets_min": 993 }, { "epoch": 1.1953727506426735, "grad_norm": 0.6163302866315783, "learning_rate": 3.939516188093996e-05, "loss": 0.2417, "loss_nan_ranks": 0, "loss_rank_avg": 0.13463535904884338, "step": 1395, "valid_targets_mean": 5707.9, "valid_targets_min": 2948 }, { "epoch": 1.1996572407883461, "grad_norm": 0.4759043815168194, "learning_rate": 3.938468831489057e-05, "loss": 0.227, "loss_nan_ranks": 0, "loss_rank_avg": 0.10264989733695984, "step": 1400, "valid_targets_mean": 3913.9, "valid_targets_min": 1941 }, { "epoch": 1.2039417309340188, "grad_norm": 0.5280325447990015, "learning_rate": 3.937412626022276e-05, "loss": 0.2373, "loss_nan_ranks": 0, "loss_rank_avg": 0.11383386701345444, "step": 1405, "valid_targets_mean": 4232.0, "valid_targets_min": 2762 }, { "epoch": 1.2082262210796915, "grad_norm": 0.4313710336430502, "learning_rate": 3.936347576515096e-05, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.11712110042572021, "step": 1410, "valid_targets_mean": 5636.2, "valid_targets_min": 1780 }, { "epoch": 1.2125107112253641, "grad_norm": 0.5678079911208448, "learning_rate": 3.935273687829329e-05, "loss": 0.2401, "loss_nan_ranks": 0, "loss_rank_avg": 0.14850357174873352, "step": 1415, "valid_targets_mean": 4743.9, "valid_targets_min": 1330 }, { "epoch": 1.2167952013710368, "grad_norm": 0.5436449188870729, "learning_rate": 3.934190964867142e-05, "loss": 0.2465, "loss_nan_ranks": 0, "loss_rank_avg": 0.10638877749443054, "step": 1420, "valid_targets_mean": 4788.4, "valid_targets_min": 2395 }, { "epoch": 1.2210796915167095, "grad_norm": 0.5836160715561696, "learning_rate": 3.933099412571026e-05, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.1167445033788681, "step": 1425, "valid_targets_mean": 3805.0, "valid_targets_min": 1026 }, { "epoch": 1.2253641816623821, "grad_norm": 0.5470623808192315, "learning_rate": 3.9319990359237754e-05, "loss": 0.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.10465378314256668, "step": 1430, "valid_targets_mean": 5702.0, "valid_targets_min": 1685 }, { "epoch": 1.2296486718080548, "grad_norm": 0.5805817722056696, "learning_rate": 3.930889839948472e-05, "loss": 0.2447, "loss_nan_ranks": 0, "loss_rank_avg": 0.13942649960517883, "step": 1435, "valid_targets_mean": 5853.0, "valid_targets_min": 3992 }, { "epoch": 1.2339331619537275, "grad_norm": 0.6131744635856514, "learning_rate": 3.92977182970845e-05, "loss": 0.2487, "loss_nan_ranks": 0, "loss_rank_avg": 0.11150114983320236, "step": 1440, "valid_targets_mean": 3655.6, "valid_targets_min": 1422 }, { "epoch": 1.2382176520994002, "grad_norm": 0.5838711652791473, "learning_rate": 3.9286450103072845e-05, "loss": 0.2363, "loss_nan_ranks": 0, "loss_rank_avg": 0.11811933666467667, "step": 1445, "valid_targets_mean": 5601.4, "valid_targets_min": 1721 }, { "epoch": 1.2425021422450728, "grad_norm": 0.5154752965394229, "learning_rate": 3.927509386888762e-05, "loss": 0.2398, "loss_nan_ranks": 0, "loss_rank_avg": 0.08512001484632492, "step": 1450, "valid_targets_mean": 5162.0, "valid_targets_min": 1416 }, { "epoch": 1.2467866323907455, "grad_norm": 0.4974023561818171, "learning_rate": 3.9263649646368574e-05, "loss": 0.2325, "loss_nan_ranks": 0, "loss_rank_avg": 0.12567369639873505, "step": 1455, "valid_targets_mean": 5258.8, "valid_targets_min": 2672 }, { "epoch": 1.2510711225364182, "grad_norm": 0.5739391983178774, "learning_rate": 3.925211748775711e-05, "loss": 0.2265, "loss_nan_ranks": 0, "loss_rank_avg": 0.11506156623363495, "step": 1460, "valid_targets_mean": 5422.0, "valid_targets_min": 2651 }, { "epoch": 1.2553556126820908, "grad_norm": 0.4588309784359663, "learning_rate": 3.924049744569606e-05, "loss": 0.2268, "loss_nan_ranks": 0, "loss_rank_avg": 0.10045787692070007, "step": 1465, "valid_targets_mean": 5433.0, "valid_targets_min": 2926 }, { "epoch": 1.2596401028277635, "grad_norm": 0.6336871374145083, "learning_rate": 3.9228789573229435e-05, "loss": 0.2376, "loss_nan_ranks": 0, "loss_rank_avg": 0.1141088455915451, "step": 1470, "valid_targets_mean": 6424.4, "valid_targets_min": 3386 }, { "epoch": 1.2639245929734362, "grad_norm": 0.5888888726481188, "learning_rate": 3.921699392380217e-05, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.11039966344833374, "step": 1475, "valid_targets_mean": 3917.6, "valid_targets_min": 1241 }, { "epoch": 1.2682090831191088, "grad_norm": 0.4739663401324403, "learning_rate": 3.9205110551259887e-05, "loss": 0.2467, "loss_nan_ranks": 0, "loss_rank_avg": 0.10644856095314026, "step": 1480, "valid_targets_mean": 5735.8, "valid_targets_min": 2296 }, { "epoch": 1.2724935732647815, "grad_norm": 0.4744561144457731, "learning_rate": 3.919313950984865e-05, "loss": 0.2216, "loss_nan_ranks": 0, "loss_rank_avg": 0.09622097760438919, "step": 1485, "valid_targets_mean": 5583.1, "valid_targets_min": 3786 }, { "epoch": 1.2767780634104542, "grad_norm": 0.46507247473662877, "learning_rate": 3.918108085421475e-05, "loss": 0.2343, "loss_nan_ranks": 0, "loss_rank_avg": 0.10571260750293732, "step": 1490, "valid_targets_mean": 4983.6, "valid_targets_min": 3087 }, { "epoch": 1.2810625535561269, "grad_norm": 0.520596404130355, "learning_rate": 3.916893463940439e-05, "loss": 0.2471, "loss_nan_ranks": 0, "loss_rank_avg": 0.10671904683113098, "step": 1495, "valid_targets_mean": 5082.2, "valid_targets_min": 1445 }, { "epoch": 1.2853470437017995, "grad_norm": 0.6672099202048909, "learning_rate": 3.91567009208635e-05, "loss": 0.2313, "loss_nan_ranks": 0, "loss_rank_avg": 0.09037558734416962, "step": 1500, "valid_targets_mean": 4235.4, "valid_targets_min": 1926 }, { "epoch": 1.2896315338474722, "grad_norm": 0.5003672248035446, "learning_rate": 3.914437975443741e-05, "loss": 0.2349, "loss_nan_ranks": 0, "loss_rank_avg": 0.10948409140110016, "step": 1505, "valid_targets_mean": 4737.6, "valid_targets_min": 1773 }, { "epoch": 1.2939160239931449, "grad_norm": 0.6007120324301214, "learning_rate": 3.91319711963707e-05, "loss": 0.2465, "loss_nan_ranks": 0, "loss_rank_avg": 0.12115178257226944, "step": 1510, "valid_targets_mean": 3282.4, "valid_targets_min": 1669 }, { "epoch": 1.2982005141388175, "grad_norm": 0.44395621445516503, "learning_rate": 3.911947530330683e-05, "loss": 0.2234, "loss_nan_ranks": 0, "loss_rank_avg": 0.13494271039962769, "step": 1515, "valid_targets_mean": 5397.8, "valid_targets_min": 2902 }, { "epoch": 1.3024850042844902, "grad_norm": 0.4727033453216096, "learning_rate": 3.910689213228795e-05, "loss": 0.2383, "loss_nan_ranks": 0, "loss_rank_avg": 0.11796768754720688, "step": 1520, "valid_targets_mean": 5473.4, "valid_targets_min": 3285 }, { "epoch": 1.3067694944301629, "grad_norm": 0.4409730908944917, "learning_rate": 3.909422174075462e-05, "loss": 0.2375, "loss_nan_ranks": 0, "loss_rank_avg": 0.09463514387607574, "step": 1525, "valid_targets_mean": 4376.8, "valid_targets_min": 1670 }, { "epoch": 1.3110539845758356, "grad_norm": 0.4902923230647443, "learning_rate": 3.908146418654556e-05, "loss": 0.2562, "loss_nan_ranks": 0, "loss_rank_avg": 0.09760729223489761, "step": 1530, "valid_targets_mean": 5181.0, "valid_targets_min": 2707 }, { "epoch": 1.3153384747215082, "grad_norm": 0.5157944969179804, "learning_rate": 3.9068619527897366e-05, "loss": 0.23, "loss_nan_ranks": 0, "loss_rank_avg": 0.07778498530387878, "step": 1535, "valid_targets_mean": 3545.9, "valid_targets_min": 1097 }, { "epoch": 1.3196229648671807, "grad_norm": 0.5078174223015692, "learning_rate": 3.905568782344426e-05, "loss": 0.2251, "loss_nan_ranks": 0, "loss_rank_avg": 0.10518595576286316, "step": 1540, "valid_targets_mean": 4583.6, "valid_targets_min": 852 }, { "epoch": 1.3239074550128533, "grad_norm": 0.5457009602166955, "learning_rate": 3.904266913221784e-05, "loss": 0.2305, "loss_nan_ranks": 0, "loss_rank_avg": 0.12312053143978119, "step": 1545, "valid_targets_mean": 4720.4, "valid_targets_min": 1836 }, { "epoch": 1.328191945158526, "grad_norm": 0.5099687710270526, "learning_rate": 3.9029563513646724e-05, "loss": 0.2385, "loss_nan_ranks": 0, "loss_rank_avg": 0.10449822247028351, "step": 1550, "valid_targets_mean": 4636.4, "valid_targets_min": 1042 }, { "epoch": 1.3324764353041987, "grad_norm": 0.5287799852413793, "learning_rate": 3.9016371027556396e-05, "loss": 0.2336, "loss_nan_ranks": 0, "loss_rank_avg": 0.11712635308504105, "step": 1555, "valid_targets_mean": 4263.0, "valid_targets_min": 1504 }, { "epoch": 1.3367609254498714, "grad_norm": 0.5810619731197988, "learning_rate": 3.900309173416888e-05, "loss": 0.2293, "loss_nan_ranks": 0, "loss_rank_avg": 0.13848112523555756, "step": 1560, "valid_targets_mean": 4872.2, "valid_targets_min": 2033 }, { "epoch": 1.341045415595544, "grad_norm": 0.5273047760121564, "learning_rate": 3.898972569410243e-05, "loss": 0.2277, "loss_nan_ranks": 0, "loss_rank_avg": 0.11683964729309082, "step": 1565, "valid_targets_mean": 5287.6, "valid_targets_min": 1893 }, { "epoch": 1.3453299057412167, "grad_norm": 0.49578100784275103, "learning_rate": 3.897627296837131e-05, "loss": 0.2494, "loss_nan_ranks": 0, "loss_rank_avg": 0.11568988859653473, "step": 1570, "valid_targets_mean": 5398.9, "valid_targets_min": 3649 }, { "epoch": 1.3496143958868894, "grad_norm": 0.46855836444786286, "learning_rate": 3.8962733618385506e-05, "loss": 0.2214, "loss_nan_ranks": 0, "loss_rank_avg": 0.11565341055393219, "step": 1575, "valid_targets_mean": 4907.6, "valid_targets_min": 2337 }, { "epoch": 1.353898886032562, "grad_norm": 0.4958189472696427, "learning_rate": 3.894910770595039e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.09800922870635986, "step": 1580, "valid_targets_mean": 6002.4, "valid_targets_min": 1912 }, { "epoch": 1.3581833761782347, "grad_norm": 0.5894328386022706, "learning_rate": 3.8935395293266516e-05, "loss": 0.2525, "loss_nan_ranks": 0, "loss_rank_avg": 0.0854383036494255, "step": 1585, "valid_targets_mean": 4064.6, "valid_targets_min": 1383 }, { "epoch": 1.3624678663239074, "grad_norm": 0.49166187454600596, "learning_rate": 3.89215964429293e-05, "loss": 0.2261, "loss_nan_ranks": 0, "loss_rank_avg": 0.11674100160598755, "step": 1590, "valid_targets_mean": 5408.1, "valid_targets_min": 1931 }, { "epoch": 1.36675235646958, "grad_norm": 0.5772449814015101, "learning_rate": 3.890771121792872e-05, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.15250825881958008, "step": 1595, "valid_targets_mean": 5092.9, "valid_targets_min": 2054 }, { "epoch": 1.3710368466152527, "grad_norm": 0.5085778895382281, "learning_rate": 3.889373968164905e-05, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.09528356790542603, "step": 1600, "valid_targets_mean": 4869.2, "valid_targets_min": 1497 }, { "epoch": 1.3753213367609254, "grad_norm": 0.5243776347992599, "learning_rate": 3.887968189786856e-05, "loss": 0.2314, "loss_nan_ranks": 0, "loss_rank_avg": 0.0885411947965622, "step": 1605, "valid_targets_mean": 4016.6, "valid_targets_min": 830 }, { "epoch": 1.379605826906598, "grad_norm": 0.5220292901952734, "learning_rate": 3.886553793075924e-05, "loss": 0.2321, "loss_nan_ranks": 0, "loss_rank_avg": 0.11466914415359497, "step": 1610, "valid_targets_mean": 5926.9, "valid_targets_min": 4034 }, { "epoch": 1.3838903170522707, "grad_norm": 0.5076872075997929, "learning_rate": 3.885130784488647e-05, "loss": 0.2239, "loss_nan_ranks": 0, "loss_rank_avg": 0.10209037363529205, "step": 1615, "valid_targets_mean": 5117.1, "valid_targets_min": 2323 }, { "epoch": 1.3881748071979434, "grad_norm": 0.5633778381637327, "learning_rate": 3.8836991705208776e-05, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.13901841640472412, "step": 1620, "valid_targets_mean": 5037.9, "valid_targets_min": 1173 }, { "epoch": 1.392459297343616, "grad_norm": 0.5172796487217647, "learning_rate": 3.8822589577077516e-05, "loss": 0.2327, "loss_nan_ranks": 0, "loss_rank_avg": 0.11917863041162491, "step": 1625, "valid_targets_mean": 4597.6, "valid_targets_min": 738 }, { "epoch": 1.3967437874892887, "grad_norm": 0.5836629834083695, "learning_rate": 3.880810152623655e-05, "loss": 0.2435, "loss_nan_ranks": 0, "loss_rank_avg": 0.1187589019536972, "step": 1630, "valid_targets_mean": 5212.9, "valid_targets_min": 2639 }, { "epoch": 1.4010282776349614, "grad_norm": 0.46315449970055106, "learning_rate": 3.879352761882196e-05, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.11266039311885834, "step": 1635, "valid_targets_mean": 5534.8, "valid_targets_min": 449 }, { "epoch": 1.405312767780634, "grad_norm": 0.48359082235776496, "learning_rate": 3.877886792136179e-05, "loss": 0.2329, "loss_nan_ranks": 0, "loss_rank_avg": 0.11315010488033295, "step": 1640, "valid_targets_mean": 5587.9, "valid_targets_min": 3047 }, { "epoch": 1.4095972579263067, "grad_norm": 0.5036320475550751, "learning_rate": 3.876412250077566e-05, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.11478479206562042, "step": 1645, "valid_targets_mean": 4597.0, "valid_targets_min": 2566 }, { "epoch": 1.4138817480719794, "grad_norm": 0.5576450862795339, "learning_rate": 3.874929142437454e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.15003828704357147, "step": 1650, "valid_targets_mean": 6018.1, "valid_targets_min": 3425 }, { "epoch": 1.418166238217652, "grad_norm": 0.5004516414353842, "learning_rate": 3.8734374759860384e-05, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.11132154613733292, "step": 1655, "valid_targets_mean": 5050.9, "valid_targets_min": 1796 }, { "epoch": 1.4224507283633248, "grad_norm": 0.5009886073584217, "learning_rate": 3.8719372575325856e-05, "loss": 0.213, "loss_nan_ranks": 0, "loss_rank_avg": 0.10907307267189026, "step": 1660, "valid_targets_mean": 6238.2, "valid_targets_min": 3435 }, { "epoch": 1.4267352185089974, "grad_norm": 0.7075590218522548, "learning_rate": 3.8704284939254016e-05, "loss": 0.2211, "loss_nan_ranks": 0, "loss_rank_avg": 0.11796370148658752, "step": 1665, "valid_targets_mean": 4848.0, "valid_targets_min": 2130 }, { "epoch": 1.43101970865467, "grad_norm": 0.4737684683625076, "learning_rate": 3.868911192051798e-05, "loss": 0.236, "loss_nan_ranks": 0, "loss_rank_avg": 0.12450909614562988, "step": 1670, "valid_targets_mean": 4871.0, "valid_targets_min": 2607 }, { "epoch": 1.4353041988003428, "grad_norm": 0.49240871949752624, "learning_rate": 3.8673853588380636e-05, "loss": 0.2222, "loss_nan_ranks": 0, "loss_rank_avg": 0.1182079166173935, "step": 1675, "valid_targets_mean": 5182.0, "valid_targets_min": 3373 }, { "epoch": 1.4395886889460154, "grad_norm": 0.5645221728062096, "learning_rate": 3.8658510012494315e-05, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.12042039632797241, "step": 1680, "valid_targets_mean": 5086.6, "valid_targets_min": 2631 }, { "epoch": 1.443873179091688, "grad_norm": 0.4866729059138686, "learning_rate": 3.864308126290048e-05, "loss": 0.2353, "loss_nan_ranks": 0, "loss_rank_avg": 0.11386478692293167, "step": 1685, "valid_targets_mean": 5221.1, "valid_targets_min": 3102 }, { "epoch": 1.4481576692373608, "grad_norm": 0.4658043009744602, "learning_rate": 3.8627567410029384e-05, "loss": 0.2245, "loss_nan_ranks": 0, "loss_rank_avg": 0.09366113692522049, "step": 1690, "valid_targets_mean": 4225.1, "valid_targets_min": 2334 }, { "epoch": 1.4524421593830334, "grad_norm": 0.6858090737961489, "learning_rate": 3.8611968524699785e-05, "loss": 0.2303, "loss_nan_ranks": 0, "loss_rank_avg": 0.11841071397066116, "step": 1695, "valid_targets_mean": 5201.1, "valid_targets_min": 644 }, { "epoch": 1.4567266495287061, "grad_norm": 0.4830762365406248, "learning_rate": 3.85962846781186e-05, "loss": 0.2302, "loss_nan_ranks": 0, "loss_rank_avg": 0.08972778916358948, "step": 1700, "valid_targets_mean": 3782.6, "valid_targets_min": 719 }, { "epoch": 1.4610111396743788, "grad_norm": 0.5067013636299821, "learning_rate": 3.8580515941880575e-05, "loss": 0.2333, "loss_nan_ranks": 0, "loss_rank_avg": 0.10617825388908386, "step": 1705, "valid_targets_mean": 4790.6, "valid_targets_min": 2243 }, { "epoch": 1.4652956298200515, "grad_norm": 0.4674148374739586, "learning_rate": 3.856466238796797e-05, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.11428733170032501, "step": 1710, "valid_targets_mean": 5591.4, "valid_targets_min": 2066 }, { "epoch": 1.4695801199657241, "grad_norm": 0.5011619719025958, "learning_rate": 3.8548724088750226e-05, "loss": 0.2183, "loss_nan_ranks": 0, "loss_rank_avg": 0.11932536959648132, "step": 1715, "valid_targets_mean": 5395.4, "valid_targets_min": 2465 }, { "epoch": 1.4738646101113968, "grad_norm": 0.43993044430943745, "learning_rate": 3.853270111698364e-05, "loss": 0.2188, "loss_nan_ranks": 0, "loss_rank_avg": 0.10304902493953705, "step": 1720, "valid_targets_mean": 5551.4, "valid_targets_min": 2404 }, { "epoch": 1.4781491002570695, "grad_norm": 0.45745867204854895, "learning_rate": 3.851659354581102e-05, "loss": 0.2214, "loss_nan_ranks": 0, "loss_rank_avg": 0.10135609656572342, "step": 1725, "valid_targets_mean": 5176.1, "valid_targets_min": 3026 }, { "epoch": 1.4824335904027421, "grad_norm": 0.4826171730375347, "learning_rate": 3.850040144876138e-05, "loss": 0.2299, "loss_nan_ranks": 0, "loss_rank_avg": 0.11102210730314255, "step": 1730, "valid_targets_mean": 5723.2, "valid_targets_min": 2724 }, { "epoch": 1.4867180805484148, "grad_norm": 0.5631587425192481, "learning_rate": 3.8484124899749546e-05, "loss": 0.2431, "loss_nan_ranks": 0, "loss_rank_avg": 0.14050203561782837, "step": 1735, "valid_targets_mean": 4802.1, "valid_targets_min": 1329 }, { "epoch": 1.4910025706940875, "grad_norm": 0.4778645712533244, "learning_rate": 3.846776397307589e-05, "loss": 0.2391, "loss_nan_ranks": 0, "loss_rank_avg": 0.13428761065006256, "step": 1740, "valid_targets_mean": 6715.9, "valid_targets_min": 1410 }, { "epoch": 1.4952870608397602, "grad_norm": 0.47558774254834896, "learning_rate": 3.8451318743425956e-05, "loss": 0.2338, "loss_nan_ranks": 0, "loss_rank_avg": 0.14050710201263428, "step": 1745, "valid_targets_mean": 5461.2, "valid_targets_min": 2104 }, { "epoch": 1.4995715509854328, "grad_norm": 0.5020280960692198, "learning_rate": 3.8434789285870086e-05, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.12446136027574539, "step": 1750, "valid_targets_mean": 4883.2, "valid_targets_min": 2589 }, { "epoch": 1.5038560411311055, "grad_norm": 0.46458323275607555, "learning_rate": 3.8418175675863156e-05, "loss": 0.2235, "loss_nan_ranks": 0, "loss_rank_avg": 0.11468029022216797, "step": 1755, "valid_targets_mean": 5307.2, "valid_targets_min": 2860 }, { "epoch": 1.5081405312767782, "grad_norm": 0.46789760447295525, "learning_rate": 3.840147798924416e-05, "loss": 0.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.11490252614021301, "step": 1760, "valid_targets_mean": 5207.2, "valid_targets_min": 3608 }, { "epoch": 1.5124250214224508, "grad_norm": 0.5021006585006861, "learning_rate": 3.83846963022359e-05, "loss": 0.2316, "loss_nan_ranks": 0, "loss_rank_avg": 0.110697902739048, "step": 1765, "valid_targets_mean": 5780.4, "valid_targets_min": 1822 }, { "epoch": 1.5167095115681235, "grad_norm": 0.469853039317634, "learning_rate": 3.836783069144463e-05, "loss": 0.2229, "loss_nan_ranks": 0, "loss_rank_avg": 0.1256060153245926, "step": 1770, "valid_targets_mean": 6065.6, "valid_targets_min": 1991 }, { "epoch": 1.5209940017137962, "grad_norm": 0.4716821318464838, "learning_rate": 3.8350881233859685e-05, "loss": 0.2472, "loss_nan_ranks": 0, "loss_rank_avg": 0.11349677294492722, "step": 1775, "valid_targets_mean": 4324.6, "valid_targets_min": 1790 }, { "epoch": 1.5252784918594688, "grad_norm": 0.536991970869005, "learning_rate": 3.833384800685319e-05, "loss": 0.2318, "loss_nan_ranks": 0, "loss_rank_avg": 0.10904942452907562, "step": 1780, "valid_targets_mean": 3615.6, "valid_targets_min": 505 }, { "epoch": 1.5295629820051415, "grad_norm": 0.485747456917392, "learning_rate": 3.831673108817963e-05, "loss": 0.2482, "loss_nan_ranks": 0, "loss_rank_avg": 0.10863450169563293, "step": 1785, "valid_targets_mean": 5838.9, "valid_targets_min": 4549 }, { "epoch": 1.5338474721508142, "grad_norm": 0.5198449290197883, "learning_rate": 3.829953055597555e-05, "loss": 0.2441, "loss_nan_ranks": 0, "loss_rank_avg": 0.12037435919046402, "step": 1790, "valid_targets_mean": 4294.2, "valid_targets_min": 1412 }, { "epoch": 1.5381319622964869, "grad_norm": 0.4606032330821934, "learning_rate": 3.8282246488759176e-05, "loss": 0.2291, "loss_nan_ranks": 0, "loss_rank_avg": 0.10967078804969788, "step": 1795, "valid_targets_mean": 5616.6, "valid_targets_min": 2014 }, { "epoch": 1.5424164524421595, "grad_norm": 0.5099176146994311, "learning_rate": 3.8264878965430054e-05, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.12301696091890335, "step": 1800, "valid_targets_mean": 5868.0, "valid_targets_min": 2649 }, { "epoch": 1.5467009425878322, "grad_norm": 0.46299916466979724, "learning_rate": 3.824742806526871e-05, "loss": 0.2215, "loss_nan_ranks": 0, "loss_rank_avg": 0.09365905821323395, "step": 1805, "valid_targets_mean": 5420.4, "valid_targets_min": 1664 }, { "epoch": 1.5509854327335049, "grad_norm": 0.4617740195208103, "learning_rate": 3.8229893867936276e-05, "loss": 0.2368, "loss_nan_ranks": 0, "loss_rank_avg": 0.11876237392425537, "step": 1810, "valid_targets_mean": 5358.9, "valid_targets_min": 3369 }, { "epoch": 1.5552699228791775, "grad_norm": 0.5626159117550897, "learning_rate": 3.821227645347409e-05, "loss": 0.2435, "loss_nan_ranks": 0, "loss_rank_avg": 0.15046226978302002, "step": 1815, "valid_targets_mean": 5776.0, "valid_targets_min": 3152 }, { "epoch": 1.5595544130248502, "grad_norm": 0.4959252152313045, "learning_rate": 3.819457590230342e-05, "loss": 0.2397, "loss_nan_ranks": 0, "loss_rank_avg": 0.14104165136814117, "step": 1820, "valid_targets_mean": 5804.4, "valid_targets_min": 3132 }, { "epoch": 1.5638389031705227, "grad_norm": 0.48077074587515184, "learning_rate": 3.8176792295224994e-05, "loss": 0.2305, "loss_nan_ranks": 0, "loss_rank_avg": 0.13259726762771606, "step": 1825, "valid_targets_mean": 4807.0, "valid_targets_min": 935 }, { "epoch": 1.5681233933161953, "grad_norm": 0.5242143074489919, "learning_rate": 3.815892571341871e-05, "loss": 0.2467, "loss_nan_ranks": 0, "loss_rank_avg": 0.1247769221663475, "step": 1830, "valid_targets_mean": 5371.4, "valid_targets_min": 2433 }, { "epoch": 1.572407883461868, "grad_norm": 0.4281594807768039, "learning_rate": 3.814097623844322e-05, "loss": 0.22, "loss_nan_ranks": 0, "loss_rank_avg": 0.11494001746177673, "step": 1835, "valid_targets_mean": 5965.5, "valid_targets_min": 1483 }, { "epoch": 1.5766923736075407, "grad_norm": 0.422218804665581, "learning_rate": 3.8122943952235576e-05, "loss": 0.2251, "loss_nan_ranks": 0, "loss_rank_avg": 0.09081430733203888, "step": 1840, "valid_targets_mean": 4779.8, "valid_targets_min": 1111 }, { "epoch": 1.5809768637532133, "grad_norm": 0.5163048678096387, "learning_rate": 3.810482893711086e-05, "loss": 0.249, "loss_nan_ranks": 0, "loss_rank_avg": 0.15263834595680237, "step": 1845, "valid_targets_mean": 5439.9, "valid_targets_min": 1915 }, { "epoch": 1.585261353898886, "grad_norm": 0.5418579237620981, "learning_rate": 3.8086631275761795e-05, "loss": 0.218, "loss_nan_ranks": 0, "loss_rank_avg": 0.10625886172056198, "step": 1850, "valid_targets_mean": 4995.9, "valid_targets_min": 2001 }, { "epoch": 1.5895458440445587, "grad_norm": 0.47484588455080984, "learning_rate": 3.806835105125837e-05, "loss": 0.2225, "loss_nan_ranks": 0, "loss_rank_avg": 0.10894256830215454, "step": 1855, "valid_targets_mean": 5525.2, "valid_targets_min": 2468 }, { "epoch": 1.5938303341902313, "grad_norm": 0.5207951893762186, "learning_rate": 3.804998834704746e-05, "loss": 0.2289, "loss_nan_ranks": 0, "loss_rank_avg": 0.1276807188987732, "step": 1860, "valid_targets_mean": 4585.6, "valid_targets_min": 1850 }, { "epoch": 1.598114824335904, "grad_norm": 0.514875419878507, "learning_rate": 3.803154324695248e-05, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.11865563690662384, "step": 1865, "valid_targets_mean": 4956.0, "valid_targets_min": 1346 }, { "epoch": 1.6023993144815767, "grad_norm": 0.4886307508960448, "learning_rate": 3.801301583517292e-05, "loss": 0.2196, "loss_nan_ranks": 0, "loss_rank_avg": 0.09256631880998611, "step": 1870, "valid_targets_mean": 4049.8, "valid_targets_min": 1177 }, { "epoch": 1.6066838046272494, "grad_norm": 0.5480634986060973, "learning_rate": 3.799440619628406e-05, "loss": 0.2538, "loss_nan_ranks": 0, "loss_rank_avg": 0.27145320177078247, "step": 1875, "valid_targets_mean": 6011.6, "valid_targets_min": 2061 }, { "epoch": 1.610968294772922, "grad_norm": 0.48254595774152576, "learning_rate": 3.797571441523652e-05, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.11581829190254211, "step": 1880, "valid_targets_mean": 4414.2, "valid_targets_min": 1389 }, { "epoch": 1.6152527849185947, "grad_norm": 0.4647566333863733, "learning_rate": 3.795694057735586e-05, "loss": 0.2208, "loss_nan_ranks": 0, "loss_rank_avg": 0.1067863404750824, "step": 1885, "valid_targets_mean": 5442.4, "valid_targets_min": 3921 }, { "epoch": 1.6195372750642674, "grad_norm": 0.5357115187409527, "learning_rate": 3.793808476834228e-05, "loss": 0.2255, "loss_nan_ranks": 0, "loss_rank_avg": 0.1260157823562622, "step": 1890, "valid_targets_mean": 5031.4, "valid_targets_min": 467 }, { "epoch": 1.62382176520994, "grad_norm": 0.44411910008494787, "learning_rate": 3.79191470742701e-05, "loss": 0.2272, "loss_nan_ranks": 0, "loss_rank_avg": 0.08977937698364258, "step": 1895, "valid_targets_mean": 4903.1, "valid_targets_min": 3398 }, { "epoch": 1.6281062553556127, "grad_norm": 0.6058848653295341, "learning_rate": 3.790012758158749e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.1174095869064331, "step": 1900, "valid_targets_mean": 6338.4, "valid_targets_min": 3480 }, { "epoch": 1.6323907455012854, "grad_norm": 0.46118509931806967, "learning_rate": 3.7881026377115985e-05, "loss": 0.2274, "loss_nan_ranks": 0, "loss_rank_avg": 0.11545247584581375, "step": 1905, "valid_targets_mean": 5339.1, "valid_targets_min": 1100 }, { "epoch": 1.636675235646958, "grad_norm": 0.47188924482314787, "learning_rate": 3.786184354805014e-05, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.1037750393152237, "step": 1910, "valid_targets_mean": 5157.8, "valid_targets_min": 1471 }, { "epoch": 1.6409597257926307, "grad_norm": 0.4760249550925058, "learning_rate": 3.784257918195711e-05, "loss": 0.2221, "loss_nan_ranks": 0, "loss_rank_avg": 0.104103222489357, "step": 1915, "valid_targets_mean": 4309.8, "valid_targets_min": 2781 }, { "epoch": 1.6452442159383034, "grad_norm": 0.737205338310611, "learning_rate": 3.782323336677626e-05, "loss": 0.2276, "loss_nan_ranks": 0, "loss_rank_avg": 0.11420521140098572, "step": 1920, "valid_targets_mean": 3715.8, "valid_targets_min": 1727 }, { "epoch": 1.649528706083976, "grad_norm": 0.527920669307789, "learning_rate": 3.780380619081876e-05, "loss": 0.2238, "loss_nan_ranks": 0, "loss_rank_avg": 0.10416075587272644, "step": 1925, "valid_targets_mean": 4639.4, "valid_targets_min": 1275 }, { "epoch": 1.6538131962296485, "grad_norm": 0.4736895787140529, "learning_rate": 3.778429774276717e-05, "loss": 0.2207, "loss_nan_ranks": 0, "loss_rank_avg": 0.11791656166315079, "step": 1930, "valid_targets_mean": 5350.2, "valid_targets_min": 2054 }, { "epoch": 1.6580976863753212, "grad_norm": 0.5005815340680339, "learning_rate": 3.7764708111675056e-05, "loss": 0.2082, "loss_nan_ranks": 0, "loss_rank_avg": 0.10442407429218292, "step": 1935, "valid_targets_mean": 7008.9, "valid_targets_min": 1658 }, { "epoch": 1.6623821765209938, "grad_norm": 0.5195739036849526, "learning_rate": 3.774503738696659e-05, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.12746137380599976, "step": 1940, "valid_targets_mean": 4134.6, "valid_targets_min": 2320 }, { "epoch": 1.6666666666666665, "grad_norm": 0.4847015952377785, "learning_rate": 3.772528565843609e-05, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.13392658531665802, "step": 1945, "valid_targets_mean": 6174.6, "valid_targets_min": 1862 }, { "epoch": 1.6709511568123392, "grad_norm": 0.4797232277084971, "learning_rate": 3.770545301624768e-05, "loss": 0.2372, "loss_nan_ranks": 0, "loss_rank_avg": 0.12461329251527786, "step": 1950, "valid_targets_mean": 4713.5, "valid_targets_min": 1071 }, { "epoch": 1.6752356469580119, "grad_norm": 0.4168554029651549, "learning_rate": 3.7685539550934824e-05, "loss": 0.2336, "loss_nan_ranks": 0, "loss_rank_avg": 0.10524686425924301, "step": 1955, "valid_targets_mean": 5712.0, "valid_targets_min": 1974 }, { "epoch": 1.6795201371036845, "grad_norm": 0.4359677674072398, "learning_rate": 3.766554535339995e-05, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.09910120069980621, "step": 1960, "valid_targets_mean": 5346.0, "valid_targets_min": 3455 }, { "epoch": 1.6838046272493572, "grad_norm": 0.5279298884270155, "learning_rate": 3.764547051491399e-05, "loss": 0.2271, "loss_nan_ranks": 0, "loss_rank_avg": 0.12458719313144684, "step": 1965, "valid_targets_mean": 5258.2, "valid_targets_min": 1920 }, { "epoch": 1.6880891173950299, "grad_norm": 0.5009594685257963, "learning_rate": 3.762531512711602e-05, "loss": 0.2241, "loss_nan_ranks": 0, "loss_rank_avg": 0.10473014414310455, "step": 1970, "valid_targets_mean": 5807.4, "valid_targets_min": 980 }, { "epoch": 1.6923736075407025, "grad_norm": 0.4489171770839222, "learning_rate": 3.76050792820128e-05, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.09549927711486816, "step": 1975, "valid_targets_mean": 5834.2, "valid_targets_min": 1428 }, { "epoch": 1.6966580976863752, "grad_norm": 0.4874910810752834, "learning_rate": 3.758476307197837e-05, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.11774912476539612, "step": 1980, "valid_targets_mean": 5110.4, "valid_targets_min": 1711 }, { "epoch": 1.7009425878320479, "grad_norm": 0.45409870644959277, "learning_rate": 3.756436658975363e-05, "loss": 0.2393, "loss_nan_ranks": 0, "loss_rank_avg": 0.13284586369991302, "step": 1985, "valid_targets_mean": 5634.4, "valid_targets_min": 2901 }, { "epoch": 1.7052270779777206, "grad_norm": 0.5009345769885237, "learning_rate": 3.754388992844591e-05, "loss": 0.23, "loss_nan_ranks": 0, "loss_rank_avg": 0.14606676995754242, "step": 1990, "valid_targets_mean": 5623.9, "valid_targets_min": 2457 }, { "epoch": 1.7095115681233932, "grad_norm": 0.465963716185065, "learning_rate": 3.7523333181528536e-05, "loss": 0.235, "loss_nan_ranks": 0, "loss_rank_avg": 0.12039413303136826, "step": 1995, "valid_targets_mean": 4879.8, "valid_targets_min": 2333 }, { "epoch": 1.713796058269066, "grad_norm": 0.49285296134297085, "learning_rate": 3.7502696442840424e-05, "loss": 0.2366, "loss_nan_ranks": 0, "loss_rank_avg": 0.11541670560836792, "step": 2000, "valid_targets_mean": 5865.6, "valid_targets_min": 2986 }, { "epoch": 1.7180805484147386, "grad_norm": 0.48303222679304736, "learning_rate": 3.7481979806585654e-05, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.10086794197559357, "step": 2005, "valid_targets_mean": 5970.1, "valid_targets_min": 2852 }, { "epoch": 1.7223650385604112, "grad_norm": 0.4583874773594575, "learning_rate": 3.746118336733301e-05, "loss": 0.2194, "loss_nan_ranks": 0, "loss_rank_avg": 0.14557163417339325, "step": 2010, "valid_targets_mean": 7418.1, "valid_targets_min": 2612 }, { "epoch": 1.726649528706084, "grad_norm": 0.5839102741671757, "learning_rate": 3.744030722001556e-05, "loss": 0.2243, "loss_nan_ranks": 0, "loss_rank_avg": 0.12097503244876862, "step": 2015, "valid_targets_mean": 5231.9, "valid_targets_min": 1248 }, { "epoch": 1.7309340188517566, "grad_norm": 0.4679557970967644, "learning_rate": 3.741935145993026e-05, "loss": 0.2266, "loss_nan_ranks": 0, "loss_rank_avg": 0.12258268147706985, "step": 2020, "valid_targets_mean": 5119.0, "valid_targets_min": 2507 }, { "epoch": 1.7352185089974292, "grad_norm": 0.4916485486601471, "learning_rate": 3.739831618273746e-05, "loss": 0.2335, "loss_nan_ranks": 0, "loss_rank_avg": 0.10012927651405334, "step": 2025, "valid_targets_mean": 4079.2, "valid_targets_min": 1147 }, { "epoch": 1.739502999143102, "grad_norm": 0.5414661267399626, "learning_rate": 3.7377201484460516e-05, "loss": 0.2435, "loss_nan_ranks": 0, "loss_rank_avg": 0.11908154934644699, "step": 2030, "valid_targets_mean": 4558.2, "valid_targets_min": 1874 }, { "epoch": 1.7437874892887746, "grad_norm": 0.48355263559472655, "learning_rate": 3.73560074614853e-05, "loss": 0.2294, "loss_nan_ranks": 0, "loss_rank_avg": 0.1211392879486084, "step": 2035, "valid_targets_mean": 5351.6, "valid_targets_min": 3687 }, { "epoch": 1.7480719794344473, "grad_norm": 0.454722234661219, "learning_rate": 3.733473421055983e-05, "loss": 0.2253, "loss_nan_ranks": 0, "loss_rank_avg": 0.09652171283960342, "step": 2040, "valid_targets_mean": 5261.1, "valid_targets_min": 1546 }, { "epoch": 1.75235646958012, "grad_norm": 0.5511450722174028, "learning_rate": 3.731338182879376e-05, "loss": 0.2421, "loss_nan_ranks": 0, "loss_rank_avg": 0.11845758557319641, "step": 2045, "valid_targets_mean": 3688.6, "valid_targets_min": 1168 }, { "epoch": 1.7566409597257926, "grad_norm": 0.4282004392379052, "learning_rate": 3.729195041365798e-05, "loss": 0.2032, "loss_nan_ranks": 0, "loss_rank_avg": 0.10152602195739746, "step": 2050, "valid_targets_mean": 5710.8, "valid_targets_min": 3035 }, { "epoch": 1.7609254498714653, "grad_norm": 0.44868158141916553, "learning_rate": 3.7270440062984155e-05, "loss": 0.2149, "loss_nan_ranks": 0, "loss_rank_avg": 0.09024541825056076, "step": 2055, "valid_targets_mean": 5247.6, "valid_targets_min": 1394 }, { "epoch": 1.765209940017138, "grad_norm": 0.4723931524742898, "learning_rate": 3.7248850874964284e-05, "loss": 0.2109, "loss_nan_ranks": 0, "loss_rank_avg": 0.10666035115718842, "step": 2060, "valid_targets_mean": 5078.1, "valid_targets_min": 3050 }, { "epoch": 1.7694944301628106, "grad_norm": 0.4823220352807819, "learning_rate": 3.7227182948150235e-05, "loss": 0.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.11269587278366089, "step": 2065, "valid_targets_mean": 5477.6, "valid_targets_min": 3002 }, { "epoch": 1.7737789203084833, "grad_norm": 0.5474865566919354, "learning_rate": 3.7205436381453325e-05, "loss": 0.2248, "loss_nan_ranks": 0, "loss_rank_avg": 0.12877508997917175, "step": 2070, "valid_targets_mean": 4364.1, "valid_targets_min": 1699 }, { "epoch": 1.778063410454156, "grad_norm": 0.4596942382402779, "learning_rate": 3.718361127414384e-05, "loss": 0.2146, "loss_nan_ranks": 0, "loss_rank_avg": 0.10272775590419769, "step": 2075, "valid_targets_mean": 5257.1, "valid_targets_min": 3299 }, { "epoch": 1.7823479005998286, "grad_norm": 0.6641809993375568, "learning_rate": 3.71617077258506e-05, "loss": 0.2259, "loss_nan_ranks": 0, "loss_rank_avg": 0.125893235206604, "step": 2080, "valid_targets_mean": 4647.0, "valid_targets_min": 1603 }, { "epoch": 1.7866323907455013, "grad_norm": 0.5016510769637406, "learning_rate": 3.71397258365605e-05, "loss": 0.2238, "loss_nan_ranks": 0, "loss_rank_avg": 0.11946600675582886, "step": 2085, "valid_targets_mean": 5398.1, "valid_targets_min": 2260 }, { "epoch": 1.790916880891174, "grad_norm": 0.40018325885445133, "learning_rate": 3.711766570661805e-05, "loss": 0.2159, "loss_nan_ranks": 0, "loss_rank_avg": 0.09395642578601837, "step": 2090, "valid_targets_mean": 5911.4, "valid_targets_min": 2664 }, { "epoch": 1.7952013710368466, "grad_norm": 0.48624128496277386, "learning_rate": 3.70955274367249e-05, "loss": 0.2371, "loss_nan_ranks": 0, "loss_rank_avg": 0.1076192706823349, "step": 2095, "valid_targets_mean": 5477.1, "valid_targets_min": 1540 }, { "epoch": 1.7994858611825193, "grad_norm": 0.6049349014182495, "learning_rate": 3.7073311127939434e-05, "loss": 0.2469, "loss_nan_ranks": 0, "loss_rank_avg": 0.15382909774780273, "step": 2100, "valid_targets_mean": 4850.2, "valid_targets_min": 2910 }, { "epoch": 1.803770351328192, "grad_norm": 0.4602861225585512, "learning_rate": 3.705101688167625e-05, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.10993652045726776, "step": 2105, "valid_targets_mean": 5117.2, "valid_targets_min": 3344 }, { "epoch": 1.8080548414738646, "grad_norm": 0.4573276660119421, "learning_rate": 3.702864479970572e-05, "loss": 0.2336, "loss_nan_ranks": 0, "loss_rank_avg": 0.09111273288726807, "step": 2110, "valid_targets_mean": 4376.4, "valid_targets_min": 1914 }, { "epoch": 1.8123393316195373, "grad_norm": 0.45701318648217, "learning_rate": 3.7006194984153536e-05, "loss": 0.2133, "loss_nan_ranks": 0, "loss_rank_avg": 0.09573175013065338, "step": 2115, "valid_targets_mean": 5533.2, "valid_targets_min": 3051 }, { "epoch": 1.81662382176521, "grad_norm": 0.5098679742063379, "learning_rate": 3.6983667537500226e-05, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.13827547430992126, "step": 2120, "valid_targets_mean": 4585.8, "valid_targets_min": 2714 }, { "epoch": 1.8209083119108826, "grad_norm": 0.46205848208851363, "learning_rate": 3.696106256258071e-05, "loss": 0.2403, "loss_nan_ranks": 0, "loss_rank_avg": 0.10701566934585571, "step": 2125, "valid_targets_mean": 4941.9, "valid_targets_min": 1446 }, { "epoch": 1.8251928020565553, "grad_norm": 0.5012775704899749, "learning_rate": 3.6938380162583784e-05, "loss": 0.2085, "loss_nan_ranks": 0, "loss_rank_avg": 0.1033095270395279, "step": 2130, "valid_targets_mean": 5638.0, "valid_targets_min": 1965 }, { "epoch": 1.829477292202228, "grad_norm": 0.4747025798124583, "learning_rate": 3.6915620441051706e-05, "loss": 0.229, "loss_nan_ranks": 0, "loss_rank_avg": 0.1287415474653244, "step": 2135, "valid_targets_mean": 5183.9, "valid_targets_min": 2699 }, { "epoch": 1.8337617823479007, "grad_norm": 0.5375748900531672, "learning_rate": 3.689278350187969e-05, "loss": 0.2286, "loss_nan_ranks": 0, "loss_rank_avg": 0.1322089433670044, "step": 2140, "valid_targets_mean": 5262.1, "valid_targets_min": 2255 }, { "epoch": 1.8380462724935733, "grad_norm": 0.520531827518314, "learning_rate": 3.686986944931544e-05, "loss": 0.2324, "loss_nan_ranks": 0, "loss_rank_avg": 0.12290707975625992, "step": 2145, "valid_targets_mean": 5127.6, "valid_targets_min": 2904 }, { "epoch": 1.842330762639246, "grad_norm": 0.468452706681642, "learning_rate": 3.684687838795867e-05, "loss": 0.2211, "loss_nan_ranks": 0, "loss_rank_avg": 0.10318892449140549, "step": 2150, "valid_targets_mean": 5195.9, "valid_targets_min": 2905 }, { "epoch": 1.8466152527849187, "grad_norm": 0.4894073955207035, "learning_rate": 3.682381042276062e-05, "loss": 0.2549, "loss_nan_ranks": 0, "loss_rank_avg": 0.13634109497070312, "step": 2155, "valid_targets_mean": 4727.5, "valid_targets_min": 1388 }, { "epoch": 1.8508997429305913, "grad_norm": 0.5063303905317564, "learning_rate": 3.68006656590236e-05, "loss": 0.2355, "loss_nan_ranks": 0, "loss_rank_avg": 0.11118605732917786, "step": 2160, "valid_targets_mean": 5055.9, "valid_targets_min": 3056 }, { "epoch": 1.855184233076264, "grad_norm": 0.413860193373722, "learning_rate": 3.67774442024005e-05, "loss": 0.2221, "loss_nan_ranks": 0, "loss_rank_avg": 0.10318203270435333, "step": 2165, "valid_targets_mean": 6153.2, "valid_targets_min": 2380 }, { "epoch": 1.8594687232219367, "grad_norm": 0.5664320802607056, "learning_rate": 3.6754146158894274e-05, "loss": 0.2222, "loss_nan_ranks": 0, "loss_rank_avg": 0.13304372131824493, "step": 2170, "valid_targets_mean": 4987.5, "valid_targets_min": 1806 }, { "epoch": 1.8637532133676094, "grad_norm": 0.49595955527913155, "learning_rate": 3.673077163485753e-05, "loss": 0.22, "loss_nan_ranks": 0, "loss_rank_avg": 0.12880939245224, "step": 2175, "valid_targets_mean": 5107.0, "valid_targets_min": 2167 }, { "epoch": 1.868037703513282, "grad_norm": 0.46081595732819347, "learning_rate": 3.670732073699196e-05, "loss": 0.2227, "loss_nan_ranks": 0, "loss_rank_avg": 0.11992570012807846, "step": 2180, "valid_targets_mean": 5616.6, "valid_targets_min": 2212 }, { "epoch": 1.8723221936589547, "grad_norm": 0.452165893709852, "learning_rate": 3.6683793572347905e-05, "loss": 0.2058, "loss_nan_ranks": 0, "loss_rank_avg": 0.08756551146507263, "step": 2185, "valid_targets_mean": 4324.8, "valid_targets_min": 2018 }, { "epoch": 1.8766066838046274, "grad_norm": 0.598100612012415, "learning_rate": 3.666019024832387e-05, "loss": 0.232, "loss_nan_ranks": 0, "loss_rank_avg": 0.12989911437034607, "step": 2190, "valid_targets_mean": 4225.9, "valid_targets_min": 2347 }, { "epoch": 1.8808911739503, "grad_norm": 0.5526053715780299, "learning_rate": 3.6636510872665995e-05, "loss": 0.22, "loss_nan_ranks": 0, "loss_rank_avg": 0.12627767026424408, "step": 2195, "valid_targets_mean": 4753.0, "valid_targets_min": 2165 }, { "epoch": 1.8851756640959727, "grad_norm": 0.4847762020789575, "learning_rate": 3.66127555534676e-05, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.132424995303154, "step": 2200, "valid_targets_mean": 5307.9, "valid_targets_min": 1651 }, { "epoch": 1.8894601542416454, "grad_norm": 0.5046411208346194, "learning_rate": 3.6588924399168664e-05, "loss": 0.2219, "loss_nan_ranks": 0, "loss_rank_avg": 0.09791286289691925, "step": 2205, "valid_targets_mean": 4715.8, "valid_targets_min": 439 }, { "epoch": 1.893744644387318, "grad_norm": 0.5338025713849385, "learning_rate": 3.656501751855537e-05, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.1205880269408226, "step": 2210, "valid_targets_mean": 5110.4, "valid_targets_min": 2460 }, { "epoch": 1.8980291345329907, "grad_norm": 0.511539137370197, "learning_rate": 3.6541035020759555e-05, "loss": 0.2334, "loss_nan_ranks": 0, "loss_rank_avg": 0.10615777969360352, "step": 2215, "valid_targets_mean": 4384.9, "valid_targets_min": 1217 }, { "epoch": 1.9023136246786634, "grad_norm": 0.5360317696651323, "learning_rate": 3.651697701525825e-05, "loss": 0.2329, "loss_nan_ranks": 0, "loss_rank_avg": 0.09040658921003342, "step": 2220, "valid_targets_mean": 4914.2, "valid_targets_min": 1091 }, { "epoch": 1.906598114824336, "grad_norm": 0.5170648753277196, "learning_rate": 3.6492843611873164e-05, "loss": 0.2196, "loss_nan_ranks": 0, "loss_rank_avg": 0.1084122285246849, "step": 2225, "valid_targets_mean": 4081.0, "valid_targets_min": 512 }, { "epoch": 1.9108826049700087, "grad_norm": 0.4745365155640128, "learning_rate": 3.64686349207702e-05, "loss": 0.228, "loss_nan_ranks": 0, "loss_rank_avg": 0.10846118628978729, "step": 2230, "valid_targets_mean": 4990.8, "valid_targets_min": 3201 }, { "epoch": 1.9151670951156814, "grad_norm": 0.4758545058789654, "learning_rate": 3.6444351052458924e-05, "loss": 0.2399, "loss_nan_ranks": 0, "loss_rank_avg": 0.10121801495552063, "step": 2235, "valid_targets_mean": 4110.4, "valid_targets_min": 1497 }, { "epoch": 1.919451585261354, "grad_norm": 0.4514826598697308, "learning_rate": 3.641999211779208e-05, "loss": 0.2068, "loss_nan_ranks": 0, "loss_rank_avg": 0.10626526921987534, "step": 2240, "valid_targets_mean": 6423.8, "valid_targets_min": 2306 }, { "epoch": 1.9237360754070265, "grad_norm": 0.49670895196681053, "learning_rate": 3.6395558227965094e-05, "loss": 0.2252, "loss_nan_ranks": 0, "loss_rank_avg": 0.11679775267839432, "step": 2245, "valid_targets_mean": 4890.6, "valid_targets_min": 1631 }, { "epoch": 1.9280205655526992, "grad_norm": 0.4838984020881071, "learning_rate": 3.637104949451554e-05, "loss": 0.2198, "loss_nan_ranks": 0, "loss_rank_avg": 0.09723664820194244, "step": 2250, "valid_targets_mean": 4169.4, "valid_targets_min": 1639 }, { "epoch": 1.9323050556983719, "grad_norm": 0.44509857111678414, "learning_rate": 3.6346466029322636e-05, "loss": 0.2262, "loss_nan_ranks": 0, "loss_rank_avg": 0.11195631325244904, "step": 2255, "valid_targets_mean": 4828.4, "valid_targets_min": 2573 }, { "epoch": 1.9365895458440445, "grad_norm": 0.4858864351791111, "learning_rate": 3.632180794460676e-05, "loss": 0.23, "loss_nan_ranks": 0, "loss_rank_avg": 0.11188924312591553, "step": 2260, "valid_targets_mean": 4487.5, "valid_targets_min": 1524 }, { "epoch": 1.9408740359897172, "grad_norm": 0.413600120478062, "learning_rate": 3.629707535292891e-05, "loss": 0.2048, "loss_nan_ranks": 0, "loss_rank_avg": 0.10609625279903412, "step": 2265, "valid_targets_mean": 6128.2, "valid_targets_min": 4528 }, { "epoch": 1.9451585261353899, "grad_norm": 0.4494778547641328, "learning_rate": 3.627226836719019e-05, "loss": 0.2179, "loss_nan_ranks": 0, "loss_rank_avg": 0.11913739144802094, "step": 2270, "valid_targets_mean": 4749.6, "valid_targets_min": 1433 }, { "epoch": 1.9494430162810625, "grad_norm": 0.5304785163709616, "learning_rate": 3.624738710063132e-05, "loss": 0.2205, "loss_nan_ranks": 0, "loss_rank_avg": 0.13347581028938293, "step": 2275, "valid_targets_mean": 4066.4, "valid_targets_min": 2419 }, { "epoch": 1.9537275064267352, "grad_norm": 0.45353166493326297, "learning_rate": 3.622243166683209e-05, "loss": 0.2252, "loss_nan_ranks": 0, "loss_rank_avg": 0.0952456071972847, "step": 2280, "valid_targets_mean": 4990.4, "valid_targets_min": 4051 }, { "epoch": 1.9580119965724079, "grad_norm": 0.4539289969108042, "learning_rate": 3.619740217971086e-05, "loss": 0.2172, "loss_nan_ranks": 0, "loss_rank_avg": 0.09723306447267532, "step": 2285, "valid_targets_mean": 5118.4, "valid_targets_min": 1774 }, { "epoch": 1.9622964867180805, "grad_norm": 0.46233942047553034, "learning_rate": 3.617229875352403e-05, "loss": 0.23, "loss_nan_ranks": 0, "loss_rank_avg": 0.09375040233135223, "step": 2290, "valid_targets_mean": 4558.5, "valid_targets_min": 1897 }, { "epoch": 1.9665809768637532, "grad_norm": 0.4218514068432325, "learning_rate": 3.614712150286552e-05, "loss": 0.2171, "loss_nan_ranks": 0, "loss_rank_avg": 0.11099795252084732, "step": 2295, "valid_targets_mean": 5717.6, "valid_targets_min": 2203 }, { "epoch": 1.9708654670094259, "grad_norm": 0.45789692025390966, "learning_rate": 3.6121870542666256e-05, "loss": 0.2293, "loss_nan_ranks": 0, "loss_rank_avg": 0.13194692134857178, "step": 2300, "valid_targets_mean": 6161.2, "valid_targets_min": 2376 }, { "epoch": 1.9751499571550986, "grad_norm": 0.47632168461685737, "learning_rate": 3.609654598819364e-05, "loss": 0.233, "loss_nan_ranks": 0, "loss_rank_avg": 0.1115507110953331, "step": 2305, "valid_targets_mean": 5124.5, "valid_targets_min": 2677 }, { "epoch": 1.9794344473007712, "grad_norm": 0.45583728590859696, "learning_rate": 3.6071147955051016e-05, "loss": 0.2177, "loss_nan_ranks": 0, "loss_rank_avg": 0.10582319647073746, "step": 2310, "valid_targets_mean": 5469.5, "valid_targets_min": 2316 }, { "epoch": 1.983718937446444, "grad_norm": 0.48697460061754, "learning_rate": 3.6045676559177156e-05, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.11527565121650696, "step": 2315, "valid_targets_mean": 4943.4, "valid_targets_min": 1153 }, { "epoch": 1.9880034275921166, "grad_norm": 0.4731822430894365, "learning_rate": 3.60201319168457e-05, "loss": 0.2281, "loss_nan_ranks": 0, "loss_rank_avg": 0.10451348125934601, "step": 2320, "valid_targets_mean": 4202.4, "valid_targets_min": 1502 }, { "epoch": 1.9922879177377892, "grad_norm": 0.4556151371510566, "learning_rate": 3.599451414466469e-05, "loss": 0.2269, "loss_nan_ranks": 0, "loss_rank_avg": 0.10072088986635208, "step": 2325, "valid_targets_mean": 5196.8, "valid_targets_min": 1988 }, { "epoch": 1.996572407883462, "grad_norm": 0.4193240280740944, "learning_rate": 3.5968823359575965e-05, "loss": 0.2029, "loss_nan_ranks": 0, "loss_rank_avg": 0.10769035667181015, "step": 2330, "valid_targets_mean": 6380.5, "valid_targets_min": 2703 }, { "epoch": 2.0008568980291344, "grad_norm": 0.4798142878195261, "learning_rate": 3.594305967885466e-05, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.13428811728954315, "step": 2335, "valid_targets_mean": 6203.6, "valid_targets_min": 2349 }, { "epoch": 2.005141388174807, "grad_norm": 0.4839034707974094, "learning_rate": 3.591722322010869e-05, "loss": 0.1998, "loss_nan_ranks": 0, "loss_rank_avg": 0.0971929281949997, "step": 2340, "valid_targets_mean": 5707.4, "valid_targets_min": 2730 }, { "epoch": 2.0094258783204797, "grad_norm": 0.48112037071217567, "learning_rate": 3.589131410127817e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.10458128899335861, "step": 2345, "valid_targets_mean": 5635.6, "valid_targets_min": 2717 }, { "epoch": 2.0137103684661524, "grad_norm": 0.4420284708052282, "learning_rate": 3.5865332440634906e-05, "loss": 0.206, "loss_nan_ranks": 0, "loss_rank_avg": 0.07776182889938354, "step": 2350, "valid_targets_mean": 5238.4, "valid_targets_min": 2509 }, { "epoch": 2.017994858611825, "grad_norm": 0.4930492802262695, "learning_rate": 3.583927835678186e-05, "loss": 0.2094, "loss_nan_ranks": 0, "loss_rank_avg": 0.07519136369228363, "step": 2355, "valid_targets_mean": 3908.9, "valid_targets_min": 1777 }, { "epoch": 2.0222793487574977, "grad_norm": 0.48606257170744127, "learning_rate": 3.581315196865257e-05, "loss": 0.2024, "loss_nan_ranks": 0, "loss_rank_avg": 0.10364539921283722, "step": 2360, "valid_targets_mean": 5116.8, "valid_targets_min": 3772 }, { "epoch": 2.0265638389031704, "grad_norm": 0.5146962374677706, "learning_rate": 3.5786953395510664e-05, "loss": 0.206, "loss_nan_ranks": 0, "loss_rank_avg": 0.10978688299655914, "step": 2365, "valid_targets_mean": 4928.8, "valid_targets_min": 1727 }, { "epoch": 2.030848329048843, "grad_norm": 0.4378443621517526, "learning_rate": 3.576068275694927e-05, "loss": 0.2033, "loss_nan_ranks": 0, "loss_rank_avg": 0.08051362633705139, "step": 2370, "valid_targets_mean": 6912.5, "valid_targets_min": 3311 }, { "epoch": 2.0351328191945157, "grad_norm": 0.5386581392854123, "learning_rate": 3.573434017289048e-05, "loss": 0.2066, "loss_nan_ranks": 0, "loss_rank_avg": 0.1055622398853302, "step": 2375, "valid_targets_mean": 4388.2, "valid_targets_min": 1279 }, { "epoch": 2.0394173093401884, "grad_norm": 0.5240571401301507, "learning_rate": 3.570792576358482e-05, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.09677842259407043, "step": 2380, "valid_targets_mean": 4769.2, "valid_targets_min": 1944 }, { "epoch": 2.043701799485861, "grad_norm": 0.478161437533347, "learning_rate": 3.568143964961069e-05, "loss": 0.1902, "loss_nan_ranks": 0, "loss_rank_avg": 0.08123594522476196, "step": 2385, "valid_targets_mean": 6699.8, "valid_targets_min": 4104 }, { "epoch": 2.0479862896315337, "grad_norm": 0.4583846295744667, "learning_rate": 3.56548819518738e-05, "loss": 0.2048, "loss_nan_ranks": 0, "loss_rank_avg": 0.11680682003498077, "step": 2390, "valid_targets_mean": 5929.0, "valid_targets_min": 1390 }, { "epoch": 2.0522707797772064, "grad_norm": 0.4488261353496457, "learning_rate": 3.562825279160663e-05, "loss": 0.1917, "loss_nan_ranks": 0, "loss_rank_avg": 0.10441552102565765, "step": 2395, "valid_targets_mean": 5957.9, "valid_targets_min": 1250 }, { "epoch": 2.056555269922879, "grad_norm": 0.5419790810037427, "learning_rate": 3.560155229036789e-05, "loss": 0.2091, "loss_nan_ranks": 0, "loss_rank_avg": 0.1211346834897995, "step": 2400, "valid_targets_mean": 4245.8, "valid_targets_min": 3184 }, { "epoch": 2.0608397600685517, "grad_norm": 0.48698288645147914, "learning_rate": 3.557478057004196e-05, "loss": 0.2342, "loss_nan_ranks": 0, "loss_rank_avg": 0.12603498995304108, "step": 2405, "valid_targets_mean": 4773.8, "valid_targets_min": 1426 }, { "epoch": 2.0651242502142244, "grad_norm": 0.45972267451212057, "learning_rate": 3.5547937752838296e-05, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.12184608727693558, "step": 2410, "valid_targets_mean": 5739.6, "valid_targets_min": 1705 }, { "epoch": 2.069408740359897, "grad_norm": 0.5052359876559305, "learning_rate": 3.552102396129093e-05, "loss": 0.2117, "loss_nan_ranks": 0, "loss_rank_avg": 0.12169013917446136, "step": 2415, "valid_targets_mean": 4769.2, "valid_targets_min": 1612 }, { "epoch": 2.0736932305055698, "grad_norm": 0.46583683006954374, "learning_rate": 3.549403931825787e-05, "loss": 0.2044, "loss_nan_ranks": 0, "loss_rank_avg": 0.09529776126146317, "step": 2420, "valid_targets_mean": 6170.0, "valid_targets_min": 2466 }, { "epoch": 2.0779777206512424, "grad_norm": 0.5103020607049007, "learning_rate": 3.546698394692054e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.10125349462032318, "step": 2425, "valid_targets_mean": 5250.1, "valid_targets_min": 3092 }, { "epoch": 2.082262210796915, "grad_norm": 0.6724602759927233, "learning_rate": 3.543985797078326e-05, "loss": 0.2076, "loss_nan_ranks": 0, "loss_rank_avg": 0.09732373058795929, "step": 2430, "valid_targets_mean": 4869.6, "valid_targets_min": 1902 }, { "epoch": 2.0865467009425878, "grad_norm": 0.4710418734332259, "learning_rate": 3.5412661513672635e-05, "loss": 0.2085, "loss_nan_ranks": 0, "loss_rank_avg": 0.07645601034164429, "step": 2435, "valid_targets_mean": 5544.9, "valid_targets_min": 2866 }, { "epoch": 2.0908311910882604, "grad_norm": 0.5696628205752358, "learning_rate": 3.538539469973699e-05, "loss": 0.2117, "loss_nan_ranks": 0, "loss_rank_avg": 0.12250518798828125, "step": 2440, "valid_targets_mean": 3794.1, "valid_targets_min": 1345 }, { "epoch": 2.095115681233933, "grad_norm": 0.4713107612195895, "learning_rate": 3.535805765344587e-05, "loss": 0.202, "loss_nan_ranks": 0, "loss_rank_avg": 0.09606672078371048, "step": 2445, "valid_targets_mean": 4874.5, "valid_targets_min": 1698 }, { "epoch": 2.0994001713796058, "grad_norm": 0.5120423087865809, "learning_rate": 3.533065049958936e-05, "loss": 0.2165, "loss_nan_ranks": 0, "loss_rank_avg": 0.10608918964862823, "step": 2450, "valid_targets_mean": 4431.9, "valid_targets_min": 1820 }, { "epoch": 2.1036846615252784, "grad_norm": 0.44536739766857203, "learning_rate": 3.530317336327761e-05, "loss": 0.2309, "loss_nan_ranks": 0, "loss_rank_avg": 0.1180947870016098, "step": 2455, "valid_targets_mean": 6261.0, "valid_targets_min": 2680 }, { "epoch": 2.107969151670951, "grad_norm": 0.48777347702473567, "learning_rate": 3.5275626369940226e-05, "loss": 0.199, "loss_nan_ranks": 0, "loss_rank_avg": 0.09988237917423248, "step": 2460, "valid_targets_mean": 5259.1, "valid_targets_min": 2737 }, { "epoch": 2.112253641816624, "grad_norm": 0.53585728228521, "learning_rate": 3.5248009645325715e-05, "loss": 0.2111, "loss_nan_ranks": 0, "loss_rank_avg": 0.1207893043756485, "step": 2465, "valid_targets_mean": 4266.6, "valid_targets_min": 1976 }, { "epoch": 2.1165381319622965, "grad_norm": 0.5083574721252143, "learning_rate": 3.522032331550088e-05, "loss": 0.2016, "loss_nan_ranks": 0, "loss_rank_avg": 0.10587166994810104, "step": 2470, "valid_targets_mean": 4353.4, "valid_targets_min": 1318 }, { "epoch": 2.120822622107969, "grad_norm": 0.8426373316811898, "learning_rate": 3.519256750685027e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.0982590913772583, "step": 2475, "valid_targets_mean": 5417.4, "valid_targets_min": 1229 }, { "epoch": 2.125107112253642, "grad_norm": 0.4797781453173742, "learning_rate": 3.5164742346075586e-05, "loss": 0.2058, "loss_nan_ranks": 0, "loss_rank_avg": 0.1159694492816925, "step": 2480, "valid_targets_mean": 5555.8, "valid_targets_min": 2557 }, { "epoch": 2.1293916023993145, "grad_norm": 0.5759990368448268, "learning_rate": 3.5136847960195133e-05, "loss": 0.21, "loss_nan_ranks": 0, "loss_rank_avg": 0.1255708783864975, "step": 2485, "valid_targets_mean": 5154.9, "valid_targets_min": 3061 }, { "epoch": 2.133676092544987, "grad_norm": 0.5142715372317823, "learning_rate": 3.5108884476543204e-05, "loss": 0.2031, "loss_nan_ranks": 0, "loss_rank_avg": 0.11523468792438507, "step": 2490, "valid_targets_mean": 5533.1, "valid_targets_min": 3318 }, { "epoch": 2.13796058269066, "grad_norm": 0.5401336125170897, "learning_rate": 3.508085202276952e-05, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.1292748749256134, "step": 2495, "valid_targets_mean": 4863.1, "valid_targets_min": 1367 }, { "epoch": 2.1422450728363325, "grad_norm": 0.5151114715150518, "learning_rate": 3.505275072683864e-05, "loss": 0.2023, "loss_nan_ranks": 0, "loss_rank_avg": 0.08936254680156708, "step": 2500, "valid_targets_mean": 5512.5, "valid_targets_min": 2314 }, { "epoch": 2.146529562982005, "grad_norm": 0.44524209721883445, "learning_rate": 3.502458071702938e-05, "loss": 0.2101, "loss_nan_ranks": 0, "loss_rank_avg": 0.08574520796537399, "step": 2505, "valid_targets_mean": 5010.2, "valid_targets_min": 3171 }, { "epoch": 2.150814053127678, "grad_norm": 0.4745350777906336, "learning_rate": 3.4996342121934225e-05, "loss": 0.2181, "loss_nan_ranks": 0, "loss_rank_avg": 0.12945052981376648, "step": 2510, "valid_targets_mean": 6108.2, "valid_targets_min": 2530 }, { "epoch": 2.1550985432733505, "grad_norm": 0.5461131598088633, "learning_rate": 3.4968035070458745e-05, "loss": 0.217, "loss_nan_ranks": 0, "loss_rank_avg": 0.13106781244277954, "step": 2515, "valid_targets_mean": 3841.6, "valid_targets_min": 1190 }, { "epoch": 2.159383033419023, "grad_norm": 0.4937762829697131, "learning_rate": 3.4939659691821005e-05, "loss": 0.2038, "loss_nan_ranks": 0, "loss_rank_avg": 0.11381436884403229, "step": 2520, "valid_targets_mean": 6040.9, "valid_targets_min": 3076 }, { "epoch": 2.163667523564696, "grad_norm": 0.47189409527732573, "learning_rate": 3.491121611555096e-05, "loss": 0.2089, "loss_nan_ranks": 0, "loss_rank_avg": 0.08889122307300568, "step": 2525, "valid_targets_mean": 5620.0, "valid_targets_min": 3232 }, { "epoch": 2.1679520137103685, "grad_norm": 0.6019995157437676, "learning_rate": 3.488270447148991e-05, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.13497303426265717, "step": 2530, "valid_targets_mean": 3912.2, "valid_targets_min": 2096 }, { "epoch": 2.172236503856041, "grad_norm": 0.48550078769805255, "learning_rate": 3.485412488978984e-05, "loss": 0.2175, "loss_nan_ranks": 0, "loss_rank_avg": 0.1056138426065445, "step": 2535, "valid_targets_mean": 4961.4, "valid_targets_min": 1818 }, { "epoch": 2.176520994001714, "grad_norm": 0.4629235375663915, "learning_rate": 3.4825477500912894e-05, "loss": 0.2, "loss_nan_ranks": 0, "loss_rank_avg": 0.0837879553437233, "step": 2540, "valid_targets_mean": 4675.6, "valid_targets_min": 980 }, { "epoch": 2.1808054841473865, "grad_norm": 0.4928325443486428, "learning_rate": 3.479676243563072e-05, "loss": 0.2185, "loss_nan_ranks": 0, "loss_rank_avg": 0.11683500558137894, "step": 2545, "valid_targets_mean": 5289.5, "valid_targets_min": 3087 }, { "epoch": 2.185089974293059, "grad_norm": 0.4893658082842753, "learning_rate": 3.476797982502391e-05, "loss": 0.2096, "loss_nan_ranks": 0, "loss_rank_avg": 0.11225201934576035, "step": 2550, "valid_targets_mean": 4724.6, "valid_targets_min": 3685 }, { "epoch": 2.189374464438732, "grad_norm": 0.5695749570671081, "learning_rate": 3.4739129800481406e-05, "loss": 0.1905, "loss_nan_ranks": 0, "loss_rank_avg": 0.0752904862165451, "step": 2555, "valid_targets_mean": 4190.8, "valid_targets_min": 1558 }, { "epoch": 2.1936589545844045, "grad_norm": 0.5777670022037187, "learning_rate": 3.4710212493699867e-05, "loss": 0.2156, "loss_nan_ranks": 0, "loss_rank_avg": 0.1446160078048706, "step": 2560, "valid_targets_mean": 5293.1, "valid_targets_min": 2412 }, { "epoch": 2.197943444730077, "grad_norm": 0.4326574462697901, "learning_rate": 3.4681228036683085e-05, "loss": 0.209, "loss_nan_ranks": 0, "loss_rank_avg": 0.07848373800516129, "step": 2565, "valid_targets_mean": 5972.1, "valid_targets_min": 1630 }, { "epoch": 2.20222793487575, "grad_norm": 0.4840416081525319, "learning_rate": 3.465217656174141e-05, "loss": 0.203, "loss_nan_ranks": 0, "loss_rank_avg": 0.10920464247465134, "step": 2570, "valid_targets_mean": 4751.2, "valid_targets_min": 1185 }, { "epoch": 2.2065124250214225, "grad_norm": 0.47442024176086667, "learning_rate": 3.462305820149109e-05, "loss": 0.2023, "loss_nan_ranks": 0, "loss_rank_avg": 0.08478060364723206, "step": 2575, "valid_targets_mean": 4709.0, "valid_targets_min": 1991 }, { "epoch": 2.210796915167095, "grad_norm": 0.5073332229567192, "learning_rate": 3.4593873088853716e-05, "loss": 0.2133, "loss_nan_ranks": 0, "loss_rank_avg": 0.11226142197847366, "step": 2580, "valid_targets_mean": 4234.8, "valid_targets_min": 1878 }, { "epoch": 2.215081405312768, "grad_norm": 0.4721289019762803, "learning_rate": 3.4564621357055573e-05, "loss": 0.2081, "loss_nan_ranks": 0, "loss_rank_avg": 0.09325413405895233, "step": 2585, "valid_targets_mean": 5800.1, "valid_targets_min": 3763 }, { "epoch": 2.2193658954584405, "grad_norm": 0.48760680488450414, "learning_rate": 3.453530313962709e-05, "loss": 0.2135, "loss_nan_ranks": 0, "loss_rank_avg": 0.09359925240278244, "step": 2590, "valid_targets_mean": 4446.0, "valid_targets_min": 1774 }, { "epoch": 2.223650385604113, "grad_norm": 0.532150303219305, "learning_rate": 3.450591857040215e-05, "loss": 0.2104, "loss_nan_ranks": 0, "loss_rank_avg": 0.10448680818080902, "step": 2595, "valid_targets_mean": 4132.4, "valid_targets_min": 1109 }, { "epoch": 2.227934875749786, "grad_norm": 0.4818587245261894, "learning_rate": 3.4476467783517576e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.08007673174142838, "step": 2600, "valid_targets_mean": 4857.9, "valid_targets_min": 1727 }, { "epoch": 2.2322193658954586, "grad_norm": 0.5052456440668673, "learning_rate": 3.4446950913412406e-05, "loss": 0.2172, "loss_nan_ranks": 0, "loss_rank_avg": 0.1390840858221054, "step": 2605, "valid_targets_mean": 4809.4, "valid_targets_min": 1705 }, { "epoch": 2.236503856041131, "grad_norm": 0.5909119312145202, "learning_rate": 3.441736809482739e-05, "loss": 0.2058, "loss_nan_ranks": 0, "loss_rank_avg": 0.12171690165996552, "step": 2610, "valid_targets_mean": 4481.1, "valid_targets_min": 2084 }, { "epoch": 2.240788346186804, "grad_norm": 0.5198439433298654, "learning_rate": 3.4387719462804296e-05, "loss": 0.207, "loss_nan_ranks": 0, "loss_rank_avg": 0.10234121233224869, "step": 2615, "valid_targets_mean": 4727.2, "valid_targets_min": 2308 }, { "epoch": 2.2450728363324766, "grad_norm": 0.524554938779893, "learning_rate": 3.435800515268533e-05, "loss": 0.2156, "loss_nan_ranks": 0, "loss_rank_avg": 0.14251066744327545, "step": 2620, "valid_targets_mean": 5830.2, "valid_targets_min": 3293 }, { "epoch": 2.2493573264781492, "grad_norm": 0.4516713254788256, "learning_rate": 3.432822530011252e-05, "loss": 0.212, "loss_nan_ranks": 0, "loss_rank_avg": 0.11865200102329254, "step": 2625, "valid_targets_mean": 5070.9, "valid_targets_min": 728 }, { "epoch": 2.253641816623822, "grad_norm": 0.48771244356564863, "learning_rate": 3.429838004102707e-05, "loss": 0.2115, "loss_nan_ranks": 0, "loss_rank_avg": 0.1007542833685875, "step": 2630, "valid_targets_mean": 4801.2, "valid_targets_min": 2899 }, { "epoch": 2.2579263067694946, "grad_norm": 0.4941928389134593, "learning_rate": 3.426846951166876e-05, "loss": 0.2178, "loss_nan_ranks": 0, "loss_rank_avg": 0.11054898798465729, "step": 2635, "valid_targets_mean": 4868.9, "valid_targets_min": 1349 }, { "epoch": 2.2622107969151672, "grad_norm": 0.504860332302527, "learning_rate": 3.423849384857532e-05, "loss": 0.2112, "loss_nan_ranks": 0, "loss_rank_avg": 0.11777180433273315, "step": 2640, "valid_targets_mean": 5324.9, "valid_targets_min": 1285 }, { "epoch": 2.26649528706084, "grad_norm": 0.459939251999804, "learning_rate": 3.420845318858184e-05, "loss": 0.2004, "loss_nan_ranks": 0, "loss_rank_avg": 0.0937754213809967, "step": 2645, "valid_targets_mean": 5160.6, "valid_targets_min": 1706 }, { "epoch": 2.2707797772065126, "grad_norm": 0.5132192935657194, "learning_rate": 3.417834766882005e-05, "loss": 0.2016, "loss_nan_ranks": 0, "loss_rank_avg": 0.09987785667181015, "step": 2650, "valid_targets_mean": 4889.0, "valid_targets_min": 1651 }, { "epoch": 2.2750642673521853, "grad_norm": 0.4960047556364684, "learning_rate": 3.41481774267178e-05, "loss": 0.1886, "loss_nan_ranks": 0, "loss_rank_avg": 0.09927482903003693, "step": 2655, "valid_targets_mean": 5076.6, "valid_targets_min": 1539 }, { "epoch": 2.279348757497858, "grad_norm": 0.4696575743098189, "learning_rate": 3.411794259999839e-05, "loss": 0.2124, "loss_nan_ranks": 0, "loss_rank_avg": 0.07672121375799179, "step": 2660, "valid_targets_mean": 4167.1, "valid_targets_min": 1731 }, { "epoch": 2.2836332476435306, "grad_norm": 0.44652313999302545, "learning_rate": 3.408764332667992e-05, "loss": 0.1976, "loss_nan_ranks": 0, "loss_rank_avg": 0.09379899501800537, "step": 2665, "valid_targets_mean": 5656.6, "valid_targets_min": 2313 }, { "epoch": 2.2879177377892033, "grad_norm": 0.45677683642611405, "learning_rate": 3.4057279745074696e-05, "loss": 0.1935, "loss_nan_ranks": 0, "loss_rank_avg": 0.09468834847211838, "step": 2670, "valid_targets_mean": 5627.0, "valid_targets_min": 2577 }, { "epoch": 2.292202227934876, "grad_norm": 0.4628339227087412, "learning_rate": 3.402685199378857e-05, "loss": 0.1966, "loss_nan_ranks": 0, "loss_rank_avg": 0.08526807278394699, "step": 2675, "valid_targets_mean": 5128.9, "valid_targets_min": 1877 }, { "epoch": 2.2964867180805486, "grad_norm": 0.48877181789580515, "learning_rate": 3.399636021172034e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.092775359749794, "step": 2680, "valid_targets_mean": 4849.2, "valid_targets_min": 2735 }, { "epoch": 2.3007712082262213, "grad_norm": 0.4854806416818893, "learning_rate": 3.396580453806107e-05, "loss": 0.1964, "loss_nan_ranks": 0, "loss_rank_avg": 0.10871044546365738, "step": 2685, "valid_targets_mean": 6293.9, "valid_targets_min": 3431 }, { "epoch": 2.305055698371894, "grad_norm": 0.5323163601667085, "learning_rate": 3.393518511229351e-05, "loss": 0.226, "loss_nan_ranks": 0, "loss_rank_avg": 0.13361677527427673, "step": 2690, "valid_targets_mean": 4992.9, "valid_targets_min": 1685 }, { "epoch": 2.3093401885175666, "grad_norm": 0.46863816721964147, "learning_rate": 3.3904502074191405e-05, "loss": 0.1952, "loss_nan_ranks": 0, "loss_rank_avg": 0.0967712551355362, "step": 2695, "valid_targets_mean": 4828.0, "valid_targets_min": 1880 }, { "epoch": 2.3136246786632393, "grad_norm": 0.4937021877713454, "learning_rate": 3.38737555638189e-05, "loss": 0.212, "loss_nan_ranks": 0, "loss_rank_avg": 0.11895988881587982, "step": 2700, "valid_targets_mean": 4830.0, "valid_targets_min": 1780 }, { "epoch": 2.317909168808912, "grad_norm": 0.5425049113594594, "learning_rate": 3.384294572152986e-05, "loss": 0.2114, "loss_nan_ranks": 0, "loss_rank_avg": 0.11120740324258804, "step": 2705, "valid_targets_mean": 3873.9, "valid_targets_min": 2068 }, { "epoch": 2.3221936589545846, "grad_norm": 0.46221874375889965, "learning_rate": 3.3812072687967286e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.10035630315542221, "step": 2710, "valid_targets_mean": 4683.9, "valid_targets_min": 1965 }, { "epoch": 2.3264781491002573, "grad_norm": 0.4358452001193529, "learning_rate": 3.378113660406261e-05, "loss": 0.2026, "loss_nan_ranks": 0, "loss_rank_avg": 0.09401911497116089, "step": 2715, "valid_targets_mean": 6308.2, "valid_targets_min": 4481 }, { "epoch": 2.33076263924593, "grad_norm": 0.4971478285651246, "learning_rate": 3.3750137611035096e-05, "loss": 0.2054, "loss_nan_ranks": 0, "loss_rank_avg": 0.10292759537696838, "step": 2720, "valid_targets_mean": 4957.5, "valid_targets_min": 2267 }, { "epoch": 2.3350471293916026, "grad_norm": 0.4829059484138484, "learning_rate": 3.3719075850391174e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.09821857511997223, "step": 2725, "valid_targets_mean": 6403.6, "valid_targets_min": 3302 }, { "epoch": 2.3393316195372753, "grad_norm": 0.42495114876627665, "learning_rate": 3.36879514639238e-05, "loss": 0.2045, "loss_nan_ranks": 0, "loss_rank_avg": 0.08856787532567978, "step": 2730, "valid_targets_mean": 5714.2, "valid_targets_min": 3273 }, { "epoch": 2.343616109682948, "grad_norm": 0.4919645273602842, "learning_rate": 3.365676459371181e-05, "loss": 0.1886, "loss_nan_ranks": 0, "loss_rank_avg": 0.09872014075517654, "step": 2735, "valid_targets_mean": 5452.1, "valid_targets_min": 2308 }, { "epoch": 2.34790059982862, "grad_norm": 0.49482547215601524, "learning_rate": 3.362551538211927e-05, "loss": 0.2034, "loss_nan_ranks": 0, "loss_rank_avg": 0.08632953464984894, "step": 2740, "valid_targets_mean": 5981.2, "valid_targets_min": 1924 }, { "epoch": 2.352185089974293, "grad_norm": 0.44873956381323665, "learning_rate": 3.359420397179483e-05, "loss": 0.1878, "loss_nan_ranks": 0, "loss_rank_avg": 0.09699660539627075, "step": 2745, "valid_targets_mean": 4944.5, "valid_targets_min": 1397 }, { "epoch": 2.3564695801199655, "grad_norm": 0.49552476816804186, "learning_rate": 3.3562830505671065e-05, "loss": 0.2012, "loss_nan_ranks": 0, "loss_rank_avg": 0.10512469708919525, "step": 2750, "valid_targets_mean": 5890.2, "valid_targets_min": 3051 }, { "epoch": 2.360754070265638, "grad_norm": 0.48348438529624993, "learning_rate": 3.353139512696383e-05, "loss": 0.2075, "loss_nan_ranks": 0, "loss_rank_avg": 0.07310528308153152, "step": 2755, "valid_targets_mean": 4501.5, "valid_targets_min": 2621 }, { "epoch": 2.365038560411311, "grad_norm": 0.4828132476454937, "learning_rate": 3.34998979791716e-05, "loss": 0.2099, "loss_nan_ranks": 0, "loss_rank_avg": 0.11672252416610718, "step": 2760, "valid_targets_mean": 5034.0, "valid_targets_min": 1177 }, { "epoch": 2.3693230505569836, "grad_norm": 0.47308712313036416, "learning_rate": 3.3468339206074815e-05, "loss": 0.2072, "loss_nan_ranks": 0, "loss_rank_avg": 0.10690588504076004, "step": 2765, "valid_targets_mean": 5897.6, "valid_targets_min": 2412 }, { "epoch": 2.3736075407026562, "grad_norm": 0.4653042324351704, "learning_rate": 3.343671895173524e-05, "loss": 0.202, "loss_nan_ranks": 0, "loss_rank_avg": 0.08077119290828705, "step": 2770, "valid_targets_mean": 5471.0, "valid_targets_min": 2227 }, { "epoch": 2.377892030848329, "grad_norm": 0.437950561918184, "learning_rate": 3.340503736049527e-05, "loss": 0.1917, "loss_nan_ranks": 0, "loss_rank_avg": 0.08129626512527466, "step": 2775, "valid_targets_mean": 5579.0, "valid_targets_min": 3308 }, { "epoch": 2.3821765209940016, "grad_norm": 0.509302804118846, "learning_rate": 3.3373294576977313e-05, "loss": 0.1977, "loss_nan_ranks": 0, "loss_rank_avg": 0.11761146783828735, "step": 2780, "valid_targets_mean": 4584.9, "valid_targets_min": 1504 }, { "epoch": 2.3864610111396742, "grad_norm": 0.4814389942194716, "learning_rate": 3.3341490746083125e-05, "loss": 0.1974, "loss_nan_ranks": 0, "loss_rank_avg": 0.13504838943481445, "step": 2785, "valid_targets_mean": 5767.0, "valid_targets_min": 2377 }, { "epoch": 2.390745501285347, "grad_norm": 0.45161396380264546, "learning_rate": 3.33096260129931e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.08189062774181366, "step": 2790, "valid_targets_mean": 4240.6, "valid_targets_min": 842 }, { "epoch": 2.3950299914310196, "grad_norm": 0.5218339855169469, "learning_rate": 3.327770052316567e-05, "loss": 0.2207, "loss_nan_ranks": 0, "loss_rank_avg": 0.1058935672044754, "step": 2795, "valid_targets_mean": 5277.1, "valid_targets_min": 2821 }, { "epoch": 2.3993144815766922, "grad_norm": 0.5190837299505044, "learning_rate": 3.3245714422336615e-05, "loss": 0.2192, "loss_nan_ranks": 0, "loss_rank_avg": 0.1227574422955513, "step": 2800, "valid_targets_mean": 5310.6, "valid_targets_min": 2024 }, { "epoch": 2.403598971722365, "grad_norm": 0.4771751306499786, "learning_rate": 3.321366785651837e-05, "loss": 0.2036, "loss_nan_ranks": 0, "loss_rank_avg": 0.09484189748764038, "step": 2805, "valid_targets_mean": 4509.6, "valid_targets_min": 2628 }, { "epoch": 2.4078834618680376, "grad_norm": 0.5173351776105665, "learning_rate": 3.31815609719994e-05, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.11100342869758606, "step": 2810, "valid_targets_mean": 6206.4, "valid_targets_min": 4923 }, { "epoch": 2.4121679520137103, "grad_norm": 0.4357793385013147, "learning_rate": 3.314939391534354e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.10164409875869751, "step": 2815, "valid_targets_mean": 6839.2, "valid_targets_min": 4419 }, { "epoch": 2.416452442159383, "grad_norm": 0.5023728125638247, "learning_rate": 3.311716683338927e-05, "loss": 0.1973, "loss_nan_ranks": 0, "loss_rank_avg": 0.10916950553655624, "step": 2820, "valid_targets_mean": 5020.1, "valid_targets_min": 1666 }, { "epoch": 2.4207369323050556, "grad_norm": 0.44497761259747304, "learning_rate": 3.308487987324908e-05, "loss": 0.2014, "loss_nan_ranks": 0, "loss_rank_avg": 0.08513899147510529, "step": 2825, "valid_targets_mean": 4916.0, "valid_targets_min": 2516 }, { "epoch": 2.4250214224507283, "grad_norm": 0.499349034804837, "learning_rate": 3.305253318230882e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.1289609670639038, "step": 2830, "valid_targets_mean": 5271.5, "valid_targets_min": 3094 }, { "epoch": 2.429305912596401, "grad_norm": 0.5463948445725036, "learning_rate": 3.302012690822698e-05, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.10212835669517517, "step": 2835, "valid_targets_mean": 4947.0, "valid_targets_min": 2836 }, { "epoch": 2.4335904027420736, "grad_norm": 0.4086429133907161, "learning_rate": 3.2987661198934066e-05, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.09139082580804825, "step": 2840, "valid_targets_mean": 7052.8, "valid_targets_min": 5042 }, { "epoch": 2.4378748928877463, "grad_norm": 0.4876443641286558, "learning_rate": 3.295513620263187e-05, "loss": 0.2058, "loss_nan_ranks": 0, "loss_rank_avg": 0.12413141876459122, "step": 2845, "valid_targets_mean": 5646.8, "valid_targets_min": 2418 }, { "epoch": 2.442159383033419, "grad_norm": 0.49316864024616114, "learning_rate": 3.292255206779282e-05, "loss": 0.1863, "loss_nan_ranks": 0, "loss_rank_avg": 0.096271812915802, "step": 2850, "valid_targets_mean": 4577.0, "valid_targets_min": 1955 }, { "epoch": 2.4464438731790916, "grad_norm": 0.4964219050365118, "learning_rate": 3.2889908943159335e-05, "loss": 0.1902, "loss_nan_ranks": 0, "loss_rank_avg": 0.1023876965045929, "step": 2855, "valid_targets_mean": 7298.4, "valid_targets_min": 4788 }, { "epoch": 2.4507283633247643, "grad_norm": 0.4990305688617052, "learning_rate": 3.285720697774309e-05, "loss": 0.2021, "loss_nan_ranks": 0, "loss_rank_avg": 0.11171339452266693, "step": 2860, "valid_targets_mean": 5601.4, "valid_targets_min": 2756 }, { "epoch": 2.455012853470437, "grad_norm": 0.41817374740108504, "learning_rate": 3.282444632082437e-05, "loss": 0.2028, "loss_nan_ranks": 0, "loss_rank_avg": 0.08068175613880157, "step": 2865, "valid_targets_mean": 5683.9, "valid_targets_min": 738 }, { "epoch": 2.4592973436161096, "grad_norm": 0.43554569977825025, "learning_rate": 3.279162712195137e-05, "loss": 0.2053, "loss_nan_ranks": 0, "loss_rank_avg": 0.11963269114494324, "step": 2870, "valid_targets_mean": 7243.9, "valid_targets_min": 4833 }, { "epoch": 2.4635818337617823, "grad_norm": 0.48826855861952745, "learning_rate": 3.275874953093953e-05, "loss": 0.1944, "loss_nan_ranks": 0, "loss_rank_avg": 0.10686782747507095, "step": 2875, "valid_targets_mean": 6170.8, "valid_targets_min": 3494 }, { "epoch": 2.467866323907455, "grad_norm": 0.5068519289504925, "learning_rate": 3.272581369787085e-05, "loss": 0.192, "loss_nan_ranks": 0, "loss_rank_avg": 0.11042851209640503, "step": 2880, "valid_targets_mean": 4609.8, "valid_targets_min": 2343 }, { "epoch": 2.4721508140531276, "grad_norm": 0.46615869185497966, "learning_rate": 3.2692819773093176e-05, "loss": 0.2032, "loss_nan_ranks": 0, "loss_rank_avg": 0.09782660007476807, "step": 2885, "valid_targets_mean": 5556.2, "valid_targets_min": 3460 }, { "epoch": 2.4764353041988003, "grad_norm": 0.4967868181924323, "learning_rate": 3.265976790721955e-05, "loss": 0.1911, "loss_nan_ranks": 0, "loss_rank_avg": 0.09430047124624252, "step": 2890, "valid_targets_mean": 3529.8, "valid_targets_min": 1223 }, { "epoch": 2.480719794344473, "grad_norm": 0.5205596403786918, "learning_rate": 3.2626658251127504e-05, "loss": 0.2102, "loss_nan_ranks": 0, "loss_rank_avg": 0.0845278799533844, "step": 2895, "valid_targets_mean": 5316.0, "valid_targets_min": 1397 }, { "epoch": 2.4850042844901457, "grad_norm": 0.587813292998456, "learning_rate": 3.2593490955958374e-05, "loss": 0.2063, "loss_nan_ranks": 0, "loss_rank_avg": 0.1236010491847992, "step": 2900, "valid_targets_mean": 4464.0, "valid_targets_min": 908 }, { "epoch": 2.4892887746358183, "grad_norm": 0.5067347323119288, "learning_rate": 3.256026617311662e-05, "loss": 0.202, "loss_nan_ranks": 0, "loss_rank_avg": 0.09447930008172989, "step": 2905, "valid_targets_mean": 4661.0, "valid_targets_min": 2243 }, { "epoch": 2.493573264781491, "grad_norm": 0.5698817677028789, "learning_rate": 3.252698405426912e-05, "loss": 0.2137, "loss_nan_ranks": 0, "loss_rank_avg": 0.09549528360366821, "step": 2910, "valid_targets_mean": 4545.1, "valid_targets_min": 648 }, { "epoch": 2.4978577549271637, "grad_norm": 0.5216276128702821, "learning_rate": 3.249364475134447e-05, "loss": 0.203, "loss_nan_ranks": 0, "loss_rank_avg": 0.1125568151473999, "step": 2915, "valid_targets_mean": 4951.6, "valid_targets_min": 2860 }, { "epoch": 2.5021422450728363, "grad_norm": 0.42280291475452436, "learning_rate": 3.246024841653233e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.0859423577785492, "step": 2920, "valid_targets_mean": 5395.1, "valid_targets_min": 1793 }, { "epoch": 2.506426735218509, "grad_norm": 0.5223758050374674, "learning_rate": 3.2426795202282675e-05, "loss": 0.1963, "loss_nan_ranks": 0, "loss_rank_avg": 0.08532857149839401, "step": 2925, "valid_targets_mean": 6232.2, "valid_targets_min": 4735 }, { "epoch": 2.5107112253641817, "grad_norm": 0.4856689543602733, "learning_rate": 3.239328526130516e-05, "loss": 0.2011, "loss_nan_ranks": 0, "loss_rank_avg": 0.09928176552057266, "step": 2930, "valid_targets_mean": 5423.1, "valid_targets_min": 1613 }, { "epoch": 2.5149957155098543, "grad_norm": 0.4321558846322626, "learning_rate": 3.235971874656835e-05, "loss": 0.1907, "loss_nan_ranks": 0, "loss_rank_avg": 0.08418859541416168, "step": 2935, "valid_targets_mean": 5001.8, "valid_targets_min": 1040 }, { "epoch": 2.519280205655527, "grad_norm": 0.48854417396408445, "learning_rate": 3.2326095811299096e-05, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.10312269628047943, "step": 2940, "valid_targets_mean": 4326.8, "valid_targets_min": 2391 }, { "epoch": 2.5235646958011997, "grad_norm": 0.47592753685481903, "learning_rate": 3.22924166089818e-05, "loss": 0.2075, "loss_nan_ranks": 0, "loss_rank_avg": 0.10614067316055298, "step": 2945, "valid_targets_mean": 5605.1, "valid_targets_min": 2827 }, { "epoch": 2.5278491859468724, "grad_norm": 0.48528302022832537, "learning_rate": 3.225868129335768e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.09091340005397797, "step": 2950, "valid_targets_mean": 4797.1, "valid_targets_min": 1697 }, { "epoch": 2.532133676092545, "grad_norm": 0.5251980386220312, "learning_rate": 3.2224890018424156e-05, "loss": 0.2037, "loss_nan_ranks": 0, "loss_rank_avg": 0.09622952342033386, "step": 2955, "valid_targets_mean": 4853.0, "valid_targets_min": 2149 }, { "epoch": 2.5364181662382177, "grad_norm": 0.541458693239247, "learning_rate": 3.219104293843405e-05, "loss": 0.1949, "loss_nan_ranks": 0, "loss_rank_avg": 0.10172342509031296, "step": 2960, "valid_targets_mean": 4165.2, "valid_targets_min": 1455 }, { "epoch": 2.5407026563838904, "grad_norm": 0.5178417669621618, "learning_rate": 3.215714020789495e-05, "loss": 0.2124, "loss_nan_ranks": 0, "loss_rank_avg": 0.09176942706108093, "step": 2965, "valid_targets_mean": 3891.8, "valid_targets_min": 981 }, { "epoch": 2.544987146529563, "grad_norm": 0.4483728443085302, "learning_rate": 3.212318198156848e-05, "loss": 0.2074, "loss_nan_ranks": 0, "loss_rank_avg": 0.09753090143203735, "step": 2970, "valid_targets_mean": 5039.6, "valid_targets_min": 2813 }, { "epoch": 2.5492716366752357, "grad_norm": 0.43906680838014805, "learning_rate": 3.208916841446959e-05, "loss": 0.212, "loss_nan_ranks": 0, "loss_rank_avg": 0.08158387988805771, "step": 2975, "valid_targets_mean": 5588.9, "valid_targets_min": 3214 }, { "epoch": 2.5535561268209084, "grad_norm": 0.42515686500054095, "learning_rate": 3.2055099661865854e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.09098470211029053, "step": 2980, "valid_targets_mean": 5731.4, "valid_targets_min": 3643 }, { "epoch": 2.557840616966581, "grad_norm": 0.4667107050928945, "learning_rate": 3.202097587927676e-05, "loss": 0.1966, "loss_nan_ranks": 0, "loss_rank_avg": 0.11131277680397034, "step": 2985, "valid_targets_mean": 4814.0, "valid_targets_min": 1697 }, { "epoch": 2.5621251071122537, "grad_norm": 0.5191660325554805, "learning_rate": 3.1986797222473016e-05, "loss": 0.1922, "loss_nan_ranks": 0, "loss_rank_avg": 0.102913036942482, "step": 2990, "valid_targets_mean": 4120.5, "valid_targets_min": 1392 }, { "epoch": 2.5664095972579264, "grad_norm": 0.5098529158119127, "learning_rate": 3.1952563847475805e-05, "loss": 0.2054, "loss_nan_ranks": 0, "loss_rank_avg": 0.10675621777772903, "step": 2995, "valid_targets_mean": 5657.0, "valid_targets_min": 1446 }, { "epoch": 2.570694087403599, "grad_norm": 0.4757706576119366, "learning_rate": 3.191827591055609e-05, "loss": 0.187, "loss_nan_ranks": 0, "loss_rank_avg": 0.08147279173135757, "step": 3000, "valid_targets_mean": 4523.4, "valid_targets_min": 1596 }, { "epoch": 2.5749785775492717, "grad_norm": 0.47439322539254747, "learning_rate": 3.1883933568233915e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.08240111172199249, "step": 3005, "valid_targets_mean": 6329.6, "valid_targets_min": 4234 }, { "epoch": 2.5792630676949444, "grad_norm": 0.4301275527510319, "learning_rate": 3.184953697727767e-05, "loss": 0.202, "loss_nan_ranks": 0, "loss_rank_avg": 0.09618514031171799, "step": 3010, "valid_targets_mean": 6511.9, "valid_targets_min": 3879 }, { "epoch": 2.583547557840617, "grad_norm": 0.4585872283916217, "learning_rate": 3.181508629470339e-05, "loss": 0.2221, "loss_nan_ranks": 0, "loss_rank_avg": 0.1063903272151947, "step": 3015, "valid_targets_mean": 3837.1, "valid_targets_min": 1377 }, { "epoch": 2.5878320479862897, "grad_norm": 0.4767544940704192, "learning_rate": 3.1780581677774026e-05, "loss": 0.1959, "loss_nan_ranks": 0, "loss_rank_avg": 0.10895279049873352, "step": 3020, "valid_targets_mean": 5447.4, "valid_targets_min": 1774 }, { "epoch": 2.5921165381319624, "grad_norm": 0.505750162963359, "learning_rate": 3.1746023283998736e-05, "loss": 0.1955, "loss_nan_ranks": 0, "loss_rank_avg": 0.0998040959239006, "step": 3025, "valid_targets_mean": 3948.4, "valid_targets_min": 1631 }, { "epoch": 2.596401028277635, "grad_norm": 0.4324680394219439, "learning_rate": 3.1711411271132156e-05, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.09612485021352768, "step": 3030, "valid_targets_mean": 5286.2, "valid_targets_min": 1612 }, { "epoch": 2.6006855184233078, "grad_norm": 0.44679380951456976, "learning_rate": 3.1676745797173685e-05, "loss": 0.1929, "loss_nan_ranks": 0, "loss_rank_avg": 0.08475670218467712, "step": 3035, "valid_targets_mean": 5412.5, "valid_targets_min": 2685 }, { "epoch": 2.6049700085689804, "grad_norm": 0.45529448999326766, "learning_rate": 3.164202702036677e-05, "loss": 0.1813, "loss_nan_ranks": 0, "loss_rank_avg": 0.11184944212436676, "step": 3040, "valid_targets_mean": 6625.9, "valid_targets_min": 4048 }, { "epoch": 2.609254498714653, "grad_norm": 0.5200508408646883, "learning_rate": 3.16072550991982e-05, "loss": 0.2133, "loss_nan_ranks": 0, "loss_rank_avg": 0.10833759605884552, "step": 3045, "valid_targets_mean": 4254.2, "valid_targets_min": 1634 }, { "epoch": 2.6135389888603258, "grad_norm": 0.47583075311418843, "learning_rate": 3.157243019239731e-05, "loss": 0.1901, "loss_nan_ranks": 0, "loss_rank_avg": 0.09005630761384964, "step": 3050, "valid_targets_mean": 4993.1, "valid_targets_min": 1900 }, { "epoch": 2.6178234790059984, "grad_norm": 0.47116305006250425, "learning_rate": 3.1537552458935356e-05, "loss": 0.1964, "loss_nan_ranks": 0, "loss_rank_avg": 0.08517856150865555, "step": 3055, "valid_targets_mean": 5333.1, "valid_targets_min": 1795 }, { "epoch": 2.622107969151671, "grad_norm": 0.46550629698322077, "learning_rate": 3.150262205802472e-05, "loss": 0.1891, "loss_nan_ranks": 0, "loss_rank_avg": 0.09626109898090363, "step": 3060, "valid_targets_mean": 5502.6, "valid_targets_min": 3489 }, { "epoch": 2.6263924592973438, "grad_norm": 0.5190463480248941, "learning_rate": 3.1467639149118195e-05, "loss": 0.1979, "loss_nan_ranks": 0, "loss_rank_avg": 0.08040817081928253, "step": 3065, "valid_targets_mean": 4047.1, "valid_targets_min": 996 }, { "epoch": 2.6306769494430164, "grad_norm": 0.47565052334057345, "learning_rate": 3.1432603891908295e-05, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.10391212999820709, "step": 3070, "valid_targets_mean": 6069.5, "valid_targets_min": 2558 }, { "epoch": 2.6349614395886887, "grad_norm": 0.49248862544332433, "learning_rate": 3.1397516446326464e-05, "loss": 0.2175, "loss_nan_ranks": 0, "loss_rank_avg": 0.10490263998508453, "step": 3075, "valid_targets_mean": 5443.2, "valid_targets_min": 2735 }, { "epoch": 2.6392459297343613, "grad_norm": 0.4861909277172617, "learning_rate": 3.136237697254241e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.11516415327787399, "step": 3080, "valid_targets_mean": 5015.1, "valid_targets_min": 2795 }, { "epoch": 2.643530419880034, "grad_norm": 0.6286859927618421, "learning_rate": 3.132718563096332e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.09952767938375473, "step": 3085, "valid_targets_mean": 5225.5, "valid_targets_min": 2651 }, { "epoch": 2.6478149100257067, "grad_norm": 0.5524151436612424, "learning_rate": 3.129194258223316e-05, "loss": 0.2082, "loss_nan_ranks": 0, "loss_rank_avg": 0.11292801052331924, "step": 3090, "valid_targets_mean": 4077.6, "valid_targets_min": 1330 }, { "epoch": 2.6520994001713794, "grad_norm": 0.495231500813035, "learning_rate": 3.125664798723193e-05, "loss": 0.1899, "loss_nan_ranks": 0, "loss_rank_avg": 0.10587464272975922, "step": 3095, "valid_targets_mean": 5196.5, "valid_targets_min": 3772 }, { "epoch": 2.656383890317052, "grad_norm": 0.4357989088506872, "learning_rate": 3.122130200707494e-05, "loss": 0.2054, "loss_nan_ranks": 0, "loss_rank_avg": 0.09586100280284882, "step": 3100, "valid_targets_mean": 5426.6, "valid_targets_min": 1967 }, { "epoch": 2.6606683804627247, "grad_norm": 0.5325689265202237, "learning_rate": 3.118590480311206e-05, "loss": 0.2071, "loss_nan_ranks": 0, "loss_rank_avg": 0.08797873556613922, "step": 3105, "valid_targets_mean": 3848.8, "valid_targets_min": 1716 }, { "epoch": 2.6649528706083974, "grad_norm": 0.4396920701228743, "learning_rate": 3.115045653692698e-05, "loss": 0.1957, "loss_nan_ranks": 0, "loss_rank_avg": 0.09114794433116913, "step": 3110, "valid_targets_mean": 4718.9, "valid_targets_min": 2123 }, { "epoch": 2.66923736075407, "grad_norm": 0.550751313514682, "learning_rate": 3.111495737033651e-05, "loss": 0.2054, "loss_nan_ranks": 0, "loss_rank_avg": 0.10032795369625092, "step": 3115, "valid_targets_mean": 3613.1, "valid_targets_min": 1622 }, { "epoch": 2.6735218508997427, "grad_norm": 0.41079175675526175, "learning_rate": 3.107940746538978e-05, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.08481456339359283, "step": 3120, "valid_targets_mean": 5954.8, "valid_targets_min": 3243 }, { "epoch": 2.6778063410454154, "grad_norm": 0.5076145326822086, "learning_rate": 3.104380698436757e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.12480606138706207, "step": 3125, "valid_targets_mean": 5253.0, "valid_targets_min": 1945 }, { "epoch": 2.682090831191088, "grad_norm": 0.49899317879815436, "learning_rate": 3.100815608978149e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.09135354310274124, "step": 3130, "valid_targets_mean": 4251.4, "valid_targets_min": 2493 }, { "epoch": 2.6863753213367607, "grad_norm": 0.6388457405969222, "learning_rate": 3.097245494437333e-05, "loss": 0.204, "loss_nan_ranks": 0, "loss_rank_avg": 0.09539501368999481, "step": 3135, "valid_targets_mean": 4684.8, "valid_targets_min": 976 }, { "epoch": 2.6906598114824334, "grad_norm": 0.4922925574234516, "learning_rate": 3.093670371111423e-05, "loss": 0.191, "loss_nan_ranks": 0, "loss_rank_avg": 0.09869565814733505, "step": 3140, "valid_targets_mean": 3889.5, "valid_targets_min": 2515 }, { "epoch": 2.694944301628106, "grad_norm": 0.4788156391819075, "learning_rate": 3.0900902553204e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.0883324146270752, "step": 3145, "valid_targets_mean": 6716.8, "valid_targets_min": 3263 }, { "epoch": 2.6992287917737787, "grad_norm": 0.5726806445817842, "learning_rate": 3.086505163407032e-05, "loss": 0.1973, "loss_nan_ranks": 0, "loss_rank_avg": 0.12586042284965515, "step": 3150, "valid_targets_mean": 5087.8, "valid_targets_min": 3199 }, { "epoch": 2.7035132819194514, "grad_norm": 0.4559348559533937, "learning_rate": 3.082915111736807e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.09658126533031464, "step": 3155, "valid_targets_mean": 5267.8, "valid_targets_min": 2678 }, { "epoch": 2.707797772065124, "grad_norm": 0.5227607109278021, "learning_rate": 3.0793201166978476e-05, "loss": 0.1999, "loss_nan_ranks": 0, "loss_rank_avg": 0.11674916744232178, "step": 3160, "valid_targets_mean": 5233.1, "valid_targets_min": 2110 }, { "epoch": 2.7120822622107967, "grad_norm": 0.5381499374038914, "learning_rate": 3.0757201947008483e-05, "loss": 0.2023, "loss_nan_ranks": 0, "loss_rank_avg": 0.1280943900346756, "step": 3165, "valid_targets_mean": 5339.1, "valid_targets_min": 1444 }, { "epoch": 2.7163667523564694, "grad_norm": 0.4876029858247357, "learning_rate": 3.07211536217899e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.09767451882362366, "step": 3170, "valid_targets_mean": 4989.1, "valid_targets_min": 1777 }, { "epoch": 2.720651242502142, "grad_norm": 0.5259217745782021, "learning_rate": 3.0685056355878726e-05, "loss": 0.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.12681160867214203, "step": 3175, "valid_targets_mean": 4674.9, "valid_targets_min": 974 }, { "epoch": 2.7249357326478147, "grad_norm": 0.4762818016196657, "learning_rate": 3.064891031405434e-05, "loss": 0.1943, "loss_nan_ranks": 0, "loss_rank_avg": 0.11337507516145706, "step": 3180, "valid_targets_mean": 5564.9, "valid_targets_min": 1805 }, { "epoch": 2.7292202227934874, "grad_norm": 0.453669260564161, "learning_rate": 3.0612715661318805e-05, "loss": 0.2003, "loss_nan_ranks": 0, "loss_rank_avg": 0.1022944450378418, "step": 3185, "valid_targets_mean": 5294.9, "valid_targets_min": 1899 }, { "epoch": 2.73350471293916, "grad_norm": 0.4889641599281156, "learning_rate": 3.0576472562896075e-05, "loss": 0.2022, "loss_nan_ranks": 0, "loss_rank_avg": 0.08817283809185028, "step": 3190, "valid_targets_mean": 5229.1, "valid_targets_min": 2106 }, { "epoch": 2.7377892030848328, "grad_norm": 0.49903719744109054, "learning_rate": 3.054018118423124e-05, "loss": 0.2094, "loss_nan_ranks": 0, "loss_rank_avg": 0.1024971455335617, "step": 3195, "valid_targets_mean": 5159.2, "valid_targets_min": 2495 }, { "epoch": 2.7420736932305054, "grad_norm": 0.49119777255841934, "learning_rate": 3.0503841690989796e-05, "loss": 0.1884, "loss_nan_ranks": 0, "loss_rank_avg": 0.09236447513103485, "step": 3200, "valid_targets_mean": 4263.9, "valid_targets_min": 1124 }, { "epoch": 2.746358183376178, "grad_norm": 0.42139121040252897, "learning_rate": 3.046745424905688e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.0806296318769455, "step": 3205, "valid_targets_mean": 5324.8, "valid_targets_min": 2062 }, { "epoch": 2.7506426735218508, "grad_norm": 0.8660851118774108, "learning_rate": 3.043101902453649e-05, "loss": 0.198, "loss_nan_ranks": 0, "loss_rank_avg": 0.09605230391025543, "step": 3210, "valid_targets_mean": 4066.8, "valid_targets_min": 1700 }, { "epoch": 2.7549271636675234, "grad_norm": 0.5879290547420875, "learning_rate": 3.0394536183750767e-05, "loss": 0.1951, "loss_nan_ranks": 0, "loss_rank_avg": 0.09734377264976501, "step": 3215, "valid_targets_mean": 4280.2, "valid_targets_min": 1991 }, { "epoch": 2.759211653813196, "grad_norm": 0.4906383846943346, "learning_rate": 3.03580058932392e-05, "loss": 0.1843, "loss_nan_ranks": 0, "loss_rank_avg": 0.07829025387763977, "step": 3220, "valid_targets_mean": 4240.2, "valid_targets_min": 2774 }, { "epoch": 2.763496143958869, "grad_norm": 0.4477719224428516, "learning_rate": 3.0321428319757893e-05, "loss": 0.1962, "loss_nan_ranks": 0, "loss_rank_avg": 0.08995410054922104, "step": 3225, "valid_targets_mean": 5337.2, "valid_targets_min": 2546 }, { "epoch": 2.7677806341045414, "grad_norm": 0.48047544514516427, "learning_rate": 3.0284803630278775e-05, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.091777004301548, "step": 3230, "valid_targets_mean": 4903.8, "valid_targets_min": 3388 }, { "epoch": 2.772065124250214, "grad_norm": 0.47975164003492826, "learning_rate": 3.0248131991988857e-05, "loss": 0.198, "loss_nan_ranks": 0, "loss_rank_avg": 0.1095355898141861, "step": 3235, "valid_targets_mean": 5540.9, "valid_targets_min": 2016 }, { "epoch": 2.776349614395887, "grad_norm": 0.465247942884362, "learning_rate": 3.0211413572289482e-05, "loss": 0.1996, "loss_nan_ranks": 0, "loss_rank_avg": 0.10163888335227966, "step": 3240, "valid_targets_mean": 5639.5, "valid_targets_min": 3602 }, { "epoch": 2.7806341045415595, "grad_norm": 0.4641303234289437, "learning_rate": 3.0174648538795515e-05, "loss": 0.2, "loss_nan_ranks": 0, "loss_rank_avg": 0.10476160049438477, "step": 3245, "valid_targets_mean": 5816.5, "valid_targets_min": 3071 }, { "epoch": 2.784918594687232, "grad_norm": 0.505653288338379, "learning_rate": 3.013783705933463e-05, "loss": 0.1948, "loss_nan_ranks": 0, "loss_rank_avg": 0.10704667121171951, "step": 3250, "valid_targets_mean": 5718.9, "valid_targets_min": 2908 }, { "epoch": 2.789203084832905, "grad_norm": 0.4816018494525304, "learning_rate": 3.0100979301946532e-05, "loss": 0.1971, "loss_nan_ranks": 0, "loss_rank_avg": 0.10598535090684891, "step": 3255, "valid_targets_mean": 4577.1, "valid_targets_min": 2044 }, { "epoch": 2.7934875749785775, "grad_norm": 0.4266350764785256, "learning_rate": 3.0064075434882132e-05, "loss": 0.1931, "loss_nan_ranks": 0, "loss_rank_avg": 0.09043243527412415, "step": 3260, "valid_targets_mean": 6281.5, "valid_targets_min": 3937 }, { "epoch": 2.79777206512425, "grad_norm": 0.4644479409123575, "learning_rate": 3.0027125626602873e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.08926934003829956, "step": 3265, "valid_targets_mean": 5050.8, "valid_targets_min": 2544 }, { "epoch": 2.802056555269923, "grad_norm": 0.4396938445335989, "learning_rate": 2.9990130045779883e-05, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.0825769230723381, "step": 3270, "valid_targets_mean": 5007.4, "valid_targets_min": 1194 }, { "epoch": 2.8063410454155955, "grad_norm": 0.5118083821075619, "learning_rate": 2.9953088861293262e-05, "loss": 0.2037, "loss_nan_ranks": 0, "loss_rank_avg": 0.10184841603040695, "step": 3275, "valid_targets_mean": 3770.6, "valid_targets_min": 1691 }, { "epoch": 2.810625535561268, "grad_norm": 0.5105152513424626, "learning_rate": 2.9916002242231262e-05, "loss": 0.1961, "loss_nan_ranks": 0, "loss_rank_avg": 0.132453054189682, "step": 3280, "valid_targets_mean": 5373.8, "valid_targets_min": 865 }, { "epoch": 2.814910025706941, "grad_norm": 0.49738165894659575, "learning_rate": 2.9878870357889544e-05, "loss": 0.1921, "loss_nan_ranks": 0, "loss_rank_avg": 0.1020285040140152, "step": 3285, "valid_targets_mean": 5117.5, "valid_targets_min": 1751 }, { "epoch": 2.8191945158526135, "grad_norm": 0.4634789342087233, "learning_rate": 2.9841693377770416e-05, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.08905909955501556, "step": 3290, "valid_targets_mean": 5624.5, "valid_targets_min": 2650 }, { "epoch": 2.823479005998286, "grad_norm": 0.4864734023517098, "learning_rate": 2.980447147158202e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.12124571949243546, "step": 3295, "valid_targets_mean": 5532.0, "valid_targets_min": 1678 }, { "epoch": 2.827763496143959, "grad_norm": 0.4764156499362963, "learning_rate": 2.9767204809237588e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.10643521696329117, "step": 3300, "valid_targets_mean": 6071.6, "valid_targets_min": 1965 }, { "epoch": 2.8320479862896315, "grad_norm": 0.5007611593322627, "learning_rate": 2.972989356085466e-05, "loss": 0.1954, "loss_nan_ranks": 0, "loss_rank_avg": 0.09378144145011902, "step": 3305, "valid_targets_mean": 4657.8, "valid_targets_min": 1111 }, { "epoch": 2.836332476435304, "grad_norm": 0.5005017672048564, "learning_rate": 2.9692537896754298e-05, "loss": 0.193, "loss_nan_ranks": 0, "loss_rank_avg": 0.11224367469549179, "step": 3310, "valid_targets_mean": 4564.1, "valid_targets_min": 2544 }, { "epoch": 2.840616966580977, "grad_norm": 0.48187504122875946, "learning_rate": 2.9655137987460335e-05, "loss": 0.1922, "loss_nan_ranks": 0, "loss_rank_avg": 0.08884987235069275, "step": 3315, "valid_targets_mean": 5739.2, "valid_targets_min": 2278 }, { "epoch": 2.8449014567266495, "grad_norm": 0.4741640143584193, "learning_rate": 2.9617694003698562e-05, "loss": 0.176, "loss_nan_ranks": 0, "loss_rank_avg": 0.08888500183820724, "step": 3320, "valid_targets_mean": 4935.2, "valid_targets_min": 1853 }, { "epoch": 2.849185946872322, "grad_norm": 0.5052854112998219, "learning_rate": 2.958020611639596e-05, "loss": 0.1922, "loss_nan_ranks": 0, "loss_rank_avg": 0.12267468869686127, "step": 3325, "valid_targets_mean": 6198.9, "valid_targets_min": 4193 }, { "epoch": 2.853470437017995, "grad_norm": 0.5101750578437945, "learning_rate": 2.9542674496679934e-05, "loss": 0.1876, "loss_nan_ranks": 0, "loss_rank_avg": 0.09153853356838226, "step": 3330, "valid_targets_mean": 4406.9, "valid_targets_min": 958 }, { "epoch": 2.8577549271636675, "grad_norm": 0.49964993139780745, "learning_rate": 2.9505099315877523e-05, "loss": 0.1858, "loss_nan_ranks": 0, "loss_rank_avg": 0.09591518342494965, "step": 3335, "valid_targets_mean": 5327.9, "valid_targets_min": 2086 }, { "epoch": 2.86203941730934, "grad_norm": 0.4801936085794442, "learning_rate": 2.9467480745514602e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.10366001725196838, "step": 3340, "valid_targets_mean": 5311.1, "valid_targets_min": 2174 }, { "epoch": 2.866323907455013, "grad_norm": 0.5427472421890712, "learning_rate": 2.9429818957315136e-05, "loss": 0.1904, "loss_nan_ranks": 0, "loss_rank_avg": 0.1099645346403122, "step": 3345, "valid_targets_mean": 4822.6, "valid_targets_min": 2990 }, { "epoch": 2.8706083976006855, "grad_norm": 0.4766043311462836, "learning_rate": 2.9392114123200364e-05, "loss": 0.2057, "loss_nan_ranks": 0, "loss_rank_avg": 0.10909044742584229, "step": 3350, "valid_targets_mean": 5208.8, "valid_targets_min": 3584 }, { "epoch": 2.874892887746358, "grad_norm": 0.5119800749708363, "learning_rate": 2.9354366415288014e-05, "loss": 0.19, "loss_nan_ranks": 0, "loss_rank_avg": 0.09974499046802521, "step": 3355, "valid_targets_mean": 4476.0, "valid_targets_min": 1244 }, { "epoch": 2.879177377892031, "grad_norm": 0.48951315745386836, "learning_rate": 2.9316576005891542e-05, "loss": 0.1857, "loss_nan_ranks": 0, "loss_rank_avg": 0.08528132736682892, "step": 3360, "valid_targets_mean": 4576.9, "valid_targets_min": 2041 }, { "epoch": 2.8834618680377035, "grad_norm": 0.49140619995629536, "learning_rate": 2.9278743067519326e-05, "loss": 0.1891, "loss_nan_ranks": 0, "loss_rank_avg": 0.13168025016784668, "step": 3365, "valid_targets_mean": 6030.4, "valid_targets_min": 2371 }, { "epoch": 2.887746358183376, "grad_norm": 0.4819206963434024, "learning_rate": 2.9240867772873874e-05, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.1023363322019577, "step": 3370, "valid_targets_mean": 4449.2, "valid_targets_min": 3215 }, { "epoch": 2.892030848329049, "grad_norm": 0.5091994742881791, "learning_rate": 2.920295029485106e-05, "loss": 0.1927, "loss_nan_ranks": 0, "loss_rank_avg": 0.10762618482112885, "step": 3375, "valid_targets_mean": 5931.4, "valid_targets_min": 2190 }, { "epoch": 2.8963153384747216, "grad_norm": 0.45100342040875835, "learning_rate": 2.916499080653931e-05, "loss": 0.1751, "loss_nan_ranks": 0, "loss_rank_avg": 0.10775713622570038, "step": 3380, "valid_targets_mean": 5796.4, "valid_targets_min": 1079 }, { "epoch": 2.9005998286203942, "grad_norm": 0.4190962708075657, "learning_rate": 2.9126989481218825e-05, "loss": 0.2045, "loss_nan_ranks": 0, "loss_rank_avg": 0.08602378517389297, "step": 3385, "valid_targets_mean": 5787.2, "valid_targets_min": 1951 }, { "epoch": 2.904884318766067, "grad_norm": 0.5697440698751479, "learning_rate": 2.9088946492360785e-05, "loss": 0.2074, "loss_nan_ranks": 0, "loss_rank_avg": 0.1274511069059372, "step": 3390, "valid_targets_mean": 4970.1, "valid_targets_min": 1205 }, { "epoch": 2.9091688089117396, "grad_norm": 0.4196775106056009, "learning_rate": 2.9050862013626564e-05, "loss": 0.1893, "loss_nan_ranks": 0, "loss_rank_avg": 0.0831018015742302, "step": 3395, "valid_targets_mean": 5513.4, "valid_targets_min": 1654 }, { "epoch": 2.9134532990574122, "grad_norm": 0.5081613353431708, "learning_rate": 2.901273621886693e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.10517710447311401, "step": 3400, "valid_targets_mean": 3801.2, "valid_targets_min": 1711 }, { "epoch": 2.917737789203085, "grad_norm": 0.45930708882009963, "learning_rate": 2.8974569282121234e-05, "loss": 0.197, "loss_nan_ranks": 0, "loss_rank_avg": 0.06961196660995483, "step": 3405, "valid_targets_mean": 4856.4, "valid_targets_min": 2652 }, { "epoch": 2.9220222793487576, "grad_norm": 0.481696740533411, "learning_rate": 2.893636137761667e-05, "loss": 0.1823, "loss_nan_ranks": 0, "loss_rank_avg": 0.09374944865703583, "step": 3410, "valid_targets_mean": 5881.6, "valid_targets_min": 3134 }, { "epoch": 2.9263067694944302, "grad_norm": 0.4503892609201548, "learning_rate": 2.8898112679767423e-05, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.08698620647192001, "step": 3415, "valid_targets_mean": 6453.8, "valid_targets_min": 3057 }, { "epoch": 2.930591259640103, "grad_norm": 0.5118223470574057, "learning_rate": 2.8859823363173895e-05, "loss": 0.1877, "loss_nan_ranks": 0, "loss_rank_avg": 0.0849127247929573, "step": 3420, "valid_targets_mean": 5139.4, "valid_targets_min": 1009 }, { "epoch": 2.9348757497857756, "grad_norm": 0.6604188562733819, "learning_rate": 2.8821493602621905e-05, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.0802006646990776, "step": 3425, "valid_targets_mean": 3835.0, "valid_targets_min": 505 }, { "epoch": 2.9391602399314483, "grad_norm": 0.4628759246456681, "learning_rate": 2.8783123573081914e-05, "loss": 0.1881, "loss_nan_ranks": 0, "loss_rank_avg": 0.08029916882514954, "step": 3430, "valid_targets_mean": 4832.9, "valid_targets_min": 2019 }, { "epoch": 2.943444730077121, "grad_norm": 0.46129914147611034, "learning_rate": 2.8744713449708177e-05, "loss": 0.1899, "loss_nan_ranks": 0, "loss_rank_avg": 0.10295387357473373, "step": 3435, "valid_targets_mean": 5271.5, "valid_targets_min": 2478 }, { "epoch": 2.9477292202227936, "grad_norm": 0.441159023257155, "learning_rate": 2.8706263407837987e-05, "loss": 0.1923, "loss_nan_ranks": 0, "loss_rank_avg": 0.0948648527264595, "step": 3440, "valid_targets_mean": 5663.5, "valid_targets_min": 1505 }, { "epoch": 2.9520137103684663, "grad_norm": 0.45438783348338496, "learning_rate": 2.8667773622990866e-05, "loss": 0.1908, "loss_nan_ranks": 0, "loss_rank_avg": 0.07966434955596924, "step": 3445, "valid_targets_mean": 4331.8, "valid_targets_min": 1691 }, { "epoch": 2.956298200514139, "grad_norm": 0.4711518580687224, "learning_rate": 2.862924427086774e-05, "loss": 0.1946, "loss_nan_ranks": 0, "loss_rank_avg": 0.08603475242853165, "step": 3450, "valid_targets_mean": 4567.8, "valid_targets_min": 1840 }, { "epoch": 2.9605826906598116, "grad_norm": 0.47190988623418867, "learning_rate": 2.8590675527350176e-05, "loss": 0.1844, "loss_nan_ranks": 0, "loss_rank_avg": 0.09044405072927475, "step": 3455, "valid_targets_mean": 5541.8, "valid_targets_min": 1713 }, { "epoch": 2.9648671808054843, "grad_norm": 0.4720059395646641, "learning_rate": 2.855206756849954e-05, "loss": 0.1878, "loss_nan_ranks": 0, "loss_rank_avg": 0.10311125218868256, "step": 3460, "valid_targets_mean": 6031.2, "valid_targets_min": 3389 }, { "epoch": 2.969151670951157, "grad_norm": 0.4655184637568635, "learning_rate": 2.8513420570556215e-05, "loss": 0.2065, "loss_nan_ranks": 0, "loss_rank_avg": 0.1196562647819519, "step": 3465, "valid_targets_mean": 6100.0, "valid_targets_min": 2060 }, { "epoch": 2.9734361610968296, "grad_norm": 0.47509143615627447, "learning_rate": 2.84747347099388e-05, "loss": 0.193, "loss_nan_ranks": 0, "loss_rank_avg": 0.10468809306621552, "step": 3470, "valid_targets_mean": 5777.6, "valid_targets_min": 3849 }, { "epoch": 2.9777206512425023, "grad_norm": 0.498289537677379, "learning_rate": 2.8436010163243287e-05, "loss": 0.1943, "loss_nan_ranks": 0, "loss_rank_avg": 0.09609770029783249, "step": 3475, "valid_targets_mean": 4283.6, "valid_targets_min": 1896 }, { "epoch": 2.982005141388175, "grad_norm": 0.507469384352556, "learning_rate": 2.8397247107242277e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.08562733232975006, "step": 3480, "valid_targets_mean": 4300.0, "valid_targets_min": 1174 }, { "epoch": 2.9862896315338476, "grad_norm": 0.47299832417200927, "learning_rate": 2.835844571888415e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.07681527733802795, "step": 3485, "valid_targets_mean": 4179.5, "valid_targets_min": 2248 }, { "epoch": 2.9905741216795203, "grad_norm": 0.4667157029346048, "learning_rate": 2.8319606175292268e-05, "loss": 0.1855, "loss_nan_ranks": 0, "loss_rank_avg": 0.09336496889591217, "step": 3490, "valid_targets_mean": 5837.1, "valid_targets_min": 3571 }, { "epoch": 2.994858611825193, "grad_norm": 0.4634512544107229, "learning_rate": 2.828072865376418e-05, "loss": 0.2023, "loss_nan_ranks": 0, "loss_rank_avg": 0.08310113102197647, "step": 3495, "valid_targets_mean": 5144.8, "valid_targets_min": 2286 }, { "epoch": 2.9991431019708656, "grad_norm": 0.49616404871527503, "learning_rate": 2.824181333177078e-05, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.06787382811307907, "step": 3500, "valid_targets_mean": 4116.4, "valid_targets_min": 1676 }, { "epoch": 3.0034275921165383, "grad_norm": 0.4456602655142074, "learning_rate": 2.8202860386955534e-05, "loss": 0.1831, "loss_nan_ranks": 0, "loss_rank_avg": 0.06987389177083969, "step": 3505, "valid_targets_mean": 4272.9, "valid_targets_min": 1939 }, { "epoch": 3.007712082262211, "grad_norm": 0.5110710630191438, "learning_rate": 2.816386999713365e-05, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.09876535832881927, "step": 3510, "valid_targets_mean": 5605.4, "valid_targets_min": 2389 }, { "epoch": 3.0119965724078837, "grad_norm": 0.5107222623720482, "learning_rate": 2.812484234029124e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.0746680349111557, "step": 3515, "valid_targets_mean": 4642.9, "valid_targets_min": 2104 }, { "epoch": 3.0162810625535563, "grad_norm": 0.5128074506697414, "learning_rate": 2.808577759458458e-05, "loss": 0.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.07372597604990005, "step": 3520, "valid_targets_mean": 4467.4, "valid_targets_min": 2243 }, { "epoch": 3.020565552699229, "grad_norm": 0.4834848424338338, "learning_rate": 2.8046675938339225e-05, "loss": 0.186, "loss_nan_ranks": 0, "loss_rank_avg": 0.08008388429880142, "step": 3525, "valid_targets_mean": 5414.8, "valid_targets_min": 2880 }, { "epoch": 3.0248500428449017, "grad_norm": 0.4846106856666557, "learning_rate": 2.8007537550049217e-05, "loss": 0.1859, "loss_nan_ranks": 0, "loss_rank_avg": 0.0926634818315506, "step": 3530, "valid_targets_mean": 5325.6, "valid_targets_min": 3692 }, { "epoch": 3.0291345329905743, "grad_norm": 0.5380320550491385, "learning_rate": 2.7968362608376286e-05, "loss": 0.1786, "loss_nan_ranks": 0, "loss_rank_avg": 0.09920945763587952, "step": 3535, "valid_targets_mean": 4871.8, "valid_targets_min": 1352 }, { "epoch": 3.033419023136247, "grad_norm": 0.5268363683831023, "learning_rate": 2.792915129214902e-05, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.1121433675289154, "step": 3540, "valid_targets_mean": 5245.8, "valid_targets_min": 2337 }, { "epoch": 3.0377035132819197, "grad_norm": 0.5235815428498671, "learning_rate": 2.7889903780362063e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.07933693379163742, "step": 3545, "valid_targets_mean": 3886.6, "valid_targets_min": 1805 }, { "epoch": 3.041988003427592, "grad_norm": 0.4745143364972243, "learning_rate": 2.785062025217526e-05, "loss": 0.1589, "loss_nan_ranks": 0, "loss_rank_avg": 0.06564758718013763, "step": 3550, "valid_targets_mean": 5061.2, "valid_targets_min": 3020 }, { "epoch": 3.0462724935732646, "grad_norm": 0.5901591936966151, "learning_rate": 2.78113008869129e-05, "loss": 0.1886, "loss_nan_ranks": 0, "loss_rank_avg": 0.11617127805948257, "step": 3555, "valid_targets_mean": 4354.5, "valid_targets_min": 2177 }, { "epoch": 3.0505569837189372, "grad_norm": 0.5031895790828588, "learning_rate": 2.7771945864062847e-05, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.09542632848024368, "step": 3560, "valid_targets_mean": 4467.2, "valid_targets_min": 2041 }, { "epoch": 3.05484147386461, "grad_norm": 0.5067028918137597, "learning_rate": 2.773255536327573e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.1154802069067955, "step": 3565, "valid_targets_mean": 4982.1, "valid_targets_min": 2672 }, { "epoch": 3.0591259640102826, "grad_norm": 0.5295274273062762, "learning_rate": 2.7693129564364138e-05, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.10568901896476746, "step": 3570, "valid_targets_mean": 4102.6, "valid_targets_min": 1626 }, { "epoch": 3.0634104541559553, "grad_norm": 0.5184377694152152, "learning_rate": 2.7653668647301797e-05, "loss": 0.1692, "loss_nan_ranks": 0, "loss_rank_avg": 0.08287379145622253, "step": 3575, "valid_targets_mean": 5492.0, "valid_targets_min": 2635 }, { "epoch": 3.067694944301628, "grad_norm": 0.4426511184640844, "learning_rate": 2.7614172792222737e-05, "loss": 0.1714, "loss_nan_ranks": 0, "loss_rank_avg": 0.07739445567131042, "step": 3580, "valid_targets_mean": 5844.0, "valid_targets_min": 1437 }, { "epoch": 3.0719794344473006, "grad_norm": 0.6163269967783526, "learning_rate": 2.7574642179420467e-05, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.09435909986495972, "step": 3585, "valid_targets_mean": 5930.0, "valid_targets_min": 1412 }, { "epoch": 3.0762639245929733, "grad_norm": 0.4912971796430249, "learning_rate": 2.7535076989347182e-05, "loss": 0.1842, "loss_nan_ranks": 0, "loss_rank_avg": 0.10539242625236511, "step": 3590, "valid_targets_mean": 5639.5, "valid_targets_min": 3804 }, { "epoch": 3.080548414738646, "grad_norm": 0.49155347164096125, "learning_rate": 2.7495477402612905e-05, "loss": 0.1845, "loss_nan_ranks": 0, "loss_rank_avg": 0.09726318717002869, "step": 3595, "valid_targets_mean": 4792.0, "valid_targets_min": 1491 }, { "epoch": 3.0848329048843186, "grad_norm": 0.46870008979654276, "learning_rate": 2.7455843599984658e-05, "loss": 0.1808, "loss_nan_ranks": 0, "loss_rank_avg": 0.08482338488101959, "step": 3600, "valid_targets_mean": 5219.8, "valid_targets_min": 1497 }, { "epoch": 3.0891173950299913, "grad_norm": 0.5315024980579985, "learning_rate": 2.7416175762385687e-05, "loss": 0.1795, "loss_nan_ranks": 0, "loss_rank_avg": 0.105237677693367, "step": 3605, "valid_targets_mean": 5123.6, "valid_targets_min": 3354 }, { "epoch": 3.093401885175664, "grad_norm": 0.5074302541744373, "learning_rate": 2.737647407089459e-05, "loss": 0.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.08297023177146912, "step": 3610, "valid_targets_mean": 4989.2, "valid_targets_min": 2494 }, { "epoch": 3.0976863753213366, "grad_norm": 0.5224620565734408, "learning_rate": 2.7336738706744494e-05, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.07492747157812119, "step": 3615, "valid_targets_mean": 4522.4, "valid_targets_min": 964 }, { "epoch": 3.1019708654670093, "grad_norm": 0.44188115834719727, "learning_rate": 2.7296969851322246e-05, "loss": 0.1818, "loss_nan_ranks": 0, "loss_rank_avg": 0.07636836171150208, "step": 3620, "valid_targets_mean": 5345.1, "valid_targets_min": 1656 }, { "epoch": 3.106255355612682, "grad_norm": 0.48164647718897613, "learning_rate": 2.7257167686167577e-05, "loss": 0.1763, "loss_nan_ranks": 0, "loss_rank_avg": 0.07908610999584198, "step": 3625, "valid_targets_mean": 4995.0, "valid_targets_min": 1741 }, { "epoch": 3.1105398457583546, "grad_norm": 0.46223745921085535, "learning_rate": 2.721733239297228e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.08104974031448364, "step": 3630, "valid_targets_mean": 5590.5, "valid_targets_min": 1385 }, { "epoch": 3.1148243359040273, "grad_norm": 0.5550320490512014, "learning_rate": 2.7177464153579345e-05, "loss": 0.1748, "loss_nan_ranks": 0, "loss_rank_avg": 0.07732957601547241, "step": 3635, "valid_targets_mean": 4547.8, "valid_targets_min": 2008 }, { "epoch": 3.1191088260497, "grad_norm": 0.5493528497955329, "learning_rate": 2.713756314998219e-05, "loss": 0.1811, "loss_nan_ranks": 0, "loss_rank_avg": 0.09979130327701569, "step": 3640, "valid_targets_mean": 4378.2, "valid_targets_min": 814 }, { "epoch": 3.1233933161953726, "grad_norm": 0.5292553656306752, "learning_rate": 2.7097629564323784e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.09737001359462738, "step": 3645, "valid_targets_mean": 3762.6, "valid_targets_min": 2046 }, { "epoch": 3.1276778063410453, "grad_norm": 0.5153566581021852, "learning_rate": 2.705766357889582e-05, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.08181529492139816, "step": 3650, "valid_targets_mean": 3764.9, "valid_targets_min": 1832 }, { "epoch": 3.131962296486718, "grad_norm": 0.533212309221076, "learning_rate": 2.701766537613791e-05, "loss": 0.196, "loss_nan_ranks": 0, "loss_rank_avg": 0.10756025463342667, "step": 3655, "valid_targets_mean": 4934.1, "valid_targets_min": 3003 }, { "epoch": 3.1362467866323906, "grad_norm": 0.4730794348004389, "learning_rate": 2.6977635138636725e-05, "loss": 0.1764, "loss_nan_ranks": 0, "loss_rank_avg": 0.08242323994636536, "step": 3660, "valid_targets_mean": 5205.4, "valid_targets_min": 1267 }, { "epoch": 3.1405312767780633, "grad_norm": 0.5082206695922894, "learning_rate": 2.693757304912516e-05, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.08571913838386536, "step": 3665, "valid_targets_mean": 5586.2, "valid_targets_min": 2777 }, { "epoch": 3.144815766923736, "grad_norm": 0.5194249572852877, "learning_rate": 2.6897479290481537e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.08359972387552261, "step": 3670, "valid_targets_mean": 5197.6, "valid_targets_min": 1005 }, { "epoch": 3.1491002570694087, "grad_norm": 0.5024393062086439, "learning_rate": 2.685735404572871e-05, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.07878033071756363, "step": 3675, "valid_targets_mean": 4835.9, "valid_targets_min": 2000 }, { "epoch": 3.1533847472150813, "grad_norm": 0.4909761470748089, "learning_rate": 2.6817197498033282e-05, "loss": 0.19, "loss_nan_ranks": 0, "loss_rank_avg": 0.09674154222011566, "step": 3680, "valid_targets_mean": 5215.1, "valid_targets_min": 2439 }, { "epoch": 3.157669237360754, "grad_norm": 0.5894183379504294, "learning_rate": 2.6777009830704767e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.09668425470590591, "step": 3685, "valid_targets_mean": 3794.5, "valid_targets_min": 1774 }, { "epoch": 3.1619537275064267, "grad_norm": 0.53445260586619, "learning_rate": 2.6736791227194694e-05, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.07560717314481735, "step": 3690, "valid_targets_mean": 4421.9, "valid_targets_min": 1630 }, { "epoch": 3.1662382176520993, "grad_norm": 0.4985541351909853, "learning_rate": 2.669654187109585e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.08976177871227264, "step": 3695, "valid_targets_mean": 6416.4, "valid_targets_min": 3572 }, { "epoch": 3.170522707797772, "grad_norm": 0.5327057742708573, "learning_rate": 2.665626194614138e-05, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.09565296024084091, "step": 3700, "valid_targets_mean": 6072.0, "valid_targets_min": 3138 }, { "epoch": 3.1748071979434447, "grad_norm": 0.5530367088343197, "learning_rate": 2.6615951636203983e-05, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.09422317147254944, "step": 3705, "valid_targets_mean": 3588.1, "valid_targets_min": 1818 }, { "epoch": 3.1790916880891174, "grad_norm": 0.4790691676535246, "learning_rate": 2.657561112529506e-05, "loss": 0.1675, "loss_nan_ranks": 0, "loss_rank_avg": 0.09259481728076935, "step": 3710, "valid_targets_mean": 5763.2, "valid_targets_min": 3117 }, { "epoch": 3.18337617823479, "grad_norm": 0.49104439000892763, "learning_rate": 2.653524059756387e-05, "loss": 0.1854, "loss_nan_ranks": 0, "loss_rank_avg": 0.1050562709569931, "step": 3715, "valid_targets_mean": 5120.1, "valid_targets_min": 1274 }, { "epoch": 3.1876606683804627, "grad_norm": 0.5244108830562542, "learning_rate": 2.649484023729671e-05, "loss": 0.1726, "loss_nan_ranks": 0, "loss_rank_avg": 0.10317362844944, "step": 3720, "valid_targets_mean": 4561.6, "valid_targets_min": 1123 }, { "epoch": 3.1919451585261354, "grad_norm": 0.5382322149811951, "learning_rate": 2.6454410228916037e-05, "loss": 0.1956, "loss_nan_ranks": 0, "loss_rank_avg": 0.07304810732603073, "step": 3725, "valid_targets_mean": 4988.5, "valid_targets_min": 2542 }, { "epoch": 3.196229648671808, "grad_norm": 0.480710934454029, "learning_rate": 2.6413950756979662e-05, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.07215426862239838, "step": 3730, "valid_targets_mean": 5174.0, "valid_targets_min": 3332 }, { "epoch": 3.2005141388174807, "grad_norm": 0.48834989667916534, "learning_rate": 2.6373462006179895e-05, "loss": 0.1809, "loss_nan_ranks": 0, "loss_rank_avg": 0.09519222378730774, "step": 3735, "valid_targets_mean": 6658.1, "valid_targets_min": 2450 }, { "epoch": 3.2047986289631534, "grad_norm": 0.49688774009942777, "learning_rate": 2.6332944161342697e-05, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.09624415636062622, "step": 3740, "valid_targets_mean": 6799.4, "valid_targets_min": 3828 }, { "epoch": 3.209083119108826, "grad_norm": 0.4506399758467214, "learning_rate": 2.6292397407426826e-05, "loss": 0.1681, "loss_nan_ranks": 0, "loss_rank_avg": 0.07406134903430939, "step": 3745, "valid_targets_mean": 5605.9, "valid_targets_min": 3460 }, { "epoch": 3.2133676092544987, "grad_norm": 0.5409584270562771, "learning_rate": 2.625182192952303e-05, "loss": 0.1894, "loss_nan_ranks": 0, "loss_rank_avg": 0.08308728039264679, "step": 3750, "valid_targets_mean": 3723.2, "valid_targets_min": 1233 }, { "epoch": 3.2176520994001714, "grad_norm": 0.5487106876988163, "learning_rate": 2.621121791285316e-05, "loss": 0.1919, "loss_nan_ranks": 0, "loss_rank_avg": 0.0809471383690834, "step": 3755, "valid_targets_mean": 3911.8, "valid_targets_min": 2035 }, { "epoch": 3.221936589545844, "grad_norm": 0.4873880044416427, "learning_rate": 2.6170585542769353e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.08481766283512115, "step": 3760, "valid_targets_mean": 4059.0, "valid_targets_min": 1602 }, { "epoch": 3.2262210796915167, "grad_norm": 0.5884861590780336, "learning_rate": 2.6129925004753173e-05, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.10550187528133392, "step": 3765, "valid_targets_mean": 4256.6, "valid_targets_min": 2465 }, { "epoch": 3.2305055698371894, "grad_norm": 0.4904994688232888, "learning_rate": 2.6089236484414767e-05, "loss": 0.1715, "loss_nan_ranks": 0, "loss_rank_avg": 0.08721703290939331, "step": 3770, "valid_targets_mean": 6815.4, "valid_targets_min": 2390 }, { "epoch": 3.234790059982862, "grad_norm": 0.49949775985853045, "learning_rate": 2.604852016749201e-05, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.08349231630563736, "step": 3775, "valid_targets_mean": 5104.8, "valid_targets_min": 3264 }, { "epoch": 3.2390745501285347, "grad_norm": 0.49538203709639544, "learning_rate": 2.6007776239849678e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.08115263283252716, "step": 3780, "valid_targets_mean": 5585.4, "valid_targets_min": 2132 }, { "epoch": 3.2433590402742074, "grad_norm": 0.4743043011897055, "learning_rate": 2.5967004887478582e-05, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.07015199214220047, "step": 3785, "valid_targets_mean": 5265.1, "valid_targets_min": 1307 }, { "epoch": 3.24764353041988, "grad_norm": 0.4774324868777757, "learning_rate": 2.592620629649472e-05, "loss": 0.1781, "loss_nan_ranks": 0, "loss_rank_avg": 0.08552783727645874, "step": 3790, "valid_targets_mean": 5696.9, "valid_targets_min": 2495 }, { "epoch": 3.2519280205655527, "grad_norm": 0.47726321679965944, "learning_rate": 2.588538065313842e-05, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.09820352494716644, "step": 3795, "valid_targets_mean": 6080.5, "valid_targets_min": 3405 }, { "epoch": 3.2562125107112254, "grad_norm": 0.47184919744601855, "learning_rate": 2.5844528143773536e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.08200445771217346, "step": 3800, "valid_targets_mean": 5325.4, "valid_targets_min": 2574 }, { "epoch": 3.260497000856898, "grad_norm": 0.5480095421683794, "learning_rate": 2.5803648954886526e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.07922104001045227, "step": 3805, "valid_targets_mean": 4847.6, "valid_targets_min": 1832 }, { "epoch": 3.2647814910025708, "grad_norm": 0.4563494451988351, "learning_rate": 2.5762743273085642e-05, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.07653181999921799, "step": 3810, "valid_targets_mean": 5683.8, "valid_targets_min": 2964 }, { "epoch": 3.2690659811482434, "grad_norm": 0.5664265801776952, "learning_rate": 2.5721811285100094e-05, "loss": 0.165, "loss_nan_ranks": 0, "loss_rank_avg": 0.08541962504386902, "step": 3815, "valid_targets_mean": 4073.6, "valid_targets_min": 992 }, { "epoch": 3.273350471293916, "grad_norm": 0.506078224016259, "learning_rate": 2.5680853177779156e-05, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.11393250524997711, "step": 3820, "valid_targets_mean": 6029.9, "valid_targets_min": 1457 }, { "epoch": 3.2776349614395888, "grad_norm": 0.494273020347569, "learning_rate": 2.563986913809134e-05, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.06963160634040833, "step": 3825, "valid_targets_mean": 4817.8, "valid_targets_min": 1059 }, { "epoch": 3.2819194515852614, "grad_norm": 0.4941550710602732, "learning_rate": 2.5598859353123544e-05, "loss": 0.2005, "loss_nan_ranks": 0, "loss_rank_avg": 0.10108497738838196, "step": 3830, "valid_targets_mean": 4969.1, "valid_targets_min": 937 }, { "epoch": 3.286203941730934, "grad_norm": 0.44118797019685824, "learning_rate": 2.5557824010080167e-05, "loss": 0.1788, "loss_nan_ranks": 0, "loss_rank_avg": 0.07035285234451294, "step": 3835, "valid_targets_mean": 5435.5, "valid_targets_min": 2621 }, { "epoch": 3.290488431876607, "grad_norm": 0.535660164763162, "learning_rate": 2.5516763296282304e-05, "loss": 0.1721, "loss_nan_ranks": 0, "loss_rank_avg": 0.08199736475944519, "step": 3840, "valid_targets_mean": 5702.1, "valid_targets_min": 2302 }, { "epoch": 3.2947729220222794, "grad_norm": 0.5406302387494281, "learning_rate": 2.5475677399166846e-05, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.08630575984716415, "step": 3845, "valid_targets_mean": 5694.1, "valid_targets_min": 1559 }, { "epoch": 3.299057412167952, "grad_norm": 0.5368623601343584, "learning_rate": 2.5434566506285652e-05, "loss": 0.1781, "loss_nan_ranks": 0, "loss_rank_avg": 0.0820312350988388, "step": 3850, "valid_targets_mean": 4866.5, "valid_targets_min": 2259 }, { "epoch": 3.303341902313625, "grad_norm": 0.42391830685772136, "learning_rate": 2.5393430805304684e-05, "loss": 0.1656, "loss_nan_ranks": 0, "loss_rank_avg": 0.07458534836769104, "step": 3855, "valid_targets_mean": 6219.2, "valid_targets_min": 4199 }, { "epoch": 3.3076263924592975, "grad_norm": 0.46723573532937834, "learning_rate": 2.5352270484003136e-05, "loss": 0.1719, "loss_nan_ranks": 0, "loss_rank_avg": 0.06834311783313751, "step": 3860, "valid_targets_mean": 4890.8, "valid_targets_min": 1499 }, { "epoch": 3.31191088260497, "grad_norm": 0.5042670913751731, "learning_rate": 2.5311085730272615e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.08892189711332321, "step": 3865, "valid_targets_mean": 5347.4, "valid_targets_min": 3761 }, { "epoch": 3.316195372750643, "grad_norm": 0.5146453940010698, "learning_rate": 2.5269876732116232e-05, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.08683112263679504, "step": 3870, "valid_targets_mean": 4728.5, "valid_targets_min": 1387 }, { "epoch": 3.3204798628963155, "grad_norm": 0.5179841404789549, "learning_rate": 2.522864367764779e-05, "loss": 0.1802, "loss_nan_ranks": 0, "loss_rank_avg": 0.0970543771982193, "step": 3875, "valid_targets_mean": 5566.1, "valid_targets_min": 1279 }, { "epoch": 3.324764353041988, "grad_norm": 0.5586468052716015, "learning_rate": 2.5187386755090896e-05, "loss": 0.1941, "loss_nan_ranks": 0, "loss_rank_avg": 0.10074944794178009, "step": 3880, "valid_targets_mean": 4139.8, "valid_targets_min": 1357 }, { "epoch": 3.329048843187661, "grad_norm": 0.5151397548165649, "learning_rate": 2.5146106152778123e-05, "loss": 0.1783, "loss_nan_ranks": 0, "loss_rank_avg": 0.08319426327943802, "step": 3885, "valid_targets_mean": 5424.5, "valid_targets_min": 2426 }, { "epoch": 3.3333333333333335, "grad_norm": 0.4720092194356925, "learning_rate": 2.5104802059150116e-05, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.07055439800024033, "step": 3890, "valid_targets_mean": 5038.0, "valid_targets_min": 1381 }, { "epoch": 3.337617823479006, "grad_norm": 0.5657582007478067, "learning_rate": 2.506347466275479e-05, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.09392206370830536, "step": 3895, "valid_targets_mean": 3641.5, "valid_targets_min": 810 }, { "epoch": 3.341902313624679, "grad_norm": 0.46332448819773575, "learning_rate": 2.5022124152246408e-05, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.08185388147830963, "step": 3900, "valid_targets_mean": 5194.2, "valid_targets_min": 1295 }, { "epoch": 3.3461868037703515, "grad_norm": 0.5276021301125949, "learning_rate": 2.4980750716384742e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.11507555842399597, "step": 3905, "valid_targets_mean": 5921.0, "valid_targets_min": 3081 }, { "epoch": 3.350471293916024, "grad_norm": 0.5243579270007013, "learning_rate": 2.4939354544034227e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.11897942423820496, "step": 3910, "valid_targets_mean": 5501.2, "valid_targets_min": 2765 }, { "epoch": 3.354755784061697, "grad_norm": 0.4397898226348528, "learning_rate": 2.48979358241631e-05, "loss": 0.1744, "loss_nan_ranks": 0, "loss_rank_avg": 0.08484429121017456, "step": 3915, "valid_targets_mean": 6601.0, "valid_targets_min": 4025 }, { "epoch": 3.3590402742073695, "grad_norm": 0.48471277085423436, "learning_rate": 2.4856494745842494e-05, "loss": 0.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.09149546921253204, "step": 3920, "valid_targets_mean": 5834.6, "valid_targets_min": 2135 }, { "epoch": 3.363324764353042, "grad_norm": 0.640251930186407, "learning_rate": 2.481503149824563e-05, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.09592543542385101, "step": 3925, "valid_targets_mean": 5464.4, "valid_targets_min": 2672 }, { "epoch": 3.367609254498715, "grad_norm": 0.7077370709133005, "learning_rate": 2.4773546270646924e-05, "loss": 0.184, "loss_nan_ranks": 0, "loss_rank_avg": 0.08654675632715225, "step": 3930, "valid_targets_mean": 3764.9, "valid_targets_min": 1305 }, { "epoch": 3.371893744644387, "grad_norm": 0.5667813121104889, "learning_rate": 2.4732039252421124e-05, "loss": 0.1802, "loss_nan_ranks": 0, "loss_rank_avg": 0.10520567744970322, "step": 3935, "valid_targets_mean": 4461.2, "valid_targets_min": 1390 }, { "epoch": 3.3761782347900597, "grad_norm": 0.5242448683415644, "learning_rate": 2.4690510633042434e-05, "loss": 0.1713, "loss_nan_ranks": 0, "loss_rank_avg": 0.08278533816337585, "step": 3940, "valid_targets_mean": 4752.5, "valid_targets_min": 2392 }, { "epoch": 3.3804627249357324, "grad_norm": 0.5049433307182706, "learning_rate": 2.46489606020837e-05, "loss": 0.1803, "loss_nan_ranks": 0, "loss_rank_avg": 0.08539880812168121, "step": 3945, "valid_targets_mean": 4561.8, "valid_targets_min": 1711 }, { "epoch": 3.384747215081405, "grad_norm": 0.5227073441087726, "learning_rate": 2.4607389349215486e-05, "loss": 0.1808, "loss_nan_ranks": 0, "loss_rank_avg": 0.09328305721282959, "step": 3950, "valid_targets_mean": 5030.6, "valid_targets_min": 2456 }, { "epoch": 3.3890317052270778, "grad_norm": 0.5292754389388692, "learning_rate": 2.456579706420522e-05, "loss": 0.1782, "loss_nan_ranks": 0, "loss_rank_avg": 0.0860356017947197, "step": 3955, "valid_targets_mean": 4216.2, "valid_targets_min": 2060 }, { "epoch": 3.3933161953727504, "grad_norm": 0.4865013112852646, "learning_rate": 2.4524183936916375e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.10694333910942078, "step": 3960, "valid_targets_mean": 5631.4, "valid_targets_min": 3043 }, { "epoch": 3.397600685518423, "grad_norm": 0.44020607224044916, "learning_rate": 2.4482550157307535e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.07197045534849167, "step": 3965, "valid_targets_mean": 5408.6, "valid_targets_min": 3985 }, { "epoch": 3.4018851756640958, "grad_norm": 0.5010961069712251, "learning_rate": 2.4440895915431564e-05, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.07832053303718567, "step": 3970, "valid_targets_mean": 4119.0, "valid_targets_min": 1678 }, { "epoch": 3.4061696658097684, "grad_norm": 0.460386431994602, "learning_rate": 2.4399221401434744e-05, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.08432082831859589, "step": 3975, "valid_targets_mean": 6040.0, "valid_targets_min": 2483 }, { "epoch": 3.410454155955441, "grad_norm": 0.46018138510892553, "learning_rate": 2.4357526805555898e-05, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.07811066508293152, "step": 3980, "valid_targets_mean": 6039.2, "valid_targets_min": 2097 }, { "epoch": 3.4147386461011138, "grad_norm": 0.44313847646961696, "learning_rate": 2.431581231812551e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.08324681967496872, "step": 3985, "valid_targets_mean": 6093.0, "valid_targets_min": 1795 }, { "epoch": 3.4190231362467864, "grad_norm": 0.49476268172484367, "learning_rate": 2.4274078129564865e-05, "loss": 0.1642, "loss_nan_ranks": 0, "loss_rank_avg": 0.08022307604551315, "step": 3990, "valid_targets_mean": 4712.8, "valid_targets_min": 2631 }, { "epoch": 3.423307626392459, "grad_norm": 0.5552227552355836, "learning_rate": 2.4232324430385186e-05, "loss": 0.1876, "loss_nan_ranks": 0, "loss_rank_avg": 0.1327175348997116, "step": 3995, "valid_targets_mean": 4551.5, "valid_targets_min": 1184 }, { "epoch": 3.427592116538132, "grad_norm": 0.5185839985435154, "learning_rate": 2.4190551411186772e-05, "loss": 0.1896, "loss_nan_ranks": 0, "loss_rank_avg": 0.08617275208234787, "step": 4000, "valid_targets_mean": 4747.9, "valid_targets_min": 1219 }, { "epoch": 3.4318766066838045, "grad_norm": 0.4709991819622267, "learning_rate": 2.414875926265809e-05, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.07815124839544296, "step": 4005, "valid_targets_mean": 5581.9, "valid_targets_min": 2606 }, { "epoch": 3.436161096829477, "grad_norm": 0.48407163673156856, "learning_rate": 2.410694817557495e-05, "loss": 0.1822, "loss_nan_ranks": 0, "loss_rank_avg": 0.1021660715341568, "step": 4010, "valid_targets_mean": 5507.0, "valid_targets_min": 2411 }, { "epoch": 3.44044558697515, "grad_norm": 0.5232737652771369, "learning_rate": 2.406511834079961e-05, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.07770241796970367, "step": 4015, "valid_targets_mean": 4428.8, "valid_targets_min": 996 }, { "epoch": 3.4447300771208225, "grad_norm": 0.5393197148717728, "learning_rate": 2.4023269949279896e-05, "loss": 0.1895, "loss_nan_ranks": 0, "loss_rank_avg": 0.10861536860466003, "step": 4020, "valid_targets_mean": 5138.0, "valid_targets_min": 854 }, { "epoch": 3.449014567266495, "grad_norm": 0.4959778784971376, "learning_rate": 2.398140319204836e-05, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.0765412300825119, "step": 4025, "valid_targets_mean": 4376.9, "valid_targets_min": 2131 }, { "epoch": 3.453299057412168, "grad_norm": 0.44539828071435855, "learning_rate": 2.393951826022139e-05, "loss": 0.1772, "loss_nan_ranks": 0, "loss_rank_avg": 0.0800006315112114, "step": 4030, "valid_targets_mean": 6357.0, "valid_targets_min": 2336 }, { "epoch": 3.4575835475578405, "grad_norm": 0.5009575823756433, "learning_rate": 2.3897615344998316e-05, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.0751371756196022, "step": 4035, "valid_targets_mean": 4151.1, "valid_targets_min": 1054 }, { "epoch": 3.461868037703513, "grad_norm": 0.5659099414288352, "learning_rate": 2.38556946376606e-05, "loss": 0.1919, "loss_nan_ranks": 0, "loss_rank_avg": 0.08233688771724701, "step": 4040, "valid_targets_mean": 4852.5, "valid_targets_min": 3043 }, { "epoch": 3.466152527849186, "grad_norm": 0.48964486978436755, "learning_rate": 2.381375632957088e-05, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.09233547747135162, "step": 4045, "valid_targets_mean": 6505.9, "valid_targets_min": 1066 }, { "epoch": 3.4704370179948585, "grad_norm": 0.6366684492336043, "learning_rate": 2.377180061217217e-05, "loss": 0.1809, "loss_nan_ranks": 0, "loss_rank_avg": 0.10365661233663559, "step": 4050, "valid_targets_mean": 5608.6, "valid_targets_min": 2391 }, { "epoch": 3.474721508140531, "grad_norm": 0.5178869224071108, "learning_rate": 2.372982767698694e-05, "loss": 0.1813, "loss_nan_ranks": 0, "loss_rank_avg": 0.09731529653072357, "step": 4055, "valid_targets_mean": 5259.2, "valid_targets_min": 3468 }, { "epoch": 3.479005998286204, "grad_norm": 0.4979000344639998, "learning_rate": 2.3687837715616265e-05, "loss": 0.1836, "loss_nan_ranks": 0, "loss_rank_avg": 0.09686636924743652, "step": 4060, "valid_targets_mean": 5191.6, "valid_targets_min": 2305 }, { "epoch": 3.4832904884318765, "grad_norm": 0.4673954502395025, "learning_rate": 2.3645830919738934e-05, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.06930539011955261, "step": 4065, "valid_targets_mean": 5102.1, "valid_targets_min": 1840 }, { "epoch": 3.487574978577549, "grad_norm": 0.4603399923475969, "learning_rate": 2.3603807481110582e-05, "loss": 0.1849, "loss_nan_ranks": 0, "loss_rank_avg": 0.07954011112451553, "step": 4070, "valid_targets_mean": 4994.6, "valid_targets_min": 2915 }, { "epoch": 3.491859468723222, "grad_norm": 0.4598435838646931, "learning_rate": 2.3561767591562838e-05, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.07119995355606079, "step": 4075, "valid_targets_mean": 5935.2, "valid_targets_min": 3691 }, { "epoch": 3.4961439588688945, "grad_norm": 0.518348370256928, "learning_rate": 2.3519711443002403e-05, "loss": 0.1743, "loss_nan_ranks": 0, "loss_rank_avg": 0.08827964216470718, "step": 4080, "valid_targets_mean": 5031.9, "valid_targets_min": 1483 }, { "epoch": 3.500428449014567, "grad_norm": 0.45898367296651266, "learning_rate": 2.3477639227410203e-05, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.07615832984447479, "step": 4085, "valid_targets_mean": 4248.0, "valid_targets_min": 1181 }, { "epoch": 3.50471293916024, "grad_norm": 0.5048500740270604, "learning_rate": 2.3435551136840516e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.08330333232879639, "step": 4090, "valid_targets_mean": 4459.8, "valid_targets_min": 2015 }, { "epoch": 3.5089974293059125, "grad_norm": 0.5215915294355933, "learning_rate": 2.3393447363420086e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.1037408709526062, "step": 4095, "valid_targets_mean": 5052.2, "valid_targets_min": 3269 }, { "epoch": 3.513281919451585, "grad_norm": 0.4962196427584831, "learning_rate": 2.335132809934723e-05, "loss": 0.1865, "loss_nan_ranks": 0, "loss_rank_avg": 0.06860017776489258, "step": 4100, "valid_targets_mean": 4654.9, "valid_targets_min": 1920 }, { "epoch": 3.517566409597258, "grad_norm": 0.489981385343179, "learning_rate": 2.3309193536891005e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.08288254588842392, "step": 4105, "valid_targets_mean": 5823.2, "valid_targets_min": 1714 }, { "epoch": 3.5218508997429305, "grad_norm": 0.656955220664152, "learning_rate": 2.3267043868390294e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.08202258497476578, "step": 4110, "valid_targets_mean": 4970.4, "valid_targets_min": 2605 }, { "epoch": 3.526135389888603, "grad_norm": 0.5037309614923813, "learning_rate": 2.3224879286252912e-05, "loss": 0.1812, "loss_nan_ranks": 0, "loss_rank_avg": 0.1043175458908081, "step": 4115, "valid_targets_mean": 5029.6, "valid_targets_min": 2077 }, { "epoch": 3.530419880034276, "grad_norm": 0.5175047493676703, "learning_rate": 2.3182699982954798e-05, "loss": 0.174, "loss_nan_ranks": 0, "loss_rank_avg": 0.07466578483581543, "step": 4120, "valid_targets_mean": 4483.4, "valid_targets_min": 2113 }, { "epoch": 3.5347043701799485, "grad_norm": 0.47635693359402775, "learning_rate": 2.3140506151039056e-05, "loss": 0.1746, "loss_nan_ranks": 0, "loss_rank_avg": 0.09035299718379974, "step": 4125, "valid_targets_mean": 5929.0, "valid_targets_min": 3412 }, { "epoch": 3.538988860325621, "grad_norm": 0.4565464264321229, "learning_rate": 2.309829798311512e-05, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.0775737538933754, "step": 4130, "valid_targets_mean": 5772.6, "valid_targets_min": 1234 }, { "epoch": 3.543273350471294, "grad_norm": 0.46993348068850305, "learning_rate": 2.3056075671857873e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.08100612461566925, "step": 4135, "valid_targets_mean": 4891.2, "valid_targets_min": 1548 }, { "epoch": 3.5475578406169666, "grad_norm": 0.5042039449397279, "learning_rate": 2.3013839410006752e-05, "loss": 0.1701, "loss_nan_ranks": 0, "loss_rank_avg": 0.10945829749107361, "step": 4140, "valid_targets_mean": 4754.5, "valid_targets_min": 1194 }, { "epoch": 3.551842330762639, "grad_norm": 0.5219428536509176, "learning_rate": 2.2971589390364883e-05, "loss": 0.1886, "loss_nan_ranks": 0, "loss_rank_avg": 0.08812487125396729, "step": 4145, "valid_targets_mean": 4773.4, "valid_targets_min": 2528 }, { "epoch": 3.556126820908312, "grad_norm": 0.4595032270725784, "learning_rate": 2.2929325805798193e-05, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.09251895546913147, "step": 4150, "valid_targets_mean": 5433.2, "valid_targets_min": 2510 }, { "epoch": 3.5604113110539846, "grad_norm": 0.592306139102451, "learning_rate": 2.288704884923454e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.09715113043785095, "step": 4155, "valid_targets_mean": 4493.5, "valid_targets_min": 229 }, { "epoch": 3.5646958011996572, "grad_norm": 0.4670380137898987, "learning_rate": 2.2844758713662792e-05, "loss": 0.1692, "loss_nan_ranks": 0, "loss_rank_avg": 0.07353829592466354, "step": 4160, "valid_targets_mean": 6750.5, "valid_targets_min": 2466 }, { "epoch": 3.56898029134533, "grad_norm": 0.5225853631870525, "learning_rate": 2.2802455592132016e-05, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.0953027755022049, "step": 4165, "valid_targets_mean": 5718.2, "valid_targets_min": 3231 }, { "epoch": 3.5732647814910026, "grad_norm": 0.4638223398798671, "learning_rate": 2.2760139677750535e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.09025826305150986, "step": 4170, "valid_targets_mean": 5769.9, "valid_targets_min": 2480 }, { "epoch": 3.5775492716366752, "grad_norm": 0.5579887756037205, "learning_rate": 2.2717811163685083e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.07685058563947678, "step": 4175, "valid_targets_mean": 3841.8, "valid_targets_min": 908 }, { "epoch": 3.581833761782348, "grad_norm": 0.4948096539474111, "learning_rate": 2.267547024315989e-05, "loss": 0.1773, "loss_nan_ranks": 0, "loss_rank_avg": 0.08701218664646149, "step": 4180, "valid_targets_mean": 5586.2, "valid_targets_min": 2833 }, { "epoch": 3.5861182519280206, "grad_norm": 0.4838736011672868, "learning_rate": 2.2633117109455842e-05, "loss": 0.1777, "loss_nan_ranks": 0, "loss_rank_avg": 0.09145478904247284, "step": 4185, "valid_targets_mean": 6145.4, "valid_targets_min": 2143 }, { "epoch": 3.5904027420736933, "grad_norm": 0.45606871426482026, "learning_rate": 2.259075195590957e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.07948420941829681, "step": 4190, "valid_targets_mean": 5401.1, "valid_targets_min": 2076 }, { "epoch": 3.594687232219366, "grad_norm": 0.5025562342810775, "learning_rate": 2.2548374975912566e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.07993195205926895, "step": 4195, "valid_targets_mean": 4961.0, "valid_targets_min": 1661 }, { "epoch": 3.5989717223650386, "grad_norm": 0.505770776087417, "learning_rate": 2.250598636291032e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.08299499750137329, "step": 4200, "valid_targets_mean": 4817.9, "valid_targets_min": 1747 }, { "epoch": 3.6032562125107113, "grad_norm": 0.4954913757966641, "learning_rate": 2.2463586310401415e-05, "loss": 0.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.08894240856170654, "step": 4205, "valid_targets_mean": 4411.9, "valid_targets_min": 1142 }, { "epoch": 3.607540702656384, "grad_norm": 0.5418588144667075, "learning_rate": 2.242117501193666e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.11070725321769714, "step": 4210, "valid_targets_mean": 5323.1, "valid_targets_min": 1367 }, { "epoch": 3.6118251928020566, "grad_norm": 0.531263626146356, "learning_rate": 2.2378752661118196e-05, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.08583134412765503, "step": 4215, "valid_targets_mean": 4969.5, "valid_targets_min": 1849 }, { "epoch": 3.6161096829477293, "grad_norm": 0.5612122432997662, "learning_rate": 2.233631945159862e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.08974435925483704, "step": 4220, "valid_targets_mean": 4273.5, "valid_targets_min": 2028 }, { "epoch": 3.620394173093402, "grad_norm": 0.48142060702080514, "learning_rate": 2.2293875577080096e-05, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.07660025358200073, "step": 4225, "valid_targets_mean": 3994.6, "valid_targets_min": 953 }, { "epoch": 3.6246786632390746, "grad_norm": 0.4848066208026919, "learning_rate": 2.2251421231313476e-05, "loss": 0.2024, "loss_nan_ranks": 0, "loss_rank_avg": 0.07478651404380798, "step": 4230, "valid_targets_mean": 5517.0, "valid_targets_min": 3239 }, { "epoch": 3.6289631533847473, "grad_norm": 0.49899057473509, "learning_rate": 2.2208956608097404e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.06353067606687546, "step": 4235, "valid_targets_mean": 5502.9, "valid_targets_min": 2124 }, { "epoch": 3.63324764353042, "grad_norm": 0.5813828678411174, "learning_rate": 2.2166481901277445e-05, "loss": 0.1771, "loss_nan_ranks": 0, "loss_rank_avg": 0.1088082492351532, "step": 4240, "valid_targets_mean": 3780.8, "valid_targets_min": 1875 }, { "epoch": 3.6375321336760926, "grad_norm": 0.4817039168502182, "learning_rate": 2.2123997304745197e-05, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.09596549719572067, "step": 4245, "valid_targets_mean": 4660.6, "valid_targets_min": 2130 }, { "epoch": 3.6418166238217653, "grad_norm": 0.4792499434827214, "learning_rate": 2.20815030124374e-05, "loss": 0.1983, "loss_nan_ranks": 0, "loss_rank_avg": 0.08193084597587585, "step": 4250, "valid_targets_mean": 4666.0, "valid_targets_min": 2073 }, { "epoch": 3.646101113967438, "grad_norm": 0.5304247034774922, "learning_rate": 2.2038999218335052e-05, "loss": 0.1756, "loss_nan_ranks": 0, "loss_rank_avg": 0.11344555020332336, "step": 4255, "valid_targets_mean": 4205.0, "valid_targets_min": 1741 }, { "epoch": 3.6503856041131106, "grad_norm": 0.561201430702449, "learning_rate": 2.1996486116462518e-05, "loss": 0.1944, "loss_nan_ranks": 0, "loss_rank_avg": 0.10015340894460678, "step": 4260, "valid_targets_mean": 4303.4, "valid_targets_min": 976 }, { "epoch": 3.6546700942587833, "grad_norm": 0.5025165588665476, "learning_rate": 2.1953963900886678e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.0987139567732811, "step": 4265, "valid_targets_mean": 6982.6, "valid_targets_min": 3682 }, { "epoch": 3.658954584404456, "grad_norm": 0.4734958218505094, "learning_rate": 2.1911432765715984e-05, "loss": 0.1903, "loss_nan_ranks": 0, "loss_rank_avg": 0.09380441159009933, "step": 4270, "valid_targets_mean": 4911.9, "valid_targets_min": 2569 }, { "epoch": 3.6632390745501286, "grad_norm": 0.47972395955451463, "learning_rate": 2.186889290509963e-05, "loss": 0.1784, "loss_nan_ranks": 0, "loss_rank_avg": 0.08934134244918823, "step": 4275, "valid_targets_mean": 5794.8, "valid_targets_min": 1794 }, { "epoch": 3.6675235646958013, "grad_norm": 0.5054146734195408, "learning_rate": 2.1826344513226612e-05, "loss": 0.1784, "loss_nan_ranks": 0, "loss_rank_avg": 0.0747838243842125, "step": 4280, "valid_targets_mean": 4473.8, "valid_targets_min": 1046 }, { "epoch": 3.671808054841474, "grad_norm": 0.48848277806211415, "learning_rate": 2.178378778432491e-05, "loss": 0.1772, "loss_nan_ranks": 0, "loss_rank_avg": 0.07787490636110306, "step": 4285, "valid_targets_mean": 5002.2, "valid_targets_min": 2578 }, { "epoch": 3.6760925449871467, "grad_norm": 0.5569673045876135, "learning_rate": 2.174122291266052e-05, "loss": 0.183, "loss_nan_ranks": 0, "loss_rank_avg": 0.10725502669811249, "step": 4290, "valid_targets_mean": 5099.5, "valid_targets_min": 2687 }, { "epoch": 3.6803770351328193, "grad_norm": 0.5166032053971452, "learning_rate": 2.169865009253663e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.09015043079853058, "step": 4295, "valid_targets_mean": 5599.1, "valid_targets_min": 1040 }, { "epoch": 3.684661525278492, "grad_norm": 0.5709661002249621, "learning_rate": 2.1656069518292724e-05, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.10100851207971573, "step": 4300, "valid_targets_mean": 4439.0, "valid_targets_min": 1128 }, { "epoch": 3.6889460154241647, "grad_norm": 0.543802259685694, "learning_rate": 2.161348138430365e-05, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.0801519826054573, "step": 4305, "valid_targets_mean": 4878.2, "valid_targets_min": 1294 }, { "epoch": 3.6932305055698373, "grad_norm": 0.5570095437587615, "learning_rate": 2.157088588497879e-05, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.08337944746017456, "step": 4310, "valid_targets_mean": 3964.8, "valid_targets_min": 533 }, { "epoch": 3.69751499571551, "grad_norm": 0.453897962207074, "learning_rate": 2.1528283214761143e-05, "loss": 0.1721, "loss_nan_ranks": 0, "loss_rank_avg": 0.0844380259513855, "step": 4315, "valid_targets_mean": 5618.8, "valid_targets_min": 2713 }, { "epoch": 3.7017994858611827, "grad_norm": 0.5264838129574774, "learning_rate": 2.148567356812644e-05, "loss": 0.1788, "loss_nan_ranks": 0, "loss_rank_avg": 0.09211684763431549, "step": 4320, "valid_targets_mean": 4739.2, "valid_targets_min": 797 }, { "epoch": 3.7060839760068554, "grad_norm": 0.5416369851840257, "learning_rate": 2.1443057139582248e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.07441074401140213, "step": 4325, "valid_targets_mean": 4180.2, "valid_targets_min": 1716 }, { "epoch": 3.710368466152528, "grad_norm": 0.5233842699548993, "learning_rate": 2.140043412366711e-05, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.09138879179954529, "step": 4330, "valid_targets_mean": 5340.5, "valid_targets_min": 2420 }, { "epoch": 3.7146529562982007, "grad_norm": 0.5027330097368046, "learning_rate": 2.135780471494964e-05, "loss": 0.1731, "loss_nan_ranks": 0, "loss_rank_avg": 0.08350911736488342, "step": 4335, "valid_targets_mean": 5366.6, "valid_targets_min": 1678 }, { "epoch": 3.7189374464438734, "grad_norm": 0.47526774562585344, "learning_rate": 2.1315169108027618e-05, "loss": 0.1812, "loss_nan_ranks": 0, "loss_rank_avg": 0.07638335227966309, "step": 4340, "valid_targets_mean": 5456.4, "valid_targets_min": 1939 }, { "epoch": 3.723221936589546, "grad_norm": 0.5042053368330688, "learning_rate": 2.127252749752713e-05, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.09122496843338013, "step": 4345, "valid_targets_mean": 5834.4, "valid_targets_min": 1449 }, { "epoch": 3.7275064267352187, "grad_norm": 0.5289307926314227, "learning_rate": 2.122988007810166e-05, "loss": 0.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.09580802172422409, "step": 4350, "valid_targets_mean": 5320.8, "valid_targets_min": 3011 }, { "epoch": 3.7317909168808914, "grad_norm": 0.4576457670282547, "learning_rate": 2.1187227044431218e-05, "loss": 0.168, "loss_nan_ranks": 0, "loss_rank_avg": 0.05943462625145912, "step": 4355, "valid_targets_mean": 4858.8, "valid_targets_min": 1578 }, { "epoch": 3.736075407026564, "grad_norm": 0.45540481367302393, "learning_rate": 2.1144568591221435e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.08127421140670776, "step": 4360, "valid_targets_mean": 5734.1, "valid_targets_min": 2680 }, { "epoch": 3.7403598971722367, "grad_norm": 0.5362612179693383, "learning_rate": 2.1101904913202683e-05, "loss": 0.1809, "loss_nan_ranks": 0, "loss_rank_avg": 0.11337935924530029, "step": 4365, "valid_targets_mean": 5713.0, "valid_targets_min": 3480 }, { "epoch": 3.7446443873179094, "grad_norm": 0.4704003263016836, "learning_rate": 2.1059236205129193e-05, "loss": 0.1832, "loss_nan_ranks": 0, "loss_rank_avg": 0.08135171979665756, "step": 4370, "valid_targets_mean": 6026.6, "valid_targets_min": 3211 }, { "epoch": 3.748928877463582, "grad_norm": 0.5097814181014321, "learning_rate": 2.101656266177814e-05, "loss": 0.1795, "loss_nan_ranks": 0, "loss_rank_avg": 0.07321173697710037, "step": 4375, "valid_targets_mean": 4055.1, "valid_targets_min": 1062 }, { "epoch": 3.7532133676092547, "grad_norm": 0.5058831165511345, "learning_rate": 2.0973884477948788e-05, "loss": 0.1721, "loss_nan_ranks": 0, "loss_rank_avg": 0.07657093554735184, "step": 4380, "valid_targets_mean": 5092.8, "valid_targets_min": 2508 }, { "epoch": 3.7574978577549274, "grad_norm": 0.48377529739196745, "learning_rate": 2.093120184846158e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.07396461069583893, "step": 4385, "valid_targets_mean": 4718.1, "valid_targets_min": 3365 }, { "epoch": 3.7617823479006, "grad_norm": 0.5858845859525321, "learning_rate": 2.0888514968157242e-05, "loss": 0.1799, "loss_nan_ranks": 0, "loss_rank_avg": 0.11814798414707184, "step": 4390, "valid_targets_mean": 5390.4, "valid_targets_min": 3563 }, { "epoch": 3.7660668380462727, "grad_norm": 0.5009081909970391, "learning_rate": 2.0845824031895922e-05, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.07869275659322739, "step": 4395, "valid_targets_mean": 5265.8, "valid_targets_min": 2004 }, { "epoch": 3.7703513281919454, "grad_norm": 0.46579194546844566, "learning_rate": 2.080312923455627e-05, "loss": 0.1735, "loss_nan_ranks": 0, "loss_rank_avg": 0.06215429678559303, "step": 4400, "valid_targets_mean": 5621.1, "valid_targets_min": 2765 }, { "epoch": 3.774635818337618, "grad_norm": 0.4811822376668833, "learning_rate": 2.0760430771034567e-05, "loss": 0.1743, "loss_nan_ranks": 0, "loss_rank_avg": 0.07595115900039673, "step": 4405, "valid_targets_mean": 5120.1, "valid_targets_min": 1484 }, { "epoch": 3.7789203084832907, "grad_norm": 0.5625193799505521, "learning_rate": 2.0717728836243828e-05, "loss": 0.1593, "loss_nan_ranks": 0, "loss_rank_avg": 0.07109188288450241, "step": 4410, "valid_targets_mean": 4732.2, "valid_targets_min": 2687 }, { "epoch": 3.7832047986289634, "grad_norm": 0.5103516926344571, "learning_rate": 2.0675023625112908e-05, "loss": 0.169, "loss_nan_ranks": 0, "loss_rank_avg": 0.10274773091077805, "step": 4415, "valid_targets_mean": 5381.0, "valid_targets_min": 3303 }, { "epoch": 3.787489288774636, "grad_norm": 0.5353559159650585, "learning_rate": 2.063231533258563e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.09648248553276062, "step": 4420, "valid_targets_mean": 4760.2, "valid_targets_min": 2482 }, { "epoch": 3.7917737789203088, "grad_norm": 0.5362956724018828, "learning_rate": 2.058960415361988e-05, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.0884857177734375, "step": 4425, "valid_targets_mean": 4564.9, "valid_targets_min": 2484 }, { "epoch": 3.796058269065981, "grad_norm": 0.6503106392647596, "learning_rate": 2.0546890283186717e-05, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.10990839451551437, "step": 4430, "valid_targets_mean": 3900.4, "valid_targets_min": 2609 }, { "epoch": 3.8003427592116537, "grad_norm": 0.5916435853895476, "learning_rate": 2.050417391626948e-05, "loss": 0.1708, "loss_nan_ranks": 0, "loss_rank_avg": 0.08456003665924072, "step": 4435, "valid_targets_mean": 7036.9, "valid_targets_min": 1318 }, { "epoch": 3.8046272493573263, "grad_norm": 0.5036276852885103, "learning_rate": 2.0461455247862912e-05, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.06545372307300568, "step": 4440, "valid_targets_mean": 4662.1, "valid_targets_min": 505 }, { "epoch": 3.808911739502999, "grad_norm": 0.44765849535218993, "learning_rate": 2.0418734472972262e-05, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.06430330872535706, "step": 4445, "valid_targets_mean": 4303.9, "valid_targets_min": 1532 }, { "epoch": 3.8131962296486717, "grad_norm": 0.5222825963604962, "learning_rate": 2.0376011786612396e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.08797872811555862, "step": 4450, "valid_targets_mean": 4519.4, "valid_targets_min": 2156 }, { "epoch": 3.8174807197943443, "grad_norm": 0.49236298315659555, "learning_rate": 2.0333287383806907e-05, "loss": 0.1911, "loss_nan_ranks": 0, "loss_rank_avg": 0.08118836581707001, "step": 4455, "valid_targets_mean": 4663.1, "valid_targets_min": 2595 }, { "epoch": 3.821765209940017, "grad_norm": 0.4782325683501973, "learning_rate": 2.029056145958721e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.08120326697826385, "step": 4460, "valid_targets_mean": 6560.8, "valid_targets_min": 3023 }, { "epoch": 3.8260497000856897, "grad_norm": 0.473132007473985, "learning_rate": 2.0247834208991684e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.07763845473527908, "step": 4465, "valid_targets_mean": 5648.8, "valid_targets_min": 2787 }, { "epoch": 3.8303341902313623, "grad_norm": 0.5139351501622985, "learning_rate": 2.0205105827064736e-05, "loss": 0.169, "loss_nan_ranks": 0, "loss_rank_avg": 0.09254143387079239, "step": 4470, "valid_targets_mean": 5020.5, "valid_targets_min": 2034 }, { "epoch": 3.834618680377035, "grad_norm": 0.5778317488055335, "learning_rate": 2.0162376508855978e-05, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.09841796010732651, "step": 4475, "valid_targets_mean": 4625.0, "valid_targets_min": 1509 }, { "epoch": 3.8389031705227077, "grad_norm": 0.48508807741509924, "learning_rate": 2.0119646449419265e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.09713976830244064, "step": 4480, "valid_targets_mean": 5486.1, "valid_targets_min": 1497 }, { "epoch": 3.8431876606683804, "grad_norm": 0.5020491833115472, "learning_rate": 2.0076915843811835e-05, "loss": 0.1842, "loss_nan_ranks": 0, "loss_rank_avg": 0.09118911623954773, "step": 4485, "valid_targets_mean": 4502.4, "valid_targets_min": 1301 }, { "epoch": 3.847472150814053, "grad_norm": 0.4907616526259011, "learning_rate": 2.0034184887093433e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.09922203421592712, "step": 4490, "valid_targets_mean": 5388.1, "valid_targets_min": 3170 }, { "epoch": 3.8517566409597257, "grad_norm": 0.4565291844177587, "learning_rate": 1.9991453774325402e-05, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.10273808240890503, "step": 4495, "valid_targets_mean": 6592.6, "valid_targets_min": 2004 }, { "epoch": 3.8560411311053984, "grad_norm": 0.5732545604455834, "learning_rate": 1.9948722700569795e-05, "loss": 0.199, "loss_nan_ranks": 0, "loss_rank_avg": 0.10075698792934418, "step": 4500, "valid_targets_mean": 3010.5, "valid_targets_min": 845 }, { "epoch": 3.860325621251071, "grad_norm": 0.4860731335191765, "learning_rate": 1.9905991860888496e-05, "loss": 0.1768, "loss_nan_ranks": 0, "loss_rank_avg": 0.08558526635169983, "step": 4505, "valid_targets_mean": 5031.2, "valid_targets_min": 3410 }, { "epoch": 3.8646101113967437, "grad_norm": 0.5088911251158567, "learning_rate": 1.9863261450342305e-05, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.06963960826396942, "step": 4510, "valid_targets_mean": 5028.4, "valid_targets_min": 1772 }, { "epoch": 3.8688946015424164, "grad_norm": 0.4879977625126342, "learning_rate": 1.9820531663990065e-05, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.07305698841810226, "step": 4515, "valid_targets_mean": 5932.9, "valid_targets_min": 1210 }, { "epoch": 3.873179091688089, "grad_norm": 0.5372417512132406, "learning_rate": 1.9777802696887783e-05, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.10021747648715973, "step": 4520, "valid_targets_mean": 5266.9, "valid_targets_min": 2822 }, { "epoch": 3.8774635818337617, "grad_norm": 0.4610327967140201, "learning_rate": 1.9735074744087733e-05, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.12863047420978546, "step": 4525, "valid_targets_mean": 7164.8, "valid_targets_min": 4651 }, { "epoch": 3.8817480719794344, "grad_norm": 0.5019450406903498, "learning_rate": 1.9692348000637527e-05, "loss": 0.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.07446804642677307, "step": 4530, "valid_targets_mean": 5320.9, "valid_targets_min": 3110 }, { "epoch": 3.886032562125107, "grad_norm": 0.5112673713240492, "learning_rate": 1.9649622661579274e-05, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.09042879939079285, "step": 4535, "valid_targets_mean": 5653.9, "valid_targets_min": 1091 }, { "epoch": 3.8903170522707797, "grad_norm": 0.5369515631810194, "learning_rate": 1.9606898921948683e-05, "loss": 0.1977, "loss_nan_ranks": 0, "loss_rank_avg": 0.0947985053062439, "step": 4540, "valid_targets_mean": 4051.1, "valid_targets_min": 2694 }, { "epoch": 3.8946015424164524, "grad_norm": 0.5552773847133019, "learning_rate": 1.956417697677414e-05, "loss": 0.1771, "loss_nan_ranks": 0, "loss_rank_avg": 0.08706317096948624, "step": 4545, "valid_targets_mean": 4993.9, "valid_targets_min": 3037 }, { "epoch": 3.898886032562125, "grad_norm": 0.4915528438499653, "learning_rate": 1.9521457021075855e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.08254234492778778, "step": 4550, "valid_targets_mean": 5879.4, "valid_targets_min": 3345 }, { "epoch": 3.9031705227077977, "grad_norm": 0.5160133103456404, "learning_rate": 1.9478739249864962e-05, "loss": 0.1644, "loss_nan_ranks": 0, "loss_rank_avg": 0.10425172001123428, "step": 4555, "valid_targets_mean": 4621.1, "valid_targets_min": 1198 }, { "epoch": 3.9074550128534704, "grad_norm": 0.5000307732972977, "learning_rate": 1.9436023858142602e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.0853274017572403, "step": 4560, "valid_targets_mean": 4777.2, "valid_targets_min": 1683 }, { "epoch": 3.911739502999143, "grad_norm": 0.5068195746979115, "learning_rate": 1.9393311040899067e-05, "loss": 0.1847, "loss_nan_ranks": 0, "loss_rank_avg": 0.07205282896757126, "step": 4565, "valid_targets_mean": 5539.8, "valid_targets_min": 3387 }, { "epoch": 3.9160239931448158, "grad_norm": 0.4267534546807796, "learning_rate": 1.93506009931129e-05, "loss": 0.1688, "loss_nan_ranks": 0, "loss_rank_avg": 0.06260967999696732, "step": 4570, "valid_targets_mean": 5994.8, "valid_targets_min": 4569 }, { "epoch": 3.9203084832904884, "grad_norm": 0.5252719123556089, "learning_rate": 1.9307893909749994e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.09602794051170349, "step": 4575, "valid_targets_mean": 4688.0, "valid_targets_min": 3086 }, { "epoch": 3.924592973436161, "grad_norm": 0.537363202650325, "learning_rate": 1.9265189985762703e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.07901383191347122, "step": 4580, "valid_targets_mean": 4856.1, "valid_targets_min": 2446 }, { "epoch": 3.9288774635818338, "grad_norm": 0.4719462842604403, "learning_rate": 1.9222489416088975e-05, "loss": 0.1709, "loss_nan_ranks": 0, "loss_rank_avg": 0.07746100425720215, "step": 4585, "valid_targets_mean": 6851.2, "valid_targets_min": 5211 }, { "epoch": 3.9331619537275064, "grad_norm": 0.5353923548310513, "learning_rate": 1.917979239565145e-05, "loss": 0.1799, "loss_nan_ranks": 0, "loss_rank_avg": 0.08081245422363281, "step": 4590, "valid_targets_mean": 4776.4, "valid_targets_min": 1753 }, { "epoch": 3.937446443873179, "grad_norm": 0.5404284267622435, "learning_rate": 1.9137099119356545e-05, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.07720431685447693, "step": 4595, "valid_targets_mean": 5211.1, "valid_targets_min": 797 }, { "epoch": 3.9417309340188518, "grad_norm": 0.5867772663723523, "learning_rate": 1.9094409782093597e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.0957307517528534, "step": 4600, "valid_targets_mean": 3721.1, "valid_targets_min": 1406 }, { "epoch": 3.9460154241645244, "grad_norm": 0.5145554246504417, "learning_rate": 1.9051724578733962e-05, "loss": 0.177, "loss_nan_ranks": 0, "loss_rank_avg": 0.09897803515195847, "step": 4605, "valid_targets_mean": 6185.1, "valid_targets_min": 2822 }, { "epoch": 3.950299914310197, "grad_norm": 0.49010810880745426, "learning_rate": 1.9009043704130122e-05, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.09428513050079346, "step": 4610, "valid_targets_mean": 5483.1, "valid_targets_min": 2530 }, { "epoch": 3.95458440445587, "grad_norm": 0.4733695336444945, "learning_rate": 1.8966367353114807e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.08150522410869598, "step": 4615, "valid_targets_mean": 5887.5, "valid_targets_min": 2650 }, { "epoch": 3.9588688946015425, "grad_norm": 0.5422990185050677, "learning_rate": 1.892369572050008e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.09762519598007202, "step": 4620, "valid_targets_mean": 3828.2, "valid_targets_min": 1364 }, { "epoch": 3.963153384747215, "grad_norm": 0.48852927765073745, "learning_rate": 1.888102900107649e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.10224743187427521, "step": 4625, "valid_targets_mean": 5479.5, "valid_targets_min": 904 }, { "epoch": 3.967437874892888, "grad_norm": 0.5723550383231459, "learning_rate": 1.8838367389612132e-05, "loss": 0.1719, "loss_nan_ranks": 0, "loss_rank_avg": 0.10078905522823334, "step": 4630, "valid_targets_mean": 4667.5, "valid_targets_min": 2156 }, { "epoch": 3.9717223650385605, "grad_norm": 0.5944746392231771, "learning_rate": 1.879571108085181e-05, "loss": 0.1886, "loss_nan_ranks": 0, "loss_rank_avg": 0.09629759192466736, "step": 4635, "valid_targets_mean": 4048.5, "valid_targets_min": 1777 }, { "epoch": 3.976006855184233, "grad_norm": 0.5235308428167299, "learning_rate": 1.8753060269516098e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.08603832125663757, "step": 4640, "valid_targets_mean": 5105.2, "valid_targets_min": 1457 }, { "epoch": 3.980291345329906, "grad_norm": 0.6014671147278671, "learning_rate": 1.8710415150300485e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.12909947335720062, "step": 4645, "valid_targets_mean": 5040.0, "valid_targets_min": 1988 }, { "epoch": 3.9845758354755785, "grad_norm": 0.5570437745107412, "learning_rate": 1.866777591787448e-05, "loss": 0.1714, "loss_nan_ranks": 0, "loss_rank_avg": 0.0958973839879036, "step": 4650, "valid_targets_mean": 4275.1, "valid_targets_min": 3053 }, { "epoch": 3.988860325621251, "grad_norm": 0.4838053085641309, "learning_rate": 1.8625142766880707e-05, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.07679547369480133, "step": 4655, "valid_targets_mean": 4272.4, "valid_targets_min": 1110 }, { "epoch": 3.993144815766924, "grad_norm": 0.4560089306445956, "learning_rate": 1.8582515891934053e-05, "loss": 0.1695, "loss_nan_ranks": 0, "loss_rank_avg": 0.07818187773227692, "step": 4660, "valid_targets_mean": 5043.8, "valid_targets_min": 2346 }, { "epoch": 3.9974293059125965, "grad_norm": 0.4658705104546062, "learning_rate": 1.8539895487620728e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.07729354500770569, "step": 4665, "valid_targets_mean": 5242.0, "valid_targets_min": 3391 }, { "epoch": 4.001713796058269, "grad_norm": 0.5114580276556692, "learning_rate": 1.8497281748497423e-05, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.09246338158845901, "step": 4670, "valid_targets_mean": 5042.1, "valid_targets_min": 2457 }, { "epoch": 4.005998286203941, "grad_norm": 0.5675860095297649, "learning_rate": 1.8454674869090394e-05, "loss": 0.1668, "loss_nan_ranks": 0, "loss_rank_avg": 0.07740327715873718, "step": 4675, "valid_targets_mean": 4260.1, "valid_targets_min": 1793 }, { "epoch": 4.010282776349614, "grad_norm": 0.4395254253260001, "learning_rate": 1.8412075043894587e-05, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.05301671475172043, "step": 4680, "valid_targets_mean": 6729.9, "valid_targets_min": 1457 }, { "epoch": 4.014567266495287, "grad_norm": 0.5305603780007552, "learning_rate": 1.8369482467372748e-05, "loss": 0.1507, "loss_nan_ranks": 0, "loss_rank_avg": 0.0686296597123146, "step": 4685, "valid_targets_mean": 4777.6, "valid_targets_min": 2383 }, { "epoch": 4.018851756640959, "grad_norm": 0.4427631670793687, "learning_rate": 1.8326897333954524e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.05530937761068344, "step": 4690, "valid_targets_mean": 5215.6, "valid_targets_min": 1880 }, { "epoch": 4.023136246786632, "grad_norm": 0.5273081300549666, "learning_rate": 1.8284319838035596e-05, "loss": 0.1693, "loss_nan_ranks": 0, "loss_rank_avg": 0.09043410420417786, "step": 4695, "valid_targets_mean": 5147.4, "valid_targets_min": 2946 }, { "epoch": 4.027420736932305, "grad_norm": 0.516072643406447, "learning_rate": 1.824175017397679e-05, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.07810711860656738, "step": 4700, "valid_targets_mean": 5571.1, "valid_targets_min": 3578 }, { "epoch": 4.031705227077977, "grad_norm": 0.6072196631344798, "learning_rate": 1.8199188536103155e-05, "loss": 0.1715, "loss_nan_ranks": 0, "loss_rank_avg": 0.08345551043748856, "step": 4705, "valid_targets_mean": 3770.1, "valid_targets_min": 1173 }, { "epoch": 4.03598971722365, "grad_norm": 0.5165920468423776, "learning_rate": 1.8156635118703113e-05, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.1011938825249672, "step": 4710, "valid_targets_mean": 5820.2, "valid_targets_min": 3722 }, { "epoch": 4.040274207369323, "grad_norm": 0.6037846700268825, "learning_rate": 1.8114090116027575e-05, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.08537499606609344, "step": 4715, "valid_targets_mean": 3899.5, "valid_targets_min": 2159 }, { "epoch": 4.044558697514995, "grad_norm": 0.564709272472501, "learning_rate": 1.8071553722289012e-05, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.07162496447563171, "step": 4720, "valid_targets_mean": 4443.4, "valid_targets_min": 571 }, { "epoch": 4.048843187660668, "grad_norm": 0.5249602067864373, "learning_rate": 1.8029026131660613e-05, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.08937022089958191, "step": 4725, "valid_targets_mean": 5472.2, "valid_targets_min": 1922 }, { "epoch": 4.053127677806341, "grad_norm": 0.5323768288458474, "learning_rate": 1.7986507538275388e-05, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.09161496162414551, "step": 4730, "valid_targets_mean": 4799.8, "valid_targets_min": 967 }, { "epoch": 4.057412167952013, "grad_norm": 0.5424394265463435, "learning_rate": 1.794399813622527e-05, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.06499495357275009, "step": 4735, "valid_targets_mean": 4970.8, "valid_targets_min": 1345 }, { "epoch": 4.061696658097686, "grad_norm": 0.47986919896406616, "learning_rate": 1.7901498119560224e-05, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.06093684583902359, "step": 4740, "valid_targets_mean": 5482.4, "valid_targets_min": 1190 }, { "epoch": 4.065981148243359, "grad_norm": 0.5696299033930009, "learning_rate": 1.7859007682287382e-05, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.10723207890987396, "step": 4745, "valid_targets_mean": 5067.1, "valid_targets_min": 3381 }, { "epoch": 4.070265638389031, "grad_norm": 0.5399946394195704, "learning_rate": 1.7816527018370154e-05, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.0841757208108902, "step": 4750, "valid_targets_mean": 5439.0, "valid_targets_min": 2166 }, { "epoch": 4.074550128534704, "grad_norm": 0.49331881552628826, "learning_rate": 1.7774056321727318e-05, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.06685491651296616, "step": 4755, "valid_targets_mean": 5076.4, "valid_targets_min": 746 }, { "epoch": 4.078834618680377, "grad_norm": 0.5323944357504423, "learning_rate": 1.7731595786232158e-05, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.08423639088869095, "step": 4760, "valid_targets_mean": 5571.4, "valid_targets_min": 2206 }, { "epoch": 4.0831191088260494, "grad_norm": 0.5021387969482174, "learning_rate": 1.7689145605711597e-05, "loss": 0.1402, "loss_nan_ranks": 0, "loss_rank_avg": 0.06299129128456116, "step": 4765, "valid_targets_mean": 5146.2, "valid_targets_min": 2294 }, { "epoch": 4.087403598971722, "grad_norm": 0.5274689353853328, "learning_rate": 1.764670597394526e-05, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.07674658298492432, "step": 4770, "valid_targets_mean": 4519.9, "valid_targets_min": 1803 }, { "epoch": 4.091688089117395, "grad_norm": 0.6677711186644161, "learning_rate": 1.7604277084664627e-05, "loss": 0.1418, "loss_nan_ranks": 0, "loss_rank_avg": 0.07176576554775238, "step": 4775, "valid_targets_mean": 5555.4, "valid_targets_min": 2832 }, { "epoch": 4.0959725792630675, "grad_norm": 0.5595601408846527, "learning_rate": 1.7561859131552138e-05, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.0624658428132534, "step": 4780, "valid_targets_mean": 4522.5, "valid_targets_min": 1209 }, { "epoch": 4.10025706940874, "grad_norm": 0.5455455804748165, "learning_rate": 1.7519452308240324e-05, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.07068127393722534, "step": 4785, "valid_targets_mean": 5320.4, "valid_targets_min": 1748 }, { "epoch": 4.104541559554413, "grad_norm": 0.5474643591865783, "learning_rate": 1.747705680831089e-05, "loss": 0.1546, "loss_nan_ranks": 0, "loss_rank_avg": 0.07546311616897583, "step": 4790, "valid_targets_mean": 5132.1, "valid_targets_min": 3519 }, { "epoch": 4.1088260497000855, "grad_norm": 0.5385666835894883, "learning_rate": 1.7434672825293858e-05, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.0874762162566185, "step": 4795, "valid_targets_mean": 4158.9, "valid_targets_min": 814 }, { "epoch": 4.113110539845758, "grad_norm": 0.6098356168965273, "learning_rate": 1.7392300552666693e-05, "loss": 0.1614, "loss_nan_ranks": 0, "loss_rank_avg": 0.07409660518169403, "step": 4800, "valid_targets_mean": 3346.6, "valid_targets_min": 1078 }, { "epoch": 4.117395029991431, "grad_norm": 0.5600443893585015, "learning_rate": 1.7349940183853388e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.06515643000602722, "step": 4805, "valid_targets_mean": 4069.8, "valid_targets_min": 1473 }, { "epoch": 4.1216795201371035, "grad_norm": 0.5302463304522121, "learning_rate": 1.730759191222359e-05, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.07636624574661255, "step": 4810, "valid_targets_mean": 5003.0, "valid_targets_min": 2677 }, { "epoch": 4.125964010282776, "grad_norm": 0.5645410089555536, "learning_rate": 1.7265255931091744e-05, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.08191752433776855, "step": 4815, "valid_targets_mean": 5747.6, "valid_targets_min": 4079 }, { "epoch": 4.130248500428449, "grad_norm": 0.5577312981087081, "learning_rate": 1.7222932433716165e-05, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.0870317667722702, "step": 4820, "valid_targets_mean": 4744.1, "valid_targets_min": 1434 }, { "epoch": 4.1345329905741215, "grad_norm": 0.6047371298572394, "learning_rate": 1.718062161329821e-05, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.07716318964958191, "step": 4825, "valid_targets_mean": 3328.6, "valid_targets_min": 484 }, { "epoch": 4.138817480719794, "grad_norm": 0.5179065735302368, "learning_rate": 1.7138323662981342e-05, "loss": 0.1436, "loss_nan_ranks": 0, "loss_rank_avg": 0.055352915078401566, "step": 4830, "valid_targets_mean": 5146.1, "valid_targets_min": 1854 }, { "epoch": 4.143101970865467, "grad_norm": 0.5772651797610137, "learning_rate": 1.7096038775850295e-05, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.08402058482170105, "step": 4835, "valid_targets_mean": 4349.9, "valid_targets_min": 2355 }, { "epoch": 4.1473864610111395, "grad_norm": 0.5282643276921688, "learning_rate": 1.7053767144930155e-05, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.08722338080406189, "step": 4840, "valid_targets_mean": 5179.6, "valid_targets_min": 3034 }, { "epoch": 4.151670951156812, "grad_norm": 0.5683081625420684, "learning_rate": 1.7011508963185505e-05, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.06397093832492828, "step": 4845, "valid_targets_mean": 4508.5, "valid_targets_min": 2709 }, { "epoch": 4.155955441302485, "grad_norm": 0.5040127948122992, "learning_rate": 1.6969264423519525e-05, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.07005979120731354, "step": 4850, "valid_targets_mean": 5723.5, "valid_targets_min": 2919 }, { "epoch": 4.1602399314481575, "grad_norm": 0.5126571353902103, "learning_rate": 1.6927033718773124e-05, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.06733615696430206, "step": 4855, "valid_targets_mean": 5801.8, "valid_targets_min": 3148 }, { "epoch": 4.16452442159383, "grad_norm": 0.5529197226331911, "learning_rate": 1.688481704172407e-05, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.07038679718971252, "step": 4860, "valid_targets_mean": 4861.9, "valid_targets_min": 2188 }, { "epoch": 4.168808911739503, "grad_norm": 0.5276769475415478, "learning_rate": 1.684261458508607e-05, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.09177596867084503, "step": 4865, "valid_targets_mean": 5110.4, "valid_targets_min": 3486 }, { "epoch": 4.1730934018851755, "grad_norm": 0.5313106774206768, "learning_rate": 1.6800426541507933e-05, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.07231737673282623, "step": 4870, "valid_targets_mean": 4668.4, "valid_targets_min": 2299 }, { "epoch": 4.177377892030848, "grad_norm": 0.4968871910487643, "learning_rate": 1.675825310357268e-05, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.06075207144021988, "step": 4875, "valid_targets_mean": 4199.8, "valid_targets_min": 1058 }, { "epoch": 4.181662382176521, "grad_norm": 0.4992102223765819, "learning_rate": 1.6716094463796656e-05, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.06933930516242981, "step": 4880, "valid_targets_mean": 6485.5, "valid_targets_min": 4589 }, { "epoch": 4.1859468723221935, "grad_norm": 0.49852535954505295, "learning_rate": 1.6673950814628638e-05, "loss": 0.1617, "loss_nan_ranks": 0, "loss_rank_avg": 0.06788508594036102, "step": 4885, "valid_targets_mean": 4713.8, "valid_targets_min": 1500 }, { "epoch": 4.190231362467866, "grad_norm": 0.5428573528512465, "learning_rate": 1.663182234844899e-05, "loss": 0.1698, "loss_nan_ranks": 0, "loss_rank_avg": 0.09118878841400146, "step": 4890, "valid_targets_mean": 4834.9, "valid_targets_min": 1226 }, { "epoch": 4.194515852613539, "grad_norm": 0.5399301656937301, "learning_rate": 1.6589709257568766e-05, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.10401996970176697, "step": 4895, "valid_targets_mean": 5292.5, "valid_targets_min": 1699 }, { "epoch": 4.1988003427592115, "grad_norm": 0.5475752036164578, "learning_rate": 1.6547611734228817e-05, "loss": 0.153, "loss_nan_ranks": 0, "loss_rank_avg": 0.07695914804935455, "step": 4900, "valid_targets_mean": 4350.5, "valid_targets_min": 1223 }, { "epoch": 4.203084832904884, "grad_norm": 0.4556661261268513, "learning_rate": 1.650552997059895e-05, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.06842450797557831, "step": 4905, "valid_targets_mean": 5715.6, "valid_targets_min": 2000 }, { "epoch": 4.207369323050557, "grad_norm": 0.4656726329938494, "learning_rate": 1.646346415877703e-05, "loss": 0.1489, "loss_nan_ranks": 0, "loss_rank_avg": 0.061458855867385864, "step": 4910, "valid_targets_mean": 6226.4, "valid_targets_min": 4540 }, { "epoch": 4.21165381319623, "grad_norm": 0.5354888183136649, "learning_rate": 1.6421414490788098e-05, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.09619096666574478, "step": 4915, "valid_targets_mean": 5275.5, "valid_targets_min": 1805 }, { "epoch": 4.215938303341902, "grad_norm": 0.4975118230489396, "learning_rate": 1.6379381158583493e-05, "loss": 0.1366, "loss_nan_ranks": 0, "loss_rank_avg": 0.06388730555772781, "step": 4920, "valid_targets_mean": 5423.9, "valid_targets_min": 3288 }, { "epoch": 4.220222793487575, "grad_norm": 0.5974187769947972, "learning_rate": 1.6337364354039994e-05, "loss": 0.1551, "loss_nan_ranks": 0, "loss_rank_avg": 0.07961668074131012, "step": 4925, "valid_targets_mean": 6249.6, "valid_targets_min": 3773 }, { "epoch": 4.224507283633248, "grad_norm": 0.5862381544675477, "learning_rate": 1.6295364268958936e-05, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.08168651163578033, "step": 4930, "valid_targets_mean": 4983.1, "valid_targets_min": 929 }, { "epoch": 4.22879177377892, "grad_norm": 0.4911113975456263, "learning_rate": 1.6253381095065314e-05, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.0776476263999939, "step": 4935, "valid_targets_mean": 6293.8, "valid_targets_min": 2358 }, { "epoch": 4.233076263924593, "grad_norm": 0.5126617824938491, "learning_rate": 1.621141502400694e-05, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.07559158653020859, "step": 4940, "valid_targets_mean": 6424.8, "valid_targets_min": 1374 }, { "epoch": 4.237360754070266, "grad_norm": 0.5075151025551148, "learning_rate": 1.6169466247353562e-05, "loss": 0.1513, "loss_nan_ranks": 0, "loss_rank_avg": 0.06209402531385422, "step": 4945, "valid_targets_mean": 5486.1, "valid_targets_min": 2639 }, { "epoch": 4.241645244215938, "grad_norm": 0.5109370413756867, "learning_rate": 1.612753495659596e-05, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.09271623939275742, "step": 4950, "valid_targets_mean": 5698.2, "valid_targets_min": 3159 }, { "epoch": 4.245929734361611, "grad_norm": 0.4747575594308358, "learning_rate": 1.6085621343145113e-05, "loss": 0.1429, "loss_nan_ranks": 0, "loss_rank_avg": 0.07969255745410919, "step": 4955, "valid_targets_mean": 7038.0, "valid_targets_min": 5366 }, { "epoch": 4.250214224507284, "grad_norm": 0.5653444035435231, "learning_rate": 1.604372559833129e-05, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.07547251880168915, "step": 4960, "valid_targets_mean": 4756.8, "valid_targets_min": 1066 }, { "epoch": 4.254498714652956, "grad_norm": 0.5581339202049348, "learning_rate": 1.6001847913403195e-05, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.07747235894203186, "step": 4965, "valid_targets_mean": 5881.0, "valid_targets_min": 2908 }, { "epoch": 4.258783204798629, "grad_norm": 0.5703169846987617, "learning_rate": 1.5959988479527103e-05, "loss": 0.1671, "loss_nan_ranks": 0, "loss_rank_avg": 0.10156498104333878, "step": 4970, "valid_targets_mean": 3763.6, "valid_targets_min": 1803 }, { "epoch": 4.263067694944302, "grad_norm": 0.5108130782973002, "learning_rate": 1.591814748778595e-05, "loss": 0.1455, "loss_nan_ranks": 0, "loss_rank_avg": 0.06843523681163788, "step": 4975, "valid_targets_mean": 6338.8, "valid_targets_min": 2763 }, { "epoch": 4.267352185089974, "grad_norm": 0.49260975625136155, "learning_rate": 1.5876325129178522e-05, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.061994947493076324, "step": 4980, "valid_targets_mean": 5452.9, "valid_targets_min": 3764 }, { "epoch": 4.271636675235647, "grad_norm": 0.6114248898222204, "learning_rate": 1.5834521594618514e-05, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.07271035015583038, "step": 4985, "valid_targets_mean": 4659.2, "valid_targets_min": 1087 }, { "epoch": 4.27592116538132, "grad_norm": 0.529292747106911, "learning_rate": 1.579273707493372e-05, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.0663774311542511, "step": 4990, "valid_targets_mean": 3475.1, "valid_targets_min": 1711 }, { "epoch": 4.280205655526992, "grad_norm": 0.47914632822231956, "learning_rate": 1.57509717608651e-05, "loss": 0.1587, "loss_nan_ranks": 0, "loss_rank_avg": 0.058661431074142456, "step": 4995, "valid_targets_mean": 6168.5, "valid_targets_min": 4451 }, { "epoch": 4.284490145672665, "grad_norm": 0.5638502813940276, "learning_rate": 1.570922584306597e-05, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.07884243130683899, "step": 5000, "valid_targets_mean": 4818.4, "valid_targets_min": 2131 }, { "epoch": 4.288774635818338, "grad_norm": 0.5494126554720642, "learning_rate": 1.56674995121011e-05, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.08957488089799881, "step": 5005, "valid_targets_mean": 4892.2, "valid_targets_min": 1181 }, { "epoch": 4.29305912596401, "grad_norm": 0.5068086295229425, "learning_rate": 1.562579295844583e-05, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.06114926189184189, "step": 5010, "valid_targets_mean": 5003.1, "valid_targets_min": 2380 }, { "epoch": 4.297343616109683, "grad_norm": 0.513304107378341, "learning_rate": 1.5584106372485248e-05, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.07609188556671143, "step": 5015, "valid_targets_mean": 4886.4, "valid_targets_min": 1893 }, { "epoch": 4.301628106255356, "grad_norm": 0.504771691823541, "learning_rate": 1.5542439944513275e-05, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.07484638690948486, "step": 5020, "valid_targets_mean": 4305.2, "valid_targets_min": 1695 }, { "epoch": 4.305912596401028, "grad_norm": 0.5398695617811872, "learning_rate": 1.550079386473182e-05, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.07757730782032013, "step": 5025, "valid_targets_mean": 5340.9, "valid_targets_min": 3343 }, { "epoch": 4.310197086546701, "grad_norm": 0.550478230847001, "learning_rate": 1.545916832324989e-05, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.08564269542694092, "step": 5030, "valid_targets_mean": 4638.2, "valid_targets_min": 2890 }, { "epoch": 4.314481576692374, "grad_norm": 0.4889711466495263, "learning_rate": 1.5417563510082755e-05, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.06698659062385559, "step": 5035, "valid_targets_mean": 5970.6, "valid_targets_min": 4406 }, { "epoch": 4.318766066838046, "grad_norm": 0.5347010488287188, "learning_rate": 1.5375979615151057e-05, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.08710899949073792, "step": 5040, "valid_targets_mean": 4744.0, "valid_targets_min": 2763 }, { "epoch": 4.323050556983719, "grad_norm": 0.5546906054359373, "learning_rate": 1.533441682827994e-05, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.06388499587774277, "step": 5045, "valid_targets_mean": 4623.4, "valid_targets_min": 1150 }, { "epoch": 4.327335047129392, "grad_norm": 0.5378021703951273, "learning_rate": 1.529287533919821e-05, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.0835384801030159, "step": 5050, "valid_targets_mean": 4925.8, "valid_targets_min": 2589 }, { "epoch": 4.331619537275064, "grad_norm": 0.5046452348781201, "learning_rate": 1.5251355337537444e-05, "loss": 0.1399, "loss_nan_ranks": 0, "loss_rank_avg": 0.07628235965967178, "step": 5055, "valid_targets_mean": 5603.4, "valid_targets_min": 2126 }, { "epoch": 4.335904027420737, "grad_norm": 0.493889238390984, "learning_rate": 1.5209857012831123e-05, "loss": 0.1668, "loss_nan_ranks": 0, "loss_rank_avg": 0.06308963894844055, "step": 5060, "valid_targets_mean": 5509.6, "valid_targets_min": 1801 }, { "epoch": 4.34018851756641, "grad_norm": 0.5937885212471326, "learning_rate": 1.5168380554513784e-05, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.09766152501106262, "step": 5065, "valid_targets_mean": 3527.0, "valid_targets_min": 618 }, { "epoch": 4.344473007712082, "grad_norm": 0.5495491492987082, "learning_rate": 1.5126926151920147e-05, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.07378506660461426, "step": 5070, "valid_targets_mean": 4329.9, "valid_targets_min": 1607 }, { "epoch": 4.348757497857755, "grad_norm": 0.5484078687151889, "learning_rate": 1.5085493994284242e-05, "loss": 0.1617, "loss_nan_ranks": 0, "loss_rank_avg": 0.07752133905887604, "step": 5075, "valid_targets_mean": 4007.2, "valid_targets_min": 1397 }, { "epoch": 4.353041988003428, "grad_norm": 0.6848788002164049, "learning_rate": 1.5044084270738564e-05, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.08638869971036911, "step": 5080, "valid_targets_mean": 4488.8, "valid_targets_min": 2058 }, { "epoch": 4.3573264781491, "grad_norm": 0.5309526090692271, "learning_rate": 1.5002697170313196e-05, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.07703551650047302, "step": 5085, "valid_targets_mean": 6423.1, "valid_targets_min": 2527 }, { "epoch": 4.361610968294773, "grad_norm": 0.5847600572908466, "learning_rate": 1.4961332881934953e-05, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.07591263949871063, "step": 5090, "valid_targets_mean": 4150.9, "valid_targets_min": 1429 }, { "epoch": 4.365895458440446, "grad_norm": 0.5180251527106797, "learning_rate": 1.4919991594426502e-05, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.07740815728902817, "step": 5095, "valid_targets_mean": 5425.0, "valid_targets_min": 3707 }, { "epoch": 4.370179948586118, "grad_norm": 0.5000963323863451, "learning_rate": 1.4878673496505531e-05, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.0634835809469223, "step": 5100, "valid_targets_mean": 5381.6, "valid_targets_min": 2967 }, { "epoch": 4.374464438731791, "grad_norm": 0.5524440824151057, "learning_rate": 1.4837378776783861e-05, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.07013142108917236, "step": 5105, "valid_targets_mean": 4227.1, "valid_targets_min": 2190 }, { "epoch": 4.378748928877464, "grad_norm": 0.5691071845198381, "learning_rate": 1.4796107623766594e-05, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.08084717392921448, "step": 5110, "valid_targets_mean": 5505.4, "valid_targets_min": 2092 }, { "epoch": 4.383033419023136, "grad_norm": 0.491822580389387, "learning_rate": 1.4754860225851248e-05, "loss": 0.1641, "loss_nan_ranks": 0, "loss_rank_avg": 0.0682189092040062, "step": 5115, "valid_targets_mean": 5129.0, "valid_targets_min": 2418 }, { "epoch": 4.387317909168809, "grad_norm": 0.5001887996202214, "learning_rate": 1.4713636771326929e-05, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.06508070975542068, "step": 5120, "valid_targets_mean": 5043.5, "valid_targets_min": 3149 }, { "epoch": 4.391602399314482, "grad_norm": 0.5022664642918662, "learning_rate": 1.4672437448373416e-05, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.07056738436222076, "step": 5125, "valid_targets_mean": 6385.4, "valid_targets_min": 1720 }, { "epoch": 4.395886889460154, "grad_norm": 0.5863443026857277, "learning_rate": 1.4631262445060332e-05, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.09551360458135605, "step": 5130, "valid_targets_mean": 3457.2, "valid_targets_min": 1548 }, { "epoch": 4.400171379605827, "grad_norm": 0.5741351775944951, "learning_rate": 1.4590111949346306e-05, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.08465814590454102, "step": 5135, "valid_targets_mean": 4954.9, "valid_targets_min": 2516 }, { "epoch": 4.4044558697515, "grad_norm": 0.5430047413666953, "learning_rate": 1.4548986149078062e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.09200140833854675, "step": 5140, "valid_targets_mean": 5727.6, "valid_targets_min": 2481 }, { "epoch": 4.408740359897172, "grad_norm": 0.5646929867221707, "learning_rate": 1.4507885231989622e-05, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.06149185448884964, "step": 5145, "valid_targets_mean": 4736.2, "valid_targets_min": 1427 }, { "epoch": 4.413024850042845, "grad_norm": 0.5302072495262342, "learning_rate": 1.4466809385701392e-05, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.05918242782354355, "step": 5150, "valid_targets_mean": 4760.2, "valid_targets_min": 1269 }, { "epoch": 4.417309340188518, "grad_norm": 0.5252703532678488, "learning_rate": 1.4425758797719365e-05, "loss": 0.1665, "loss_nan_ranks": 0, "loss_rank_avg": 0.0716017633676529, "step": 5155, "valid_targets_mean": 4607.8, "valid_targets_min": 2376 }, { "epoch": 4.42159383033419, "grad_norm": 0.5844920058156552, "learning_rate": 1.4384733655434201e-05, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.07548099756240845, "step": 5160, "valid_targets_mean": 4374.4, "valid_targets_min": 1540 }, { "epoch": 4.425878320479863, "grad_norm": 0.5440444311779218, "learning_rate": 1.434373414612043e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.08596000075340271, "step": 5165, "valid_targets_mean": 4538.4, "valid_targets_min": 1312 }, { "epoch": 4.430162810625536, "grad_norm": 0.5227315015316456, "learning_rate": 1.4302760456935554e-05, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.06954213976860046, "step": 5170, "valid_targets_mean": 4355.1, "valid_targets_min": 1344 }, { "epoch": 4.434447300771208, "grad_norm": 0.5359733841570606, "learning_rate": 1.4261812774919204e-05, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.07341448962688446, "step": 5175, "valid_targets_mean": 5344.9, "valid_targets_min": 1219 }, { "epoch": 4.438731790916881, "grad_norm": 0.5007954035839989, "learning_rate": 1.422089128699232e-05, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.0841982364654541, "step": 5180, "valid_targets_mean": 5447.6, "valid_targets_min": 4387 }, { "epoch": 4.443016281062554, "grad_norm": 0.4942238514175937, "learning_rate": 1.417999617995623e-05, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.083289735019207, "step": 5185, "valid_targets_mean": 6193.6, "valid_targets_min": 3138 }, { "epoch": 4.447300771208226, "grad_norm": 0.540560184297077, "learning_rate": 1.4139127640491878e-05, "loss": 0.153, "loss_nan_ranks": 0, "loss_rank_avg": 0.09234566986560822, "step": 5190, "valid_targets_mean": 5512.8, "valid_targets_min": 1162 }, { "epoch": 4.451585261353899, "grad_norm": 0.5261391646545392, "learning_rate": 1.40982858551589e-05, "loss": 0.1593, "loss_nan_ranks": 0, "loss_rank_avg": 0.08443096280097961, "step": 5195, "valid_targets_mean": 4668.5, "valid_targets_min": 2560 }, { "epoch": 4.455869751499572, "grad_norm": 0.5522795050476156, "learning_rate": 1.4057471010394817e-05, "loss": 0.1671, "loss_nan_ranks": 0, "loss_rank_avg": 0.07564914226531982, "step": 5200, "valid_targets_mean": 4724.5, "valid_targets_min": 1988 }, { "epoch": 4.460154241645244, "grad_norm": 0.567034605022243, "learning_rate": 1.4016683292514159e-05, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.0924619808793068, "step": 5205, "valid_targets_mean": 4826.9, "valid_targets_min": 1476 }, { "epoch": 4.464438731790917, "grad_norm": 0.5095049144912834, "learning_rate": 1.3975922887707642e-05, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.08745399862527847, "step": 5210, "valid_targets_mean": 7177.6, "valid_targets_min": 3947 }, { "epoch": 4.46872322193659, "grad_norm": 0.5347971040551971, "learning_rate": 1.3935189982041288e-05, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.06757889688014984, "step": 5215, "valid_targets_mean": 4876.9, "valid_targets_min": 1697 }, { "epoch": 4.473007712082262, "grad_norm": 0.5031940372937177, "learning_rate": 1.389448476145558e-05, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.07829098403453827, "step": 5220, "valid_targets_mean": 5504.0, "valid_targets_min": 914 }, { "epoch": 4.477292202227935, "grad_norm": 0.4877850332317292, "learning_rate": 1.385380741176465e-05, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.05520389601588249, "step": 5225, "valid_targets_mean": 5574.2, "valid_targets_min": 2353 }, { "epoch": 4.481576692373608, "grad_norm": 0.5168689231491843, "learning_rate": 1.3813158118655388e-05, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.06339316070079803, "step": 5230, "valid_targets_mean": 4143.9, "valid_targets_min": 2092 }, { "epoch": 4.4858611825192805, "grad_norm": 0.5211426284721579, "learning_rate": 1.37725370676866e-05, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.07790861278772354, "step": 5235, "valid_targets_mean": 5682.0, "valid_targets_min": 1654 }, { "epoch": 4.490145672664953, "grad_norm": 0.5501908060838966, "learning_rate": 1.3731944444288176e-05, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.07432614266872406, "step": 5240, "valid_targets_mean": 5329.0, "valid_targets_min": 2228 }, { "epoch": 4.494430162810626, "grad_norm": 0.6814936988247406, "learning_rate": 1.3691380433760256e-05, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.08724258840084076, "step": 5245, "valid_targets_mean": 5105.9, "valid_targets_min": 1802 }, { "epoch": 4.4987146529562985, "grad_norm": 0.48575644119426753, "learning_rate": 1.3650845221272339e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.08099687099456787, "step": 5250, "valid_targets_mean": 5515.2, "valid_targets_min": 1997 }, { "epoch": 4.502999143101971, "grad_norm": 0.4792202117077872, "learning_rate": 1.361033899186247e-05, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.05577072501182556, "step": 5255, "valid_targets_mean": 4312.9, "valid_targets_min": 1432 }, { "epoch": 4.507283633247644, "grad_norm": 0.4968967287597206, "learning_rate": 1.356986193043641e-05, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.056737661361694336, "step": 5260, "valid_targets_mean": 5970.6, "valid_targets_min": 2492 }, { "epoch": 4.5115681233933165, "grad_norm": 0.548191687960978, "learning_rate": 1.3529414221766757e-05, "loss": 0.1458, "loss_nan_ranks": 0, "loss_rank_avg": 0.06213381886482239, "step": 5265, "valid_targets_mean": 6522.9, "valid_targets_min": 4398 }, { "epoch": 4.515852613538989, "grad_norm": 0.5321136136220768, "learning_rate": 1.3488996050492113e-05, "loss": 0.1678, "loss_nan_ranks": 0, "loss_rank_avg": 0.09102845191955566, "step": 5270, "valid_targets_mean": 6087.0, "valid_targets_min": 3210 }, { "epoch": 4.520137103684662, "grad_norm": 0.5061958136840395, "learning_rate": 1.344860760111625e-05, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.0620713010430336, "step": 5275, "valid_targets_mean": 5473.5, "valid_targets_min": 2461 }, { "epoch": 4.5244215938303345, "grad_norm": 0.6581217807964654, "learning_rate": 1.340824905800727e-05, "loss": 0.1582, "loss_nan_ranks": 0, "loss_rank_avg": 0.0733901634812355, "step": 5280, "valid_targets_mean": 3708.5, "valid_targets_min": 1991 }, { "epoch": 4.528706083976007, "grad_norm": 0.5523848868978788, "learning_rate": 1.3367920605396747e-05, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.08316996693611145, "step": 5285, "valid_targets_mean": 5033.2, "valid_targets_min": 420 }, { "epoch": 4.53299057412168, "grad_norm": 0.5996859005901333, "learning_rate": 1.3327622427378898e-05, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.07758800685405731, "step": 5290, "valid_targets_mean": 4266.6, "valid_targets_min": 648 }, { "epoch": 4.5372750642673525, "grad_norm": 0.4698519477164445, "learning_rate": 1.3287354707909749e-05, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.06927581131458282, "step": 5295, "valid_targets_mean": 5093.6, "valid_targets_min": 2129 }, { "epoch": 4.541559554413025, "grad_norm": 0.5573866431663388, "learning_rate": 1.3247117630806278e-05, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.08232997357845306, "step": 5300, "valid_targets_mean": 4446.1, "valid_targets_min": 1670 }, { "epoch": 4.545844044558698, "grad_norm": 0.5159305534170026, "learning_rate": 1.3206911379745584e-05, "loss": 0.1717, "loss_nan_ranks": 0, "loss_rank_avg": 0.09247186779975891, "step": 5305, "valid_targets_mean": 4631.2, "valid_targets_min": 2132 }, { "epoch": 4.5501285347043705, "grad_norm": 0.5031933574779294, "learning_rate": 1.3166736138264055e-05, "loss": 0.1528, "loss_nan_ranks": 0, "loss_rank_avg": 0.06761917471885681, "step": 5310, "valid_targets_mean": 5934.8, "valid_targets_min": 1071 }, { "epoch": 4.554413024850043, "grad_norm": 0.5472447704799865, "learning_rate": 1.3126592089756521e-05, "loss": 0.1434, "loss_nan_ranks": 0, "loss_rank_avg": 0.07344842702150345, "step": 5315, "valid_targets_mean": 5072.5, "valid_targets_min": 2786 }, { "epoch": 4.558697514995716, "grad_norm": 0.577751519518059, "learning_rate": 1.3086479417475408e-05, "loss": 0.1692, "loss_nan_ranks": 0, "loss_rank_avg": 0.09713322669267654, "step": 5320, "valid_targets_mean": 5168.0, "valid_targets_min": 2283 }, { "epoch": 4.5629820051413885, "grad_norm": 0.47491486290625706, "learning_rate": 1.3046398304529933e-05, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.06455229222774506, "step": 5325, "valid_targets_mean": 5562.4, "valid_targets_min": 1848 }, { "epoch": 4.567266495287061, "grad_norm": 0.4797250814827459, "learning_rate": 1.3006348933885252e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.05497722327709198, "step": 5330, "valid_targets_mean": 5382.9, "valid_targets_min": 3161 }, { "epoch": 4.571550985432734, "grad_norm": 0.5414909779456916, "learning_rate": 1.2966331488361599e-05, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.08572009205818176, "step": 5335, "valid_targets_mean": 4926.2, "valid_targets_min": 770 }, { "epoch": 4.5758354755784065, "grad_norm": 0.5539025467247136, "learning_rate": 1.2926346150633484e-05, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.06572136282920837, "step": 5340, "valid_targets_mean": 4644.0, "valid_targets_min": 1389 }, { "epoch": 4.580119965724079, "grad_norm": 0.5283538221866442, "learning_rate": 1.288639310322886e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.07332241535186768, "step": 5345, "valid_targets_mean": 5910.5, "valid_targets_min": 4202 }, { "epoch": 4.584404455869752, "grad_norm": 0.5636559415041953, "learning_rate": 1.2846472528528256e-05, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.09230844676494598, "step": 5350, "valid_targets_mean": 5420.8, "valid_targets_min": 3139 }, { "epoch": 4.5886889460154245, "grad_norm": 0.4655589846682366, "learning_rate": 1.2806584608763994e-05, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.0654459148645401, "step": 5355, "valid_targets_mean": 5589.5, "valid_targets_min": 2240 }, { "epoch": 4.592973436161097, "grad_norm": 0.5546221446040871, "learning_rate": 1.2766729526019304e-05, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.07415308803319931, "step": 5360, "valid_targets_mean": 5301.8, "valid_targets_min": 3329 }, { "epoch": 4.59725792630677, "grad_norm": 0.546669939195082, "learning_rate": 1.2726907462227544e-05, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.08334168046712875, "step": 5365, "valid_targets_mean": 5201.9, "valid_targets_min": 3041 }, { "epoch": 4.6015424164524426, "grad_norm": 0.5135226747551913, "learning_rate": 1.2687118599171327e-05, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.07777928560972214, "step": 5370, "valid_targets_mean": 5755.5, "valid_targets_min": 3512 }, { "epoch": 4.605826906598114, "grad_norm": 0.5242944087916945, "learning_rate": 1.2647363118481717e-05, "loss": 0.1445, "loss_nan_ranks": 0, "loss_rank_avg": 0.06749745458364487, "step": 5375, "valid_targets_mean": 5622.8, "valid_targets_min": 3932 }, { "epoch": 4.610111396743788, "grad_norm": 0.5290445805781622, "learning_rate": 1.260764120163739e-05, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.09278124570846558, "step": 5380, "valid_targets_mean": 5294.4, "valid_targets_min": 1943 }, { "epoch": 4.61439588688946, "grad_norm": 0.4952292523993502, "learning_rate": 1.25679530299638e-05, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.07781682163476944, "step": 5385, "valid_targets_mean": 6209.1, "valid_targets_min": 3518 }, { "epoch": 4.618680377035133, "grad_norm": 0.5090845076261995, "learning_rate": 1.2528298784632375e-05, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.08040069788694382, "step": 5390, "valid_targets_mean": 6575.0, "valid_targets_min": 4930 }, { "epoch": 4.622964867180805, "grad_norm": 0.7138521723562766, "learning_rate": 1.2488678646659658e-05, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.07027311623096466, "step": 5395, "valid_targets_mean": 4191.6, "valid_targets_min": 1864 }, { "epoch": 4.627249357326479, "grad_norm": 0.5234789422070203, "learning_rate": 1.2449092796906497e-05, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.06149337440729141, "step": 5400, "valid_targets_mean": 5699.6, "valid_targets_min": 2825 }, { "epoch": 4.63153384747215, "grad_norm": 0.5453103495533085, "learning_rate": 1.2409541416077238e-05, "loss": 0.1692, "loss_nan_ranks": 0, "loss_rank_avg": 0.0639188289642334, "step": 5405, "valid_targets_mean": 4543.4, "valid_targets_min": 1354 }, { "epoch": 4.635818337617824, "grad_norm": 0.529250776293999, "learning_rate": 1.237002468471886e-05, "loss": 0.1693, "loss_nan_ranks": 0, "loss_rank_avg": 0.06333880126476288, "step": 5410, "valid_targets_mean": 5286.9, "valid_targets_min": 4132 }, { "epoch": 4.640102827763496, "grad_norm": 0.4824578549134014, "learning_rate": 1.2330542783220177e-05, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.06923186033964157, "step": 5415, "valid_targets_mean": 5960.9, "valid_targets_min": 2901 }, { "epoch": 4.644387317909169, "grad_norm": 0.6147699408146292, "learning_rate": 1.2291095891811013e-05, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.0718100517988205, "step": 5420, "valid_targets_mean": 5304.1, "valid_targets_min": 2365 }, { "epoch": 4.648671808054841, "grad_norm": 0.570110845047798, "learning_rate": 1.2251684190561374e-05, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.11174198985099792, "step": 5425, "valid_targets_mean": 4865.2, "valid_targets_min": 1515 }, { "epoch": 4.652956298200515, "grad_norm": 0.5422990193863433, "learning_rate": 1.2212307859380618e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.08089768141508102, "step": 5430, "valid_targets_mean": 5349.4, "valid_targets_min": 1626 }, { "epoch": 4.657240788346186, "grad_norm": 0.5224672528642734, "learning_rate": 1.2172967078016656e-05, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.07316748797893524, "step": 5435, "valid_targets_mean": 5330.9, "valid_targets_min": 2271 }, { "epoch": 4.66152527849186, "grad_norm": 0.569852849423712, "learning_rate": 1.2133662026055125e-05, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.070674367249012, "step": 5440, "valid_targets_mean": 4763.4, "valid_targets_min": 2084 }, { "epoch": 4.665809768637532, "grad_norm": 0.5424889241152411, "learning_rate": 1.209439288291854e-05, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.09382478892803192, "step": 5445, "valid_targets_mean": 4803.8, "valid_targets_min": 2923 }, { "epoch": 4.670094258783205, "grad_norm": 0.5472144017637648, "learning_rate": 1.2055159827865505e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.0735054463148117, "step": 5450, "valid_targets_mean": 4434.1, "valid_targets_min": 2278 }, { "epoch": 4.674378748928877, "grad_norm": 0.4995362136721301, "learning_rate": 1.2015963039989905e-05, "loss": 0.153, "loss_nan_ranks": 0, "loss_rank_avg": 0.06715245544910431, "step": 5455, "valid_targets_mean": 4374.8, "valid_targets_min": 2406 }, { "epoch": 4.678663239074551, "grad_norm": 0.5507431322821279, "learning_rate": 1.1976802698220038e-05, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.06111610680818558, "step": 5460, "valid_targets_mean": 4680.6, "valid_targets_min": 2076 }, { "epoch": 4.682947729220222, "grad_norm": 0.5378007298408868, "learning_rate": 1.193767898131785e-05, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.07199619710445404, "step": 5465, "valid_targets_mean": 4682.8, "valid_targets_min": 817 }, { "epoch": 4.687232219365896, "grad_norm": 0.5653851351887367, "learning_rate": 1.1898592067878095e-05, "loss": 0.1512, "loss_nan_ranks": 0, "loss_rank_avg": 0.06057225912809372, "step": 5470, "valid_targets_mean": 4277.6, "valid_targets_min": 1210 }, { "epoch": 4.691516709511568, "grad_norm": 0.5696106129355583, "learning_rate": 1.1859542136327536e-05, "loss": 0.1685, "loss_nan_ranks": 0, "loss_rank_avg": 0.08045990765094757, "step": 5475, "valid_targets_mean": 4922.5, "valid_targets_min": 1710 }, { "epoch": 4.69580119965724, "grad_norm": 0.7438822419270039, "learning_rate": 1.1820529364924097e-05, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.06591324508190155, "step": 5480, "valid_targets_mean": 4385.4, "valid_targets_min": 2395 }, { "epoch": 4.700085689802913, "grad_norm": 0.5508282840037704, "learning_rate": 1.1781553931756085e-05, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.08241961896419525, "step": 5485, "valid_targets_mean": 4717.6, "valid_targets_min": 1312 }, { "epoch": 4.704370179948586, "grad_norm": 0.5323245501515965, "learning_rate": 1.1742616014741357e-05, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.08502338826656342, "step": 5490, "valid_targets_mean": 4517.1, "valid_targets_min": 2815 }, { "epoch": 4.708654670094258, "grad_norm": 0.5426241679965548, "learning_rate": 1.170371579162651e-05, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.08141259849071503, "step": 5495, "valid_targets_mean": 4457.2, "valid_targets_min": 1908 }, { "epoch": 4.712939160239931, "grad_norm": 0.5261494063308156, "learning_rate": 1.1664853439986088e-05, "loss": 0.1588, "loss_nan_ranks": 0, "loss_rank_avg": 0.0825117975473404, "step": 5500, "valid_targets_mean": 5681.6, "valid_targets_min": 3930 }, { "epoch": 4.717223650385604, "grad_norm": 0.5842224316874969, "learning_rate": 1.1626029137221732e-05, "loss": 0.1762, "loss_nan_ranks": 0, "loss_rank_avg": 0.089847132563591, "step": 5505, "valid_targets_mean": 4607.5, "valid_targets_min": 2200 }, { "epoch": 4.721508140531276, "grad_norm": 0.5451479286311981, "learning_rate": 1.158724306056143e-05, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.07350163161754608, "step": 5510, "valid_targets_mean": 5046.6, "valid_targets_min": 1281 }, { "epoch": 4.725792630676949, "grad_norm": 0.5225285581687482, "learning_rate": 1.1548495387058642e-05, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.08591011166572571, "step": 5515, "valid_targets_mean": 5717.2, "valid_targets_min": 3322 }, { "epoch": 4.730077120822622, "grad_norm": 0.5141714932638097, "learning_rate": 1.1509786293591524e-05, "loss": 0.1564, "loss_nan_ranks": 0, "loss_rank_avg": 0.08459824323654175, "step": 5520, "valid_targets_mean": 5143.5, "valid_targets_min": 1339 }, { "epoch": 4.734361610968294, "grad_norm": 0.5597302521486275, "learning_rate": 1.1471115956862145e-05, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.08023977279663086, "step": 5525, "valid_targets_mean": 4154.6, "valid_targets_min": 1669 }, { "epoch": 4.738646101113967, "grad_norm": 0.538636287377202, "learning_rate": 1.143248455339563e-05, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.07752753794193268, "step": 5530, "valid_targets_mean": 4840.4, "valid_targets_min": 1511 }, { "epoch": 4.74293059125964, "grad_norm": 0.5506968921961911, "learning_rate": 1.1393892259539383e-05, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.08784641325473785, "step": 5535, "valid_targets_mean": 4550.6, "valid_targets_min": 1941 }, { "epoch": 4.7472150814053125, "grad_norm": 0.5163377608613207, "learning_rate": 1.1355339251462274e-05, "loss": 0.1472, "loss_nan_ranks": 0, "loss_rank_avg": 0.06592030823230743, "step": 5540, "valid_targets_mean": 4323.5, "valid_targets_min": 1705 }, { "epoch": 4.751499571550985, "grad_norm": 0.6296357758109399, "learning_rate": 1.1316825705153865e-05, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.09954133629798889, "step": 5545, "valid_targets_mean": 4299.6, "valid_targets_min": 2768 }, { "epoch": 4.755784061696658, "grad_norm": 0.48267799557988644, "learning_rate": 1.1278351796423545e-05, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.05708755552768707, "step": 5550, "valid_targets_mean": 5362.1, "valid_targets_min": 2246 }, { "epoch": 4.7600685518423305, "grad_norm": 0.5302101998703135, "learning_rate": 1.1239917700899778e-05, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.0904797613620758, "step": 5555, "valid_targets_mean": 5171.4, "valid_targets_min": 3800 }, { "epoch": 4.764353041988003, "grad_norm": 0.5421815674524496, "learning_rate": 1.1201523594029296e-05, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.07278761267662048, "step": 5560, "valid_targets_mean": 6107.8, "valid_targets_min": 2127 }, { "epoch": 4.768637532133676, "grad_norm": 0.5281193865224264, "learning_rate": 1.1163169651076271e-05, "loss": 0.1426, "loss_nan_ranks": 0, "loss_rank_avg": 0.07599358260631561, "step": 5565, "valid_targets_mean": 5263.0, "valid_targets_min": 2255 }, { "epoch": 4.7729220222793485, "grad_norm": 0.5672602574684631, "learning_rate": 1.1124856047121538e-05, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.08513578772544861, "step": 5570, "valid_targets_mean": 4949.6, "valid_targets_min": 1346 }, { "epoch": 4.777206512425021, "grad_norm": 0.5546920567993101, "learning_rate": 1.108658295706178e-05, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.07476161420345306, "step": 5575, "valid_targets_mean": 4970.9, "valid_targets_min": 1518 }, { "epoch": 4.781491002570694, "grad_norm": 0.5495756311638148, "learning_rate": 1.104835055560877e-05, "loss": 0.159, "loss_nan_ranks": 0, "loss_rank_avg": 0.11116725951433182, "step": 5580, "valid_targets_mean": 5278.9, "valid_targets_min": 3203 }, { "epoch": 4.7857754927163665, "grad_norm": 0.531572898829633, "learning_rate": 1.1010159017288503e-05, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.06708759069442749, "step": 5585, "valid_targets_mean": 5266.9, "valid_targets_min": 2536 }, { "epoch": 4.790059982862039, "grad_norm": 0.6385122856137114, "learning_rate": 1.0972008516440475e-05, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.08954238146543503, "step": 5590, "valid_targets_mean": 4359.5, "valid_targets_min": 1431 }, { "epoch": 4.794344473007712, "grad_norm": 0.5186245977784936, "learning_rate": 1.0933899227216825e-05, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.0712139829993248, "step": 5595, "valid_targets_mean": 5009.5, "valid_targets_min": 1381 }, { "epoch": 4.7986289631533845, "grad_norm": 0.5319356056915755, "learning_rate": 1.0895831323581576e-05, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.07693114131689072, "step": 5600, "valid_targets_mean": 4645.4, "valid_targets_min": 2833 }, { "epoch": 4.802913453299057, "grad_norm": 0.5212979617586241, "learning_rate": 1.085780497930983e-05, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.07081075012683868, "step": 5605, "valid_targets_mean": 5706.9, "valid_targets_min": 2853 }, { "epoch": 4.80719794344473, "grad_norm": 0.535613814118286, "learning_rate": 1.0819820367986971e-05, "loss": 0.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.054836373776197433, "step": 5610, "valid_targets_mean": 4400.9, "valid_targets_min": 1582 }, { "epoch": 4.8114824335904025, "grad_norm": 0.524310423958414, "learning_rate": 1.0781877663007894e-05, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.08845508098602295, "step": 5615, "valid_targets_mean": 5411.8, "valid_targets_min": 2292 }, { "epoch": 4.815766923736075, "grad_norm": 0.49503651101709395, "learning_rate": 1.0743977037576175e-05, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.06133238226175308, "step": 5620, "valid_targets_mean": 6299.9, "valid_targets_min": 1401 }, { "epoch": 4.820051413881748, "grad_norm": 0.5260704382165095, "learning_rate": 1.0706118664703325e-05, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.07649976760149002, "step": 5625, "valid_targets_mean": 5099.4, "valid_targets_min": 1739 }, { "epoch": 4.8243359040274205, "grad_norm": 0.5417701735704517, "learning_rate": 1.0668302717207956e-05, "loss": 0.1538, "loss_nan_ranks": 0, "loss_rank_avg": 0.07010504603385925, "step": 5630, "valid_targets_mean": 4464.9, "valid_targets_min": 1685 }, { "epoch": 4.828620394173093, "grad_norm": 0.5671176679190546, "learning_rate": 1.063052936771503e-05, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.06441761553287506, "step": 5635, "valid_targets_mean": 5495.6, "valid_targets_min": 3054 }, { "epoch": 4.832904884318766, "grad_norm": 0.581886558811821, "learning_rate": 1.0592798788655041e-05, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.09613919258117676, "step": 5640, "valid_targets_mean": 5075.4, "valid_targets_min": 2716 }, { "epoch": 4.8371893744644385, "grad_norm": 0.7008507535275961, "learning_rate": 1.0555111152263242e-05, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.1073591411113739, "step": 5645, "valid_targets_mean": 6467.6, "valid_targets_min": 2480 }, { "epoch": 4.841473864610111, "grad_norm": 0.5070119707443743, "learning_rate": 1.0517466630578874e-05, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.054898276925086975, "step": 5650, "valid_targets_mean": 5255.6, "valid_targets_min": 1531 }, { "epoch": 4.845758354755784, "grad_norm": 0.5516486979699894, "learning_rate": 1.0479865395444362e-05, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.059809666126966476, "step": 5655, "valid_targets_mean": 5287.0, "valid_targets_min": 1630 }, { "epoch": 4.8500428449014565, "grad_norm": 0.5398004607320777, "learning_rate": 1.044230761850452e-05, "loss": 0.1455, "loss_nan_ranks": 0, "loss_rank_avg": 0.08338692039251328, "step": 5660, "valid_targets_mean": 6707.8, "valid_targets_min": 3387 }, { "epoch": 4.854327335047129, "grad_norm": 0.5668342950363051, "learning_rate": 1.040479347120578e-05, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.07433384656906128, "step": 5665, "valid_targets_mean": 4323.1, "valid_targets_min": 1718 }, { "epoch": 4.858611825192802, "grad_norm": 0.6213106739886147, "learning_rate": 1.036732312479543e-05, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.09529195725917816, "step": 5670, "valid_targets_mean": 5139.4, "valid_targets_min": 1208 }, { "epoch": 4.8628963153384746, "grad_norm": 0.5177404281691247, "learning_rate": 1.0329896750320789e-05, "loss": 0.1436, "loss_nan_ranks": 0, "loss_rank_avg": 0.0704999715089798, "step": 5675, "valid_targets_mean": 5343.9, "valid_targets_min": 2279 }, { "epoch": 4.867180805484147, "grad_norm": 0.520797862309505, "learning_rate": 1.0292514518628462e-05, "loss": 0.14, "loss_nan_ranks": 0, "loss_rank_avg": 0.05940914899110794, "step": 5680, "valid_targets_mean": 5120.5, "valid_targets_min": 3199 }, { "epoch": 4.87146529562982, "grad_norm": 0.5458396359053364, "learning_rate": 1.025517660036355e-05, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.06686630845069885, "step": 5685, "valid_targets_mean": 5368.1, "valid_targets_min": 1607 }, { "epoch": 4.875749785775493, "grad_norm": 0.5143392154065023, "learning_rate": 1.0217883165968873e-05, "loss": 0.1663, "loss_nan_ranks": 0, "loss_rank_avg": 0.07533658295869827, "step": 5690, "valid_targets_mean": 5656.9, "valid_targets_min": 4122 }, { "epoch": 4.880034275921165, "grad_norm": 0.5466425536619203, "learning_rate": 1.0180634385684179e-05, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.08453083038330078, "step": 5695, "valid_targets_mean": 5683.0, "valid_targets_min": 2789 }, { "epoch": 4.884318766066838, "grad_norm": 0.5423879147218846, "learning_rate": 1.0143430429545367e-05, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.07795500010251999, "step": 5700, "valid_targets_mean": 5769.6, "valid_targets_min": 4791 }, { "epoch": 4.888603256212511, "grad_norm": 0.5341530692778058, "learning_rate": 1.010627146738374e-05, "loss": 0.1426, "loss_nan_ranks": 0, "loss_rank_avg": 0.0644720196723938, "step": 5705, "valid_targets_mean": 5012.2, "valid_targets_min": 2150 }, { "epoch": 4.892887746358183, "grad_norm": 0.5737432099647293, "learning_rate": 1.0069157668825185e-05, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.11156918108463287, "step": 5710, "valid_targets_mean": 4350.5, "valid_targets_min": 2085 }, { "epoch": 4.897172236503856, "grad_norm": 0.526678452776669, "learning_rate": 1.0032089203289446e-05, "loss": 0.1453, "loss_nan_ranks": 0, "loss_rank_avg": 0.06818336993455887, "step": 5715, "valid_targets_mean": 4246.8, "valid_targets_min": 1373 }, { "epoch": 4.901456726649529, "grad_norm": 0.47464083861660505, "learning_rate": 9.99506623998933e-06, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.07242852449417114, "step": 5720, "valid_targets_mean": 6936.0, "valid_targets_min": 4491 }, { "epoch": 4.905741216795201, "grad_norm": 0.6043407418923966, "learning_rate": 9.958088947929909e-06, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.10490664094686508, "step": 5725, "valid_targets_mean": 4582.8, "valid_targets_min": 1712 }, { "epoch": 4.910025706940874, "grad_norm": 0.5525595588437875, "learning_rate": 9.921157495907785e-06, "loss": 0.1646, "loss_nan_ranks": 0, "loss_rank_avg": 0.09463279694318771, "step": 5730, "valid_targets_mean": 5260.6, "valid_targets_min": 1353 }, { "epoch": 4.914310197086547, "grad_norm": 0.5188449026265485, "learning_rate": 9.884272052510306e-06, "loss": 0.1367, "loss_nan_ranks": 0, "loss_rank_avg": 0.08734147250652313, "step": 5735, "valid_targets_mean": 5719.8, "valid_targets_min": 3734 }, { "epoch": 4.918594687232219, "grad_norm": 0.550677240559499, "learning_rate": 9.847432786114793e-06, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.07683046162128448, "step": 5740, "valid_targets_mean": 5706.1, "valid_targets_min": 3867 }, { "epoch": 4.922879177377892, "grad_norm": 0.544349033724898, "learning_rate": 9.810639864887767e-06, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.07485879212617874, "step": 5745, "valid_targets_mean": 5523.6, "valid_targets_min": 1666 }, { "epoch": 4.927163667523565, "grad_norm": 0.5541874503249078, "learning_rate": 9.773893456784212e-06, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.08049365133047104, "step": 5750, "valid_targets_mean": 4984.2, "valid_targets_min": 1629 }, { "epoch": 4.931448157669237, "grad_norm": 0.49873889321961007, "learning_rate": 9.737193729546775e-06, "loss": 0.1455, "loss_nan_ranks": 0, "loss_rank_avg": 0.07165542244911194, "step": 5755, "valid_targets_mean": 5716.2, "valid_targets_min": 2894 }, { "epoch": 4.93573264781491, "grad_norm": 0.5310506565288947, "learning_rate": 9.700540850705007e-06, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.08118843287229538, "step": 5760, "valid_targets_mean": 4976.8, "valid_targets_min": 2014 }, { "epoch": 4.940017137960583, "grad_norm": 0.581273266255407, "learning_rate": 9.663934987574597e-06, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.08815907686948776, "step": 5765, "valid_targets_mean": 5708.8, "valid_targets_min": 2736 }, { "epoch": 4.944301628106255, "grad_norm": 0.4753411184941003, "learning_rate": 9.627376307256626e-06, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.07187001407146454, "step": 5770, "valid_targets_mean": 4870.6, "valid_targets_min": 2266 }, { "epoch": 4.948586118251928, "grad_norm": 0.5255200905440895, "learning_rate": 9.590864976636774e-06, "loss": 0.1417, "loss_nan_ranks": 0, "loss_rank_avg": 0.07110698521137238, "step": 5775, "valid_targets_mean": 4578.6, "valid_targets_min": 1793 }, { "epoch": 4.952870608397601, "grad_norm": 0.5223872032353971, "learning_rate": 9.554401162384604e-06, "loss": 0.149, "loss_nan_ranks": 0, "loss_rank_avg": 0.06410413980484009, "step": 5780, "valid_targets_mean": 4336.6, "valid_targets_min": 2024 }, { "epoch": 4.957155098543273, "grad_norm": 0.546798377896757, "learning_rate": 9.517985030952739e-06, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.0852179229259491, "step": 5785, "valid_targets_mean": 5628.1, "valid_targets_min": 2023 }, { "epoch": 4.961439588688946, "grad_norm": 0.5161720732576406, "learning_rate": 9.481616748576171e-06, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.06516799330711365, "step": 5790, "valid_targets_mean": 4302.5, "valid_targets_min": 1825 }, { "epoch": 4.965724078834619, "grad_norm": 0.565400152380402, "learning_rate": 9.44529648127144e-06, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.07869059592485428, "step": 5795, "valid_targets_mean": 3989.9, "valid_targets_min": 699 }, { "epoch": 4.970008568980291, "grad_norm": 0.48670358415908505, "learning_rate": 9.409024394835912e-06, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.06296761333942413, "step": 5800, "valid_targets_mean": 4779.6, "valid_targets_min": 1387 }, { "epoch": 4.974293059125964, "grad_norm": 0.5317639102339133, "learning_rate": 9.372800654847015e-06, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.05721823498606682, "step": 5805, "valid_targets_mean": 4486.0, "valid_targets_min": 1897 }, { "epoch": 4.978577549271637, "grad_norm": 0.5874589278661156, "learning_rate": 9.336625426661475e-06, "loss": 0.1674, "loss_nan_ranks": 0, "loss_rank_avg": 0.07887572050094604, "step": 5810, "valid_targets_mean": 4364.9, "valid_targets_min": 1879 }, { "epoch": 4.982862039417309, "grad_norm": 0.5575739274103504, "learning_rate": 9.300498875414583e-06, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.08425137400627136, "step": 5815, "valid_targets_mean": 4901.0, "valid_targets_min": 1233 }, { "epoch": 4.987146529562982, "grad_norm": 0.47598116677152114, "learning_rate": 9.264421166019408e-06, "loss": 0.1441, "loss_nan_ranks": 0, "loss_rank_avg": 0.052196092903614044, "step": 5820, "valid_targets_mean": 4768.5, "valid_targets_min": 2056 }, { "epoch": 4.991431019708655, "grad_norm": 0.5278491426313316, "learning_rate": 9.228392463166082e-06, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.0845300629734993, "step": 5825, "valid_targets_mean": 7003.1, "valid_targets_min": 3785 }, { "epoch": 4.995715509854327, "grad_norm": 0.575656419690066, "learning_rate": 9.192412931321011e-06, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.09089523553848267, "step": 5830, "valid_targets_mean": 4330.6, "valid_targets_min": 1567 }, { "epoch": 5.0, "grad_norm": 0.536566562014675, "learning_rate": 9.156482734726147e-06, "loss": 0.173, "loss_nan_ranks": 0, "loss_rank_avg": 0.07456126809120178, "step": 5835, "valid_targets_mean": 5001.2, "valid_targets_min": 2780 }, { "epoch": 5.004284490145673, "grad_norm": 0.461679823419595, "learning_rate": 9.120602037398227e-06, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.05347277969121933, "step": 5840, "valid_targets_mean": 4582.1, "valid_targets_min": 2106 }, { "epoch": 5.008568980291345, "grad_norm": 0.5615618946463897, "learning_rate": 9.084771003128053e-06, "loss": 0.1404, "loss_nan_ranks": 0, "loss_rank_avg": 0.09778857976198196, "step": 5845, "valid_targets_mean": 5213.6, "valid_targets_min": 2510 }, { "epoch": 5.012853470437018, "grad_norm": 0.5224785906609419, "learning_rate": 9.048989795479697e-06, "loss": 0.1427, "loss_nan_ranks": 0, "loss_rank_avg": 0.06234997138381004, "step": 5850, "valid_targets_mean": 5434.2, "valid_targets_min": 3402 }, { "epoch": 5.017137960582691, "grad_norm": 0.558131422882269, "learning_rate": 9.013258577789778e-06, "loss": 0.1369, "loss_nan_ranks": 0, "loss_rank_avg": 0.06631478667259216, "step": 5855, "valid_targets_mean": 5814.6, "valid_targets_min": 887 }, { "epoch": 5.021422450728363, "grad_norm": 0.5007153060775194, "learning_rate": 8.977577513166745e-06, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.05998099595308304, "step": 5860, "valid_targets_mean": 5688.1, "valid_targets_min": 1945 }, { "epoch": 5.025706940874036, "grad_norm": 0.5457382272762462, "learning_rate": 8.941946764490075e-06, "loss": 0.1495, "loss_nan_ranks": 0, "loss_rank_avg": 0.05917572230100632, "step": 5865, "valid_targets_mean": 3900.0, "valid_targets_min": 863 }, { "epoch": 5.029991431019709, "grad_norm": 0.5654326331634673, "learning_rate": 8.906366494409572e-06, "loss": 0.1332, "loss_nan_ranks": 0, "loss_rank_avg": 0.0636155903339386, "step": 5870, "valid_targets_mean": 3952.5, "valid_targets_min": 1962 }, { "epoch": 5.034275921165381, "grad_norm": 0.5558719783166709, "learning_rate": 8.870836865344605e-06, "loss": 0.1436, "loss_nan_ranks": 0, "loss_rank_avg": 0.0862559899687767, "step": 5875, "valid_targets_mean": 6003.8, "valid_targets_min": 2878 }, { "epoch": 5.038560411311054, "grad_norm": 0.5931457187334572, "learning_rate": 8.83535803948339e-06, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.06579413264989853, "step": 5880, "valid_targets_mean": 3968.0, "valid_targets_min": 1049 }, { "epoch": 5.042844901456727, "grad_norm": 0.4926081340892514, "learning_rate": 8.799930178782217e-06, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.048622652888298035, "step": 5885, "valid_targets_mean": 5776.8, "valid_targets_min": 3088 }, { "epoch": 5.047129391602399, "grad_norm": 0.5043569545461065, "learning_rate": 8.764553444964727e-06, "loss": 0.1385, "loss_nan_ranks": 0, "loss_rank_avg": 0.06690607964992523, "step": 5890, "valid_targets_mean": 5154.6, "valid_targets_min": 1254 }, { "epoch": 5.051413881748072, "grad_norm": 0.570691437471372, "learning_rate": 8.72922799952117e-06, "loss": 0.1485, "loss_nan_ranks": 0, "loss_rank_avg": 0.0650261640548706, "step": 5895, "valid_targets_mean": 5009.9, "valid_targets_min": 2690 }, { "epoch": 5.055698371893745, "grad_norm": 0.544574579251449, "learning_rate": 8.693954003707696e-06, "loss": 0.1391, "loss_nan_ranks": 0, "loss_rank_avg": 0.07156353443861008, "step": 5900, "valid_targets_mean": 5317.2, "valid_targets_min": 2609 }, { "epoch": 5.059982862039417, "grad_norm": 0.5129014740792754, "learning_rate": 8.658731618545568e-06, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.06884966790676117, "step": 5905, "valid_targets_mean": 5266.9, "valid_targets_min": 2015 }, { "epoch": 5.06426735218509, "grad_norm": 0.557367027998699, "learning_rate": 8.623561004820453e-06, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.06522762775421143, "step": 5910, "valid_targets_mean": 4625.5, "valid_targets_min": 1500 }, { "epoch": 5.068551842330763, "grad_norm": 0.593029732278665, "learning_rate": 8.58844232308171e-06, "loss": 0.1381, "loss_nan_ranks": 0, "loss_rank_avg": 0.07211321592330933, "step": 5915, "valid_targets_mean": 5161.1, "valid_targets_min": 2515 }, { "epoch": 5.072836332476435, "grad_norm": 0.565911279068255, "learning_rate": 8.553375733641617e-06, "loss": 0.1343, "loss_nan_ranks": 0, "loss_rank_avg": 0.0606425404548645, "step": 5920, "valid_targets_mean": 4933.0, "valid_targets_min": 2762 }, { "epoch": 5.077120822622108, "grad_norm": 0.5706569662387289, "learning_rate": 8.518361396574659e-06, "loss": 0.1457, "loss_nan_ranks": 0, "loss_rank_avg": 0.08236978203058243, "step": 5925, "valid_targets_mean": 4947.5, "valid_targets_min": 2784 }, { "epoch": 5.081405312767781, "grad_norm": 0.5089594026928188, "learning_rate": 8.483399471716793e-06, "loss": 0.124, "loss_nan_ranks": 0, "loss_rank_avg": 0.05879615992307663, "step": 5930, "valid_targets_mean": 6075.5, "valid_targets_min": 2211 }, { "epoch": 5.085689802913453, "grad_norm": 0.5281032014270479, "learning_rate": 8.44849011866474e-06, "loss": 0.1338, "loss_nan_ranks": 0, "loss_rank_avg": 0.0665479302406311, "step": 5935, "valid_targets_mean": 6032.6, "valid_targets_min": 1734 }, { "epoch": 5.089974293059126, "grad_norm": 0.5773129793427175, "learning_rate": 8.413633496775209e-06, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.07037808746099472, "step": 5940, "valid_targets_mean": 4567.1, "valid_targets_min": 1981 }, { "epoch": 5.094258783204799, "grad_norm": 0.545253432414127, "learning_rate": 8.378829765164227e-06, "loss": 0.143, "loss_nan_ranks": 0, "loss_rank_avg": 0.06493847072124481, "step": 5945, "valid_targets_mean": 5403.6, "valid_targets_min": 1040 }, { "epoch": 5.098543273350471, "grad_norm": 0.5843283397967569, "learning_rate": 8.344079082706365e-06, "loss": 0.1409, "loss_nan_ranks": 0, "loss_rank_avg": 0.06504341959953308, "step": 5950, "valid_targets_mean": 5195.8, "valid_targets_min": 3061 }, { "epoch": 5.102827763496144, "grad_norm": 0.746729007527675, "learning_rate": 8.309381608034031e-06, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.07642590254545212, "step": 5955, "valid_targets_mean": 5460.0, "valid_targets_min": 3577 }, { "epoch": 5.107112253641817, "grad_norm": 0.5842968919515109, "learning_rate": 8.274737499536756e-06, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.0753287672996521, "step": 5960, "valid_targets_mean": 4521.8, "valid_targets_min": 952 }, { "epoch": 5.111396743787489, "grad_norm": 0.5470619824706553, "learning_rate": 8.240146915360446e-06, "loss": 0.1347, "loss_nan_ranks": 0, "loss_rank_avg": 0.0719161406159401, "step": 5965, "valid_targets_mean": 6245.6, "valid_targets_min": 4221 }, { "epoch": 5.115681233933162, "grad_norm": 0.5541965469691894, "learning_rate": 8.205610013406703e-06, "loss": 0.1399, "loss_nan_ranks": 0, "loss_rank_avg": 0.07677328586578369, "step": 5970, "valid_targets_mean": 4794.0, "valid_targets_min": 3034 }, { "epoch": 5.119965724078835, "grad_norm": 0.5665391192317706, "learning_rate": 8.17112695133204e-06, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.06618514657020569, "step": 5975, "valid_targets_mean": 4742.2, "valid_targets_min": 2004 }, { "epoch": 5.124250214224507, "grad_norm": 0.5762731737652794, "learning_rate": 8.136697886547235e-06, "loss": 0.1372, "loss_nan_ranks": 0, "loss_rank_avg": 0.07710222899913788, "step": 5980, "valid_targets_mean": 5326.2, "valid_targets_min": 2850 }, { "epoch": 5.12853470437018, "grad_norm": 0.6488573742379213, "learning_rate": 8.10232297621655e-06, "loss": 0.1407, "loss_nan_ranks": 0, "loss_rank_avg": 0.06464515626430511, "step": 5985, "valid_targets_mean": 6132.5, "valid_targets_min": 1318 }, { "epoch": 5.132819194515853, "grad_norm": 0.5668846483094866, "learning_rate": 8.068002377257047e-06, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.07700810581445694, "step": 5990, "valid_targets_mean": 5266.4, "valid_targets_min": 2162 }, { "epoch": 5.1371036846615254, "grad_norm": 0.6119562445788617, "learning_rate": 8.033736246337861e-06, "loss": 0.1367, "loss_nan_ranks": 0, "loss_rank_avg": 0.08774948120117188, "step": 5995, "valid_targets_mean": 4714.4, "valid_targets_min": 2076 }, { "epoch": 5.141388174807198, "grad_norm": 0.5803264364747844, "learning_rate": 7.999524739879486e-06, "loss": 0.1399, "loss_nan_ranks": 0, "loss_rank_avg": 0.07601134479045868, "step": 6000, "valid_targets_mean": 4622.2, "valid_targets_min": 2434 }, { "epoch": 5.145672664952871, "grad_norm": 0.5669247714040354, "learning_rate": 7.965368014053065e-06, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.0730358436703682, "step": 6005, "valid_targets_mean": 4821.9, "valid_targets_min": 1683 }, { "epoch": 5.1499571550985435, "grad_norm": 0.6008925220384994, "learning_rate": 7.931266224779688e-06, "loss": 0.1406, "loss_nan_ranks": 0, "loss_rank_avg": 0.06482844054698944, "step": 6010, "valid_targets_mean": 4140.9, "valid_targets_min": 1302 }, { "epoch": 5.154241645244216, "grad_norm": 0.6067676646670379, "learning_rate": 7.897219527729647e-06, "loss": 0.1433, "loss_nan_ranks": 0, "loss_rank_avg": 0.060043372213840485, "step": 6015, "valid_targets_mean": 3742.0, "valid_targets_min": 1625 }, { "epoch": 5.158526135389889, "grad_norm": 0.5562801412629258, "learning_rate": 7.863228078321748e-06, "loss": 0.1457, "loss_nan_ranks": 0, "loss_rank_avg": 0.08964170515537262, "step": 6020, "valid_targets_mean": 4821.4, "valid_targets_min": 3237 }, { "epoch": 5.1628106255355615, "grad_norm": 0.5677679608679317, "learning_rate": 7.829292031722605e-06, "loss": 0.1382, "loss_nan_ranks": 0, "loss_rank_avg": 0.07650621235370636, "step": 6025, "valid_targets_mean": 4806.0, "valid_targets_min": 1482 }, { "epoch": 5.167095115681234, "grad_norm": 0.6154466258539943, "learning_rate": 7.795411542845918e-06, "loss": 0.1417, "loss_nan_ranks": 0, "loss_rank_avg": 0.07820950448513031, "step": 6030, "valid_targets_mean": 4463.4, "valid_targets_min": 2484 }, { "epoch": 5.171379605826907, "grad_norm": 0.534700907388558, "learning_rate": 7.761586766351779e-06, "loss": 0.1396, "loss_nan_ranks": 0, "loss_rank_avg": 0.06325490772724152, "step": 6035, "valid_targets_mean": 5119.2, "valid_targets_min": 2836 }, { "epoch": 5.1756640959725795, "grad_norm": 0.6171116306561318, "learning_rate": 7.727817856645959e-06, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.0964316874742508, "step": 6040, "valid_targets_mean": 4525.8, "valid_targets_min": 1179 }, { "epoch": 5.179948586118252, "grad_norm": 0.49396649995838965, "learning_rate": 7.694104967879213e-06, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.0832238420844078, "step": 6045, "valid_targets_mean": 6017.9, "valid_targets_min": 2326 }, { "epoch": 5.184233076263925, "grad_norm": 0.5414578284712983, "learning_rate": 7.66044825394655e-06, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.09561492502689362, "step": 6050, "valid_targets_mean": 5810.4, "valid_targets_min": 3746 }, { "epoch": 5.1885175664095975, "grad_norm": 0.600524577834584, "learning_rate": 7.62684786848656e-06, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.05960875004529953, "step": 6055, "valid_targets_mean": 4689.1, "valid_targets_min": 1267 }, { "epoch": 5.19280205655527, "grad_norm": 0.5979465438640408, "learning_rate": 7.593303964880696e-06, "loss": 0.1366, "loss_nan_ranks": 0, "loss_rank_avg": 0.05936659500002861, "step": 6060, "valid_targets_mean": 4414.9, "valid_targets_min": 1569 }, { "epoch": 5.197086546700943, "grad_norm": 0.5581662135102559, "learning_rate": 7.559816696252573e-06, "loss": 0.1699, "loss_nan_ranks": 0, "loss_rank_avg": 0.06237490475177765, "step": 6065, "valid_targets_mean": 5152.8, "valid_targets_min": 1741 }, { "epoch": 5.2013710368466155, "grad_norm": 0.614944712657222, "learning_rate": 7.526386215467287e-06, "loss": 0.1273, "loss_nan_ranks": 0, "loss_rank_avg": 0.05573698878288269, "step": 6070, "valid_targets_mean": 4619.1, "valid_targets_min": 2424 }, { "epoch": 5.205655526992288, "grad_norm": 0.5765074497095739, "learning_rate": 7.493012675130711e-06, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.06293430924415588, "step": 6075, "valid_targets_mean": 4066.6, "valid_targets_min": 699 }, { "epoch": 5.209940017137961, "grad_norm": 0.6194830516991278, "learning_rate": 7.459696227588768e-06, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.08389878273010254, "step": 6080, "valid_targets_mean": 6030.9, "valid_targets_min": 2243 }, { "epoch": 5.2142245072836335, "grad_norm": 0.5820834048829306, "learning_rate": 7.426437024926774e-06, "loss": 0.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.06466574966907501, "step": 6085, "valid_targets_mean": 5668.6, "valid_targets_min": 3608 }, { "epoch": 5.218508997429306, "grad_norm": 0.6448838593097435, "learning_rate": 7.393235218968731e-06, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.0774383544921875, "step": 6090, "valid_targets_mean": 3682.6, "valid_targets_min": 1195 }, { "epoch": 5.222793487574979, "grad_norm": 0.5256021821677503, "learning_rate": 7.360090961276625e-06, "loss": 0.1351, "loss_nan_ranks": 0, "loss_rank_avg": 0.06239830330014229, "step": 6095, "valid_targets_mean": 4077.2, "valid_targets_min": 1100 }, { "epoch": 5.2270779777206515, "grad_norm": 0.5506695042512416, "learning_rate": 7.327004403149738e-06, "loss": 0.1332, "loss_nan_ranks": 0, "loss_rank_avg": 0.06670170277357101, "step": 6100, "valid_targets_mean": 5362.8, "valid_targets_min": 1035 }, { "epoch": 5.231362467866324, "grad_norm": 0.5494435488237343, "learning_rate": 7.293975695623981e-06, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.0640135109424591, "step": 6105, "valid_targets_mean": 4585.5, "valid_targets_min": 1389 }, { "epoch": 5.235646958011997, "grad_norm": 0.5741122933274755, "learning_rate": 7.261004989471172e-06, "loss": 0.1384, "loss_nan_ranks": 0, "loss_rank_avg": 0.08091049641370773, "step": 6110, "valid_targets_mean": 5247.6, "valid_targets_min": 1066 }, { "epoch": 5.2399314481576695, "grad_norm": 0.527100645437638, "learning_rate": 7.228092435198359e-06, "loss": 0.1357, "loss_nan_ranks": 0, "loss_rank_avg": 0.06724964827299118, "step": 6115, "valid_targets_mean": 4800.0, "valid_targets_min": 1681 }, { "epoch": 5.244215938303342, "grad_norm": 0.5732389963931994, "learning_rate": 7.195238183047133e-06, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.07661618292331696, "step": 6120, "valid_targets_mean": 5228.4, "valid_targets_min": 2611 }, { "epoch": 5.248500428449015, "grad_norm": 0.6371677881221045, "learning_rate": 7.1624423829929446e-06, "loss": 0.1344, "loss_nan_ranks": 0, "loss_rank_avg": 0.09487690031528473, "step": 6125, "valid_targets_mean": 5642.8, "valid_targets_min": 3309 }, { "epoch": 5.2527849185946875, "grad_norm": 0.5587444588268791, "learning_rate": 7.129705184744413e-06, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.09017151594161987, "step": 6130, "valid_targets_mean": 5733.6, "valid_targets_min": 3604 }, { "epoch": 5.25706940874036, "grad_norm": 0.5574414156904585, "learning_rate": 7.097026737742667e-06, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.05598699301481247, "step": 6135, "valid_targets_mean": 3445.1, "valid_targets_min": 1295 }, { "epoch": 5.261353898886033, "grad_norm": 0.5174736669960975, "learning_rate": 7.064407191160616e-06, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.07012724876403809, "step": 6140, "valid_targets_mean": 6463.2, "valid_targets_min": 3191 }, { "epoch": 5.265638389031706, "grad_norm": 0.5082834218010197, "learning_rate": 7.0318466939023264e-06, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.05886061489582062, "step": 6145, "valid_targets_mean": 6100.0, "valid_targets_min": 1874 }, { "epoch": 5.269922879177378, "grad_norm": 0.5548709879767999, "learning_rate": 6.999345394602286e-06, "loss": 0.1405, "loss_nan_ranks": 0, "loss_rank_avg": 0.08334115892648697, "step": 6150, "valid_targets_mean": 4543.4, "valid_targets_min": 2328 }, { "epoch": 5.274207369323051, "grad_norm": 0.5676546777822717, "learning_rate": 6.966903441624766e-06, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.05629216507077217, "step": 6155, "valid_targets_mean": 4842.1, "valid_targets_min": 1318 }, { "epoch": 5.278491859468724, "grad_norm": 0.6042159590416843, "learning_rate": 6.93452098306312e-06, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.06647060811519623, "step": 6160, "valid_targets_mean": 5053.8, "valid_targets_min": 1747 }, { "epoch": 5.282776349614396, "grad_norm": 0.6191709463886721, "learning_rate": 6.90219816673912e-06, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.0582103431224823, "step": 6165, "valid_targets_mean": 4129.1, "valid_targets_min": 1373 }, { "epoch": 5.287060839760069, "grad_norm": 0.5249507912952034, "learning_rate": 6.869935140202293e-06, "loss": 0.1302, "loss_nan_ranks": 0, "loss_rank_avg": 0.055291514843702316, "step": 6170, "valid_targets_mean": 5271.0, "valid_targets_min": 2146 }, { "epoch": 5.291345329905742, "grad_norm": 0.5156906152579579, "learning_rate": 6.837732050729207e-06, "loss": 0.1402, "loss_nan_ranks": 0, "loss_rank_avg": 0.06559474766254425, "step": 6175, "valid_targets_mean": 5878.5, "valid_targets_min": 1439 }, { "epoch": 5.295629820051414, "grad_norm": 0.592944268797725, "learning_rate": 6.805589045322854e-06, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.0791960209608078, "step": 6180, "valid_targets_mean": 5405.0, "valid_targets_min": 1577 }, { "epoch": 5.299914310197087, "grad_norm": 0.5999862846915844, "learning_rate": 6.773506270711925e-06, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.08896322548389435, "step": 6185, "valid_targets_mean": 5432.4, "valid_targets_min": 1440 }, { "epoch": 5.30419880034276, "grad_norm": 0.5263317224741103, "learning_rate": 6.741483873350181e-06, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.05374643951654434, "step": 6190, "valid_targets_mean": 6210.0, "valid_targets_min": 3094 }, { "epoch": 5.308483290488432, "grad_norm": 0.6235588769390094, "learning_rate": 6.709521999415753e-06, "loss": 0.1289, "loss_nan_ranks": 0, "loss_rank_avg": 0.06328782439231873, "step": 6195, "valid_targets_mean": 4310.1, "valid_targets_min": 2227 }, { "epoch": 5.312767780634105, "grad_norm": 0.567942608527058, "learning_rate": 6.677620794810513e-06, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.07411561161279678, "step": 6200, "valid_targets_mean": 5104.1, "valid_targets_min": 2564 }, { "epoch": 5.317052270779778, "grad_norm": 0.6366432620717134, "learning_rate": 6.6457804051593675e-06, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.06682665646076202, "step": 6205, "valid_targets_mean": 3957.5, "valid_targets_min": 929 }, { "epoch": 5.32133676092545, "grad_norm": 0.54498818017496, "learning_rate": 6.614000975809611e-06, "loss": 0.1358, "loss_nan_ranks": 0, "loss_rank_avg": 0.06897222250699997, "step": 6210, "valid_targets_mean": 5864.2, "valid_targets_min": 3570 }, { "epoch": 5.325621251071123, "grad_norm": 0.5459683344468065, "learning_rate": 6.582282651830274e-06, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.066863052546978, "step": 6215, "valid_targets_mean": 6395.4, "valid_targets_min": 1982 }, { "epoch": 5.329905741216796, "grad_norm": 0.5503926257381906, "learning_rate": 6.55062557801144e-06, "loss": 0.1478, "loss_nan_ranks": 0, "loss_rank_avg": 0.08532165735960007, "step": 6220, "valid_targets_mean": 4813.0, "valid_targets_min": 3996 }, { "epoch": 5.334190231362468, "grad_norm": 0.5895214744593827, "learning_rate": 6.519029898863594e-06, "loss": 0.145, "loss_nan_ranks": 0, "loss_rank_avg": 0.07670275866985321, "step": 6225, "valid_targets_mean": 4062.2, "valid_targets_min": 1206 }, { "epoch": 5.33847472150814, "grad_norm": 0.5638386205387821, "learning_rate": 6.487495758616953e-06, "loss": 0.1281, "loss_nan_ranks": 0, "loss_rank_avg": 0.08205410838127136, "step": 6230, "valid_targets_mean": 6390.1, "valid_targets_min": 1676 }, { "epoch": 5.342759211653814, "grad_norm": 0.5167616637272222, "learning_rate": 6.456023301220844e-06, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.06270787119865417, "step": 6235, "valid_targets_mean": 5502.0, "valid_targets_min": 1988 }, { "epoch": 5.347043701799485, "grad_norm": 0.5650143553238214, "learning_rate": 6.424612670342993e-06, "loss": 0.1449, "loss_nan_ranks": 0, "loss_rank_avg": 0.07442963123321533, "step": 6240, "valid_targets_mean": 5757.2, "valid_targets_min": 3118 }, { "epoch": 5.351328191945159, "grad_norm": 0.558072143781282, "learning_rate": 6.3932640093689e-06, "loss": 0.1383, "loss_nan_ranks": 0, "loss_rank_avg": 0.07415077835321426, "step": 6245, "valid_targets_mean": 5365.6, "valid_targets_min": 2881 }, { "epoch": 5.355612682090831, "grad_norm": 0.5233654550955804, "learning_rate": 6.361977461401201e-06, "loss": 0.1363, "loss_nan_ranks": 0, "loss_rank_avg": 0.06110835075378418, "step": 6250, "valid_targets_mean": 4701.1, "valid_targets_min": 1436 }, { "epoch": 5.359897172236504, "grad_norm": 0.5861788265596787, "learning_rate": 6.330753169258967e-06, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.055069178342819214, "step": 6255, "valid_targets_mean": 4977.6, "valid_targets_min": 1345 }, { "epoch": 5.364181662382176, "grad_norm": 0.5832531571711229, "learning_rate": 6.299591275477091e-06, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.07630908489227295, "step": 6260, "valid_targets_mean": 3914.6, "valid_targets_min": 2431 }, { "epoch": 5.36846615252785, "grad_norm": 0.5049380798779455, "learning_rate": 6.268491922305633e-06, "loss": 0.128, "loss_nan_ranks": 0, "loss_rank_avg": 0.06887591630220413, "step": 6265, "valid_targets_mean": 5875.1, "valid_targets_min": 4278 }, { "epoch": 5.372750642673521, "grad_norm": 0.6388268871126679, "learning_rate": 6.23745525170915e-06, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.06426230072975159, "step": 6270, "valid_targets_mean": 5025.6, "valid_targets_min": 1614 }, { "epoch": 5.377035132819195, "grad_norm": 0.5446159780516101, "learning_rate": 6.206481405366069e-06, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.08342628180980682, "step": 6275, "valid_targets_mean": 5403.2, "valid_targets_min": 2126 }, { "epoch": 5.381319622964867, "grad_norm": 0.5607310151212304, "learning_rate": 6.175570524668022e-06, "loss": 0.1355, "loss_nan_ranks": 0, "loss_rank_avg": 0.06648731231689453, "step": 6280, "valid_targets_mean": 5965.5, "valid_targets_min": 4029 }, { "epoch": 5.385604113110539, "grad_norm": 0.558085994371478, "learning_rate": 6.144722750719232e-06, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.07811075448989868, "step": 6285, "valid_targets_mean": 5506.6, "valid_targets_min": 3583 }, { "epoch": 5.389888603256212, "grad_norm": 0.5483846780131174, "learning_rate": 6.113938224335827e-06, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.07613667845726013, "step": 6290, "valid_targets_mean": 5975.0, "valid_targets_min": 3121 }, { "epoch": 5.394173093401885, "grad_norm": 0.5855194434955084, "learning_rate": 6.083217086045219e-06, "loss": 0.1384, "loss_nan_ranks": 0, "loss_rank_avg": 0.08013680577278137, "step": 6295, "valid_targets_mean": 4852.4, "valid_targets_min": 2089 }, { "epoch": 5.3984575835475574, "grad_norm": 0.5350669250301283, "learning_rate": 6.052559476085482e-06, "loss": 0.135, "loss_nan_ranks": 0, "loss_rank_avg": 0.06474751234054565, "step": 6300, "valid_targets_mean": 5435.9, "valid_targets_min": 2461 }, { "epoch": 5.40274207369323, "grad_norm": 0.58160460055041, "learning_rate": 6.021965534404672e-06, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.07002052664756775, "step": 6305, "valid_targets_mean": 4838.4, "valid_targets_min": 2493 }, { "epoch": 5.407026563838903, "grad_norm": 0.5396925657648401, "learning_rate": 5.991435400660213e-06, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.08394481986761093, "step": 6310, "valid_targets_mean": 6202.5, "valid_targets_min": 2967 }, { "epoch": 5.4113110539845755, "grad_norm": 0.5694513991424146, "learning_rate": 5.960969214218244e-06, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.08601640164852142, "step": 6315, "valid_targets_mean": 4850.4, "valid_targets_min": 1333 }, { "epoch": 5.415595544130248, "grad_norm": 0.5836812047602808, "learning_rate": 5.930567114153016e-06, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.0535474456846714, "step": 6320, "valid_targets_mean": 5394.1, "valid_targets_min": 2081 }, { "epoch": 5.419880034275921, "grad_norm": 0.6996982249932461, "learning_rate": 5.900229239246211e-06, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.07842926681041718, "step": 6325, "valid_targets_mean": 4914.5, "valid_targets_min": 2608 }, { "epoch": 5.4241645244215935, "grad_norm": 0.5927430432906213, "learning_rate": 5.869955727986352e-06, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.06343986839056015, "step": 6330, "valid_targets_mean": 4385.8, "valid_targets_min": 1844 }, { "epoch": 5.428449014567266, "grad_norm": 0.5615288154250935, "learning_rate": 5.839746718568131e-06, "loss": 0.1457, "loss_nan_ranks": 0, "loss_rank_avg": 0.07984130084514618, "step": 6335, "valid_targets_mean": 5323.0, "valid_targets_min": 2204 }, { "epoch": 5.432733504712939, "grad_norm": 0.5541340256670348, "learning_rate": 5.809602348891808e-06, "loss": 0.135, "loss_nan_ranks": 0, "loss_rank_avg": 0.061635490506887436, "step": 6340, "valid_targets_mean": 4427.9, "valid_targets_min": 2092 }, { "epoch": 5.4370179948586115, "grad_norm": 0.5960063481704528, "learning_rate": 5.779522756562563e-06, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.06906621158123016, "step": 6345, "valid_targets_mean": 5128.5, "valid_targets_min": 2339 }, { "epoch": 5.441302485004284, "grad_norm": 0.5661976276058973, "learning_rate": 5.749508078889881e-06, "loss": 0.1424, "loss_nan_ranks": 0, "loss_rank_avg": 0.06279657036066055, "step": 6350, "valid_targets_mean": 5162.1, "valid_targets_min": 2131 }, { "epoch": 5.445586975149957, "grad_norm": 0.5497893081216243, "learning_rate": 5.719558452886929e-06, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.0694722831249237, "step": 6355, "valid_targets_mean": 4845.1, "valid_targets_min": 2309 }, { "epoch": 5.4498714652956295, "grad_norm": 0.5163796487394642, "learning_rate": 5.689674015269901e-06, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.05982083082199097, "step": 6360, "valid_targets_mean": 6627.6, "valid_targets_min": 3133 }, { "epoch": 5.454155955441302, "grad_norm": 0.5471286635981826, "learning_rate": 5.6598549024574375e-06, "loss": 0.1383, "loss_nan_ranks": 0, "loss_rank_avg": 0.06936630606651306, "step": 6365, "valid_targets_mean": 5126.2, "valid_targets_min": 1611 }, { "epoch": 5.458440445586975, "grad_norm": 0.5944792407962814, "learning_rate": 5.6301012505699615e-06, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.07246899604797363, "step": 6370, "valid_targets_mean": 4889.1, "valid_targets_min": 1502 }, { "epoch": 5.4627249357326475, "grad_norm": 0.6361275513468415, "learning_rate": 5.600413195429082e-06, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.07020856440067291, "step": 6375, "valid_targets_mean": 5216.9, "valid_targets_min": 2034 }, { "epoch": 5.46700942587832, "grad_norm": 0.5612537422879182, "learning_rate": 5.570790872556966e-06, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.0894571989774704, "step": 6380, "valid_targets_mean": 6033.5, "valid_targets_min": 3294 }, { "epoch": 5.471293916023993, "grad_norm": 0.5000465417769924, "learning_rate": 5.541234417175718e-06, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.05969848483800888, "step": 6385, "valid_targets_mean": 5685.2, "valid_targets_min": 1363 }, { "epoch": 5.4755784061696655, "grad_norm": 0.6351891861499561, "learning_rate": 5.5117439642067725e-06, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.09923093765974045, "step": 6390, "valid_targets_mean": 4533.6, "valid_targets_min": 2594 }, { "epoch": 5.479862896315338, "grad_norm": 0.5210414729111282, "learning_rate": 5.482319648270278e-06, "loss": 0.1262, "loss_nan_ranks": 0, "loss_rank_avg": 0.0708557665348053, "step": 6395, "valid_targets_mean": 5451.4, "valid_targets_min": 1234 }, { "epoch": 5.484147386461011, "grad_norm": 0.5334767406234865, "learning_rate": 5.452961603684459e-06, "loss": 0.1408, "loss_nan_ranks": 0, "loss_rank_avg": 0.07409349828958511, "step": 6400, "valid_targets_mean": 6112.6, "valid_targets_min": 2179 }, { "epoch": 5.4884318766066835, "grad_norm": 0.5412429447282396, "learning_rate": 5.423669964465028e-06, "loss": 0.1449, "loss_nan_ranks": 0, "loss_rank_avg": 0.06016102433204651, "step": 6405, "valid_targets_mean": 5271.8, "valid_targets_min": 1831 }, { "epoch": 5.492716366752356, "grad_norm": 0.5818658258711826, "learning_rate": 5.394444864324564e-06, "loss": 0.1319, "loss_nan_ranks": 0, "loss_rank_avg": 0.0727088674902916, "step": 6410, "valid_targets_mean": 4549.9, "valid_targets_min": 1142 }, { "epoch": 5.497000856898029, "grad_norm": 0.5784324823124002, "learning_rate": 5.365286436671903e-06, "loss": 0.1473, "loss_nan_ranks": 0, "loss_rank_avg": 0.07919305562973022, "step": 6415, "valid_targets_mean": 4619.6, "valid_targets_min": 1724 }, { "epoch": 5.5012853470437015, "grad_norm": 0.5460056842645928, "learning_rate": 5.3361948146115306e-06, "loss": 0.1409, "loss_nan_ranks": 0, "loss_rank_avg": 0.063385508954525, "step": 6420, "valid_targets_mean": 4789.6, "valid_targets_min": 3603 }, { "epoch": 5.505569837189374, "grad_norm": 0.49938221905703617, "learning_rate": 5.307170130942976e-06, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.06451307237148285, "step": 6425, "valid_targets_mean": 6023.5, "valid_targets_min": 2947 }, { "epoch": 5.509854327335047, "grad_norm": 0.562066135955173, "learning_rate": 5.278212518160208e-06, "loss": 0.1303, "loss_nan_ranks": 0, "loss_rank_avg": 0.07842020690441132, "step": 6430, "valid_targets_mean": 5180.6, "valid_targets_min": 1873 }, { "epoch": 5.5141388174807195, "grad_norm": 0.5540925996211802, "learning_rate": 5.249322108451014e-06, "loss": 0.1347, "loss_nan_ranks": 0, "loss_rank_avg": 0.08028965443372726, "step": 6435, "valid_targets_mean": 5239.5, "valid_targets_min": 1830 }, { "epoch": 5.518423307626392, "grad_norm": 0.5073241633366583, "learning_rate": 5.220499033696409e-06, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.06025489419698715, "step": 6440, "valid_targets_mean": 4024.8, "valid_targets_min": 1668 }, { "epoch": 5.522707797772065, "grad_norm": 0.5717332273536765, "learning_rate": 5.191743425470039e-06, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.07372932136058807, "step": 6445, "valid_targets_mean": 5477.2, "valid_targets_min": 3413 }, { "epoch": 5.526992287917738, "grad_norm": 0.5215747809897383, "learning_rate": 5.163055415037565e-06, "loss": 0.1277, "loss_nan_ranks": 0, "loss_rank_avg": 0.0440630242228508, "step": 6450, "valid_targets_mean": 4580.2, "valid_targets_min": 1269 }, { "epoch": 5.53127677806341, "grad_norm": 0.5442611902593508, "learning_rate": 5.134435133356091e-06, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.06199388578534126, "step": 6455, "valid_targets_mean": 5632.6, "valid_targets_min": 2253 }, { "epoch": 5.535561268209083, "grad_norm": 0.6524942377050443, "learning_rate": 5.105882711073524e-06, "loss": 0.1343, "loss_nan_ranks": 0, "loss_rank_avg": 0.058554474264383316, "step": 6460, "valid_targets_mean": 4896.4, "valid_targets_min": 1597 }, { "epoch": 5.539845758354756, "grad_norm": 0.6548298261620451, "learning_rate": 5.077398278528023e-06, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.05502365902066231, "step": 6465, "valid_targets_mean": 4457.4, "valid_targets_min": 1757 }, { "epoch": 5.544130248500428, "grad_norm": 0.5792243897972685, "learning_rate": 5.04898196574737e-06, "loss": 0.1353, "loss_nan_ranks": 0, "loss_rank_avg": 0.0710696280002594, "step": 6470, "valid_targets_mean": 5837.4, "valid_targets_min": 1548 }, { "epoch": 5.548414738646101, "grad_norm": 0.5385213971717662, "learning_rate": 5.020633902448391e-06, "loss": 0.1303, "loss_nan_ranks": 0, "loss_rank_avg": 0.07189559936523438, "step": 6475, "valid_targets_mean": 5131.1, "valid_targets_min": 2320 }, { "epoch": 5.552699228791774, "grad_norm": 0.5951604508945392, "learning_rate": 4.992354218036362e-06, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.07350689172744751, "step": 6480, "valid_targets_mean": 3616.0, "valid_targets_min": 1744 }, { "epoch": 5.556983718937446, "grad_norm": 0.5223294450121244, "learning_rate": 4.9641430416044124e-06, "loss": 0.1336, "loss_nan_ranks": 0, "loss_rank_avg": 0.06630503386259079, "step": 6485, "valid_targets_mean": 5069.4, "valid_targets_min": 3190 }, { "epoch": 5.561268209083119, "grad_norm": 0.5302966929442247, "learning_rate": 4.93600050193296e-06, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.05977999418973923, "step": 6490, "valid_targets_mean": 5080.2, "valid_targets_min": 420 }, { "epoch": 5.565552699228792, "grad_norm": 0.5793933577454219, "learning_rate": 4.907926727489083e-06, "loss": 0.1341, "loss_nan_ranks": 0, "loss_rank_avg": 0.06778793036937714, "step": 6495, "valid_targets_mean": 5024.2, "valid_targets_min": 3738 }, { "epoch": 5.569837189374464, "grad_norm": 0.5749514354601191, "learning_rate": 4.879921846425972e-06, "loss": 0.1395, "loss_nan_ranks": 0, "loss_rank_avg": 0.07842457294464111, "step": 6500, "valid_targets_mean": 6434.0, "valid_targets_min": 2762 }, { "epoch": 5.574121679520137, "grad_norm": 0.5535613872524504, "learning_rate": 4.851985986582322e-06, "loss": 0.1399, "loss_nan_ranks": 0, "loss_rank_avg": 0.07504276931285858, "step": 6505, "valid_targets_mean": 4328.8, "valid_targets_min": 1916 }, { "epoch": 5.57840616966581, "grad_norm": 0.5083713146732084, "learning_rate": 4.8241192754817464e-06, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.051820166409015656, "step": 6510, "valid_targets_mean": 4595.5, "valid_targets_min": 1220 }, { "epoch": 5.582690659811482, "grad_norm": 0.5143527720674547, "learning_rate": 4.7963218403322095e-06, "loss": 0.135, "loss_nan_ranks": 0, "loss_rank_avg": 0.07099468261003494, "step": 6515, "valid_targets_mean": 5824.1, "valid_targets_min": 2822 }, { "epoch": 5.586975149957155, "grad_norm": 0.5586273797079392, "learning_rate": 4.76859380802545e-06, "loss": 0.1253, "loss_nan_ranks": 0, "loss_rank_avg": 0.07062015682458878, "step": 6520, "valid_targets_mean": 4951.0, "valid_targets_min": 1362 }, { "epoch": 5.591259640102828, "grad_norm": 0.5659530059931339, "learning_rate": 4.74093530513638e-06, "loss": 0.1298, "loss_nan_ranks": 0, "loss_rank_avg": 0.07185934484004974, "step": 6525, "valid_targets_mean": 4485.4, "valid_targets_min": 3572 }, { "epoch": 5.5955441302485, "grad_norm": 0.559165573881336, "learning_rate": 4.713346457922514e-06, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.07086736708879471, "step": 6530, "valid_targets_mean": 4172.9, "valid_targets_min": 1002 }, { "epoch": 5.599828620394173, "grad_norm": 0.6504390747344749, "learning_rate": 4.6858273923234145e-06, "loss": 0.1366, "loss_nan_ranks": 0, "loss_rank_avg": 0.064616858959198, "step": 6535, "valid_targets_mean": 4253.6, "valid_targets_min": 1969 }, { "epoch": 5.604113110539846, "grad_norm": 0.5689426033257432, "learning_rate": 4.658378233960088e-06, "loss": 0.1376, "loss_nan_ranks": 0, "loss_rank_avg": 0.05738406628370285, "step": 6540, "valid_targets_mean": 5430.6, "valid_targets_min": 2168 }, { "epoch": 5.608397600685518, "grad_norm": 0.6003852321277522, "learning_rate": 4.6309991081344215e-06, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.06764773279428482, "step": 6545, "valid_targets_mean": 4634.0, "valid_targets_min": 738 }, { "epoch": 5.612682090831191, "grad_norm": 0.5314130423969416, "learning_rate": 4.603690139828611e-06, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.063227578997612, "step": 6550, "valid_targets_mean": 5144.6, "valid_targets_min": 1834 }, { "epoch": 5.616966580976864, "grad_norm": 0.5519198942615016, "learning_rate": 4.576451453704614e-06, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.06084362044930458, "step": 6555, "valid_targets_mean": 4861.1, "valid_targets_min": 1124 }, { "epoch": 5.621251071122536, "grad_norm": 0.5085490164316521, "learning_rate": 4.549283174103529e-06, "loss": 0.1358, "loss_nan_ranks": 0, "loss_rank_avg": 0.05866881459951401, "step": 6560, "valid_targets_mean": 5328.1, "valid_targets_min": 3653 }, { "epoch": 5.625535561268209, "grad_norm": 0.5166410092324383, "learning_rate": 4.522185425045074e-06, "loss": 0.1361, "loss_nan_ranks": 0, "loss_rank_avg": 0.07482907176017761, "step": 6565, "valid_targets_mean": 5045.6, "valid_targets_min": 2124 }, { "epoch": 5.629820051413882, "grad_norm": 0.5735608739843969, "learning_rate": 4.495158330227005e-06, "loss": 0.1361, "loss_nan_ranks": 0, "loss_rank_avg": 0.08168354630470276, "step": 6570, "valid_targets_mean": 5395.8, "valid_targets_min": 4029 }, { "epoch": 5.634104541559554, "grad_norm": 0.5850271273841091, "learning_rate": 4.468202013024547e-06, "loss": 0.1318, "loss_nan_ranks": 0, "loss_rank_avg": 0.07387813925743103, "step": 6575, "valid_targets_mean": 4727.8, "valid_targets_min": 1939 }, { "epoch": 5.638389031705227, "grad_norm": 0.6816286906770415, "learning_rate": 4.441316596489826e-06, "loss": 0.1429, "loss_nan_ranks": 0, "loss_rank_avg": 0.09496738016605377, "step": 6580, "valid_targets_mean": 5681.8, "valid_targets_min": 720 }, { "epoch": 5.6426735218509, "grad_norm": 0.6492212601368968, "learning_rate": 4.414502203351336e-06, "loss": 0.1341, "loss_nan_ranks": 0, "loss_rank_avg": 0.08192385733127594, "step": 6585, "valid_targets_mean": 4593.8, "valid_targets_min": 2645 }, { "epoch": 5.646958011996572, "grad_norm": 0.5776686099072865, "learning_rate": 4.387758956013342e-06, "loss": 0.1509, "loss_nan_ranks": 0, "loss_rank_avg": 0.06738873571157455, "step": 6590, "valid_targets_mean": 3651.4, "valid_targets_min": 1737 }, { "epoch": 5.651242502142245, "grad_norm": 0.7273725593882753, "learning_rate": 4.361086976555336e-06, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.055989429354667664, "step": 6595, "valid_targets_mean": 5591.0, "valid_targets_min": 2574 }, { "epoch": 5.655526992287918, "grad_norm": 0.5714109431160903, "learning_rate": 4.334486386731487e-06, "loss": 0.1429, "loss_nan_ranks": 0, "loss_rank_avg": 0.06508769094944, "step": 6600, "valid_targets_mean": 4761.9, "valid_targets_min": 1046 }, { "epoch": 5.65981148243359, "grad_norm": 0.5476429325916928, "learning_rate": 4.307957307970085e-06, "loss": 0.1259, "loss_nan_ranks": 0, "loss_rank_avg": 0.06340515613555908, "step": 6605, "valid_targets_mean": 4844.9, "valid_targets_min": 2410 }, { "epoch": 5.664095972579263, "grad_norm": 0.5006033373634183, "learning_rate": 4.2814998613729755e-06, "loss": 0.1147, "loss_nan_ranks": 0, "loss_rank_avg": 0.05262615531682968, "step": 6610, "valid_targets_mean": 6462.6, "valid_targets_min": 5640 }, { "epoch": 5.668380462724936, "grad_norm": 0.5933953350490176, "learning_rate": 4.255114167715005e-06, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.07736065983772278, "step": 6615, "valid_targets_mean": 5382.6, "valid_targets_min": 2419 }, { "epoch": 5.672664952870608, "grad_norm": 0.5266374655195465, "learning_rate": 4.228800347443491e-06, "loss": 0.1305, "loss_nan_ranks": 0, "loss_rank_avg": 0.07201828062534332, "step": 6620, "valid_targets_mean": 5567.9, "valid_targets_min": 3669 }, { "epoch": 5.676949443016281, "grad_norm": 0.5898754476535092, "learning_rate": 4.202558520677651e-06, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.07570499181747437, "step": 6625, "valid_targets_mean": 4978.1, "valid_targets_min": 1173 }, { "epoch": 5.681233933161954, "grad_norm": 0.4991332472101233, "learning_rate": 4.17638880720806e-06, "loss": 0.1379, "loss_nan_ranks": 0, "loss_rank_avg": 0.05089268088340759, "step": 6630, "valid_targets_mean": 6274.0, "valid_targets_min": 3291 }, { "epoch": 5.685518423307626, "grad_norm": 0.5419759634610473, "learning_rate": 4.150291326496101e-06, "loss": 0.1413, "loss_nan_ranks": 0, "loss_rank_avg": 0.07586829364299774, "step": 6635, "valid_targets_mean": 5088.5, "valid_targets_min": 2381 }, { "epoch": 5.689802913453299, "grad_norm": 0.5441222779036342, "learning_rate": 4.1242661976734434e-06, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.04856753721833229, "step": 6640, "valid_targets_mean": 4978.9, "valid_targets_min": 1832 }, { "epoch": 5.694087403598972, "grad_norm": 0.6207196786094554, "learning_rate": 4.09831353954145e-06, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.0738341212272644, "step": 6645, "valid_targets_mean": 4128.1, "valid_targets_min": 1906 }, { "epoch": 5.698371893744644, "grad_norm": 0.5213327231009702, "learning_rate": 4.072433470570696e-06, "loss": 0.1395, "loss_nan_ranks": 0, "loss_rank_avg": 0.05955669283866882, "step": 6650, "valid_targets_mean": 4380.0, "valid_targets_min": 2072 }, { "epoch": 5.702656383890317, "grad_norm": 0.5453669018514253, "learning_rate": 4.046626108900369e-06, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.07227616012096405, "step": 6655, "valid_targets_mean": 5088.1, "valid_targets_min": 1736 }, { "epoch": 5.70694087403599, "grad_norm": 0.5739041238549919, "learning_rate": 4.0208915723377724e-06, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.08359837532043457, "step": 6660, "valid_targets_mean": 4858.0, "valid_targets_min": 2031 }, { "epoch": 5.711225364181662, "grad_norm": 0.5221244934963233, "learning_rate": 3.995229978357771e-06, "loss": 0.1351, "loss_nan_ranks": 0, "loss_rank_avg": 0.06315900385379791, "step": 6665, "valid_targets_mean": 5562.8, "valid_targets_min": 2966 }, { "epoch": 5.715509854327335, "grad_norm": 0.5293926691188072, "learning_rate": 3.969641444102241e-06, "loss": 0.1341, "loss_nan_ranks": 0, "loss_rank_avg": 0.0793573409318924, "step": 6670, "valid_targets_mean": 4634.9, "valid_targets_min": 3504 }, { "epoch": 5.719794344473008, "grad_norm": 0.5911683803276364, "learning_rate": 3.944126086379578e-06, "loss": 0.1405, "loss_nan_ranks": 0, "loss_rank_avg": 0.059656694531440735, "step": 6675, "valid_targets_mean": 4381.6, "valid_targets_min": 1091 }, { "epoch": 5.72407883461868, "grad_norm": 0.5868429249145188, "learning_rate": 3.9186840216641075e-06, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.07227806746959686, "step": 6680, "valid_targets_mean": 2916.5, "valid_targets_min": 869 }, { "epoch": 5.728363324764353, "grad_norm": 0.5684965723566315, "learning_rate": 3.893315366095609e-06, "loss": 0.1431, "loss_nan_ranks": 0, "loss_rank_avg": 0.0693536251783371, "step": 6685, "valid_targets_mean": 6093.6, "valid_targets_min": 2979 }, { "epoch": 5.732647814910026, "grad_norm": 0.5603873006925839, "learning_rate": 3.868020235478735e-06, "loss": 0.1347, "loss_nan_ranks": 0, "loss_rank_avg": 0.09165522456169128, "step": 6690, "valid_targets_mean": 5763.5, "valid_targets_min": 1445 }, { "epoch": 5.736932305055698, "grad_norm": 0.5469489775102141, "learning_rate": 3.842798745282521e-06, "loss": 0.1345, "loss_nan_ranks": 0, "loss_rank_avg": 0.058962516486644745, "step": 6695, "valid_targets_mean": 4978.2, "valid_targets_min": 2444 }, { "epoch": 5.741216795201371, "grad_norm": 0.6019679932692666, "learning_rate": 3.817651010639833e-06, "loss": 0.141, "loss_nan_ranks": 0, "loss_rank_avg": 0.07497408986091614, "step": 6700, "valid_targets_mean": 3552.8, "valid_targets_min": 1639 }, { "epoch": 5.745501285347044, "grad_norm": 0.6504758349385636, "learning_rate": 3.7925771463468564e-06, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.07307694852352142, "step": 6705, "valid_targets_mean": 3517.8, "valid_targets_min": 854 }, { "epoch": 5.749785775492716, "grad_norm": 0.5541217867040226, "learning_rate": 3.7675772668625765e-06, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.06129279360175133, "step": 6710, "valid_targets_mean": 5937.2, "valid_targets_min": 1195 }, { "epoch": 5.754070265638389, "grad_norm": 0.5592631375594215, "learning_rate": 3.742651486308233e-06, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.07175225019454956, "step": 6715, "valid_targets_mean": 5371.6, "valid_targets_min": 2908 }, { "epoch": 5.758354755784062, "grad_norm": 0.5535958969395064, "learning_rate": 3.7177999184668267e-06, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.09704683721065521, "step": 6720, "valid_targets_mean": 6141.8, "valid_targets_min": 2870 }, { "epoch": 5.762639245929734, "grad_norm": 0.5287083456633489, "learning_rate": 3.693022676782578e-06, "loss": 0.1379, "loss_nan_ranks": 0, "loss_rank_avg": 0.06492763757705688, "step": 6725, "valid_targets_mean": 5959.8, "valid_targets_min": 3981 }, { "epoch": 5.766923736075407, "grad_norm": 0.5235234483770389, "learning_rate": 3.6683198743604176e-06, "loss": 0.1414, "loss_nan_ranks": 0, "loss_rank_avg": 0.05290340632200241, "step": 6730, "valid_targets_mean": 5557.6, "valid_targets_min": 2775 }, { "epoch": 5.77120822622108, "grad_norm": 0.5744313280557972, "learning_rate": 3.6436916239654775e-06, "loss": 0.1384, "loss_nan_ranks": 0, "loss_rank_avg": 0.07471472024917603, "step": 6735, "valid_targets_mean": 5893.5, "valid_targets_min": 4005 }, { "epoch": 5.775492716366752, "grad_norm": 0.5191831107637773, "learning_rate": 3.619138038022558e-06, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.05435687303543091, "step": 6740, "valid_targets_mean": 6395.0, "valid_targets_min": 777 }, { "epoch": 5.779777206512425, "grad_norm": 0.5542420902763224, "learning_rate": 3.594659228615638e-06, "loss": 0.1419, "loss_nan_ranks": 0, "loss_rank_avg": 0.06281452625989914, "step": 6745, "valid_targets_mean": 4446.0, "valid_targets_min": 1787 }, { "epoch": 5.784061696658098, "grad_norm": 0.57109479507259, "learning_rate": 3.5702553074873515e-06, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.07405635714530945, "step": 6750, "valid_targets_mean": 5396.8, "valid_targets_min": 1616 }, { "epoch": 5.78834618680377, "grad_norm": 0.5845579805680661, "learning_rate": 3.5459263860384676e-06, "loss": 0.139, "loss_nan_ranks": 0, "loss_rank_avg": 0.0800202414393425, "step": 6755, "valid_targets_mean": 5868.5, "valid_targets_min": 2093 }, { "epoch": 5.792630676949443, "grad_norm": 0.5083013565986827, "learning_rate": 3.521672575327393e-06, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.054221805185079575, "step": 6760, "valid_targets_mean": 6155.0, "valid_targets_min": 1994 }, { "epoch": 5.796915167095116, "grad_norm": 0.5761850082494403, "learning_rate": 3.4974939860696667e-06, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.05445557087659836, "step": 6765, "valid_targets_mean": 3601.5, "valid_targets_min": 876 }, { "epoch": 5.8011996572407885, "grad_norm": 0.638371981329725, "learning_rate": 3.473390728637447e-06, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.07390281558036804, "step": 6770, "valid_targets_mean": 3327.8, "valid_targets_min": 1259 }, { "epoch": 5.805484147386461, "grad_norm": 0.7196984139985203, "learning_rate": 3.4493629130590246e-06, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.07923655956983566, "step": 6775, "valid_targets_mean": 4779.0, "valid_targets_min": 1021 }, { "epoch": 5.809768637532134, "grad_norm": 0.5267892321366978, "learning_rate": 3.425410649018288e-06, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.05486609786748886, "step": 6780, "valid_targets_mean": 4125.4, "valid_targets_min": 1208 }, { "epoch": 5.8140531276778065, "grad_norm": 0.4997215023511863, "learning_rate": 3.4015340458542667e-06, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.06113504618406296, "step": 6785, "valid_targets_mean": 6006.1, "valid_targets_min": 2393 }, { "epoch": 5.818337617823479, "grad_norm": 0.5803591765288956, "learning_rate": 3.3777332125605876e-06, "loss": 0.1411, "loss_nan_ranks": 0, "loss_rank_avg": 0.0857536643743515, "step": 6790, "valid_targets_mean": 4885.4, "valid_targets_min": 1143 }, { "epoch": 5.822622107969152, "grad_norm": 0.6302037090494906, "learning_rate": 3.354008257785004e-06, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.06109432876110077, "step": 6795, "valid_targets_mean": 4721.6, "valid_targets_min": 996 }, { "epoch": 5.8269065981148245, "grad_norm": 0.5321710621405683, "learning_rate": 3.3303592898288996e-06, "loss": 0.1341, "loss_nan_ranks": 0, "loss_rank_avg": 0.06634179502725601, "step": 6800, "valid_targets_mean": 5669.6, "valid_targets_min": 2958 }, { "epoch": 5.831191088260497, "grad_norm": 0.5265118919796228, "learning_rate": 3.3067864166467724e-06, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.06433935463428497, "step": 6805, "valid_targets_mean": 5867.8, "valid_targets_min": 1720 }, { "epoch": 5.83547557840617, "grad_norm": 0.6185168294053308, "learning_rate": 3.2832897458457746e-06, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.0700758695602417, "step": 6810, "valid_targets_mean": 4015.1, "valid_targets_min": 1654 }, { "epoch": 5.8397600685518425, "grad_norm": 0.5574030938626355, "learning_rate": 3.2598693846852037e-06, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.06746580451726913, "step": 6815, "valid_targets_mean": 5562.1, "valid_targets_min": 3556 }, { "epoch": 5.844044558697515, "grad_norm": 0.544442153355723, "learning_rate": 3.2365254400760036e-06, "loss": 0.1404, "loss_nan_ranks": 0, "loss_rank_avg": 0.09361623972654343, "step": 6820, "valid_targets_mean": 5243.6, "valid_targets_min": 1166 }, { "epoch": 5.848329048843188, "grad_norm": 0.5254064816831592, "learning_rate": 3.2132580185802876e-06, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.051424961537122726, "step": 6825, "valid_targets_mean": 5415.0, "valid_targets_min": 3837 }, { "epoch": 5.8526135389888605, "grad_norm": 0.5915974965701197, "learning_rate": 3.190067226410858e-06, "loss": 0.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.08004424721002579, "step": 6830, "valid_targets_mean": 5658.2, "valid_targets_min": 3150 }, { "epoch": 5.856898029134533, "grad_norm": 0.504995306642246, "learning_rate": 3.1669531694307e-06, "loss": 0.1319, "loss_nan_ranks": 0, "loss_rank_avg": 0.041914355009794235, "step": 6835, "valid_targets_mean": 5900.6, "valid_targets_min": 2968 }, { "epoch": 5.861182519280206, "grad_norm": 0.6108621619033056, "learning_rate": 3.1439159531525344e-06, "loss": 0.1379, "loss_nan_ranks": 0, "loss_rank_avg": 0.068336620926857, "step": 6840, "valid_targets_mean": 5198.2, "valid_targets_min": 1241 }, { "epoch": 5.8654670094258785, "grad_norm": 0.5372951593834955, "learning_rate": 3.1209556827382915e-06, "loss": 0.1414, "loss_nan_ranks": 0, "loss_rank_avg": 0.05392158031463623, "step": 6845, "valid_targets_mean": 4665.5, "valid_targets_min": 1243 }, { "epoch": 5.869751499571551, "grad_norm": 0.5427030654594667, "learning_rate": 3.098072462998671e-06, "loss": 0.1338, "loss_nan_ranks": 0, "loss_rank_avg": 0.06130759045481682, "step": 6850, "valid_targets_mean": 5294.8, "valid_targets_min": 1186 }, { "epoch": 5.874035989717224, "grad_norm": 0.5551297016793235, "learning_rate": 3.07526639839264e-06, "loss": 0.1355, "loss_nan_ranks": 0, "loss_rank_avg": 0.07664550840854645, "step": 6855, "valid_targets_mean": 6137.0, "valid_targets_min": 3194 }, { "epoch": 5.8783204798628965, "grad_norm": 0.552587788514632, "learning_rate": 3.0525375930269584e-06, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.07360447943210602, "step": 6860, "valid_targets_mean": 5645.5, "valid_targets_min": 2589 }, { "epoch": 5.882604970008569, "grad_norm": 0.5800728441639016, "learning_rate": 3.0298861506557076e-06, "loss": 0.138, "loss_nan_ranks": 0, "loss_rank_avg": 0.057409510016441345, "step": 6865, "valid_targets_mean": 4250.6, "valid_targets_min": 1360 }, { "epoch": 5.886889460154242, "grad_norm": 0.5472337989778477, "learning_rate": 3.0073121746798196e-06, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.053992968052625656, "step": 6870, "valid_targets_mean": 5314.0, "valid_targets_min": 1640 }, { "epoch": 5.8911739502999145, "grad_norm": 0.5339616139250007, "learning_rate": 2.9848157681466093e-06, "loss": 0.123, "loss_nan_ranks": 0, "loss_rank_avg": 0.06431794911623001, "step": 6875, "valid_targets_mean": 4802.9, "valid_targets_min": 1410 }, { "epoch": 5.895458440445587, "grad_norm": 0.5851089093746733, "learning_rate": 2.96239703374928e-06, "loss": 0.1421, "loss_nan_ranks": 0, "loss_rank_avg": 0.07572221010923386, "step": 6880, "valid_targets_mean": 5150.2, "valid_targets_min": 3099 }, { "epoch": 5.89974293059126, "grad_norm": 0.5482802919748951, "learning_rate": 2.940056073826494e-06, "loss": 0.1323, "loss_nan_ranks": 0, "loss_rank_avg": 0.05965782329440117, "step": 6885, "valid_targets_mean": 5102.5, "valid_targets_min": 1197 }, { "epoch": 5.9040274207369325, "grad_norm": 0.5859800632364757, "learning_rate": 2.917792990361863e-06, "loss": 0.1284, "loss_nan_ranks": 0, "loss_rank_avg": 0.06816573441028595, "step": 6890, "valid_targets_mean": 4878.9, "valid_targets_min": 2223 }, { "epoch": 5.908311910882605, "grad_norm": 0.5243638339363336, "learning_rate": 2.8956078849835133e-06, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.05222854018211365, "step": 6895, "valid_targets_mean": 6770.0, "valid_targets_min": 3501 }, { "epoch": 5.912596401028278, "grad_norm": 0.6186882882901905, "learning_rate": 2.873500858963607e-06, "loss": 0.1297, "loss_nan_ranks": 0, "loss_rank_avg": 0.04518494755029678, "step": 6900, "valid_targets_mean": 4287.5, "valid_targets_min": 922 }, { "epoch": 5.9168808911739506, "grad_norm": 0.5803000774619191, "learning_rate": 2.85147201321788e-06, "loss": 0.1409, "loss_nan_ranks": 0, "loss_rank_avg": 0.08812421560287476, "step": 6905, "valid_targets_mean": 4709.4, "valid_targets_min": 2221 }, { "epoch": 5.921165381319623, "grad_norm": 0.6531158925885155, "learning_rate": 2.829521448305199e-06, "loss": 0.1465, "loss_nan_ranks": 0, "loss_rank_avg": 0.08043619245290756, "step": 6910, "valid_targets_mean": 4030.8, "valid_targets_min": 1831 }, { "epoch": 5.925449871465296, "grad_norm": 0.6188264080269267, "learning_rate": 2.807649264427079e-06, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.09220334887504578, "step": 6915, "valid_targets_mean": 4534.5, "valid_targets_min": 2656 }, { "epoch": 5.929734361610969, "grad_norm": 0.5381152998325993, "learning_rate": 2.785855561427231e-06, "loss": 0.1398, "loss_nan_ranks": 0, "loss_rank_avg": 0.05605997145175934, "step": 6920, "valid_targets_mean": 5281.2, "valid_targets_min": 3046 }, { "epoch": 5.934018851756641, "grad_norm": 0.5777102355387708, "learning_rate": 2.7641404387911253e-06, "loss": 0.1401, "loss_nan_ranks": 0, "loss_rank_avg": 0.08713674545288086, "step": 6925, "valid_targets_mean": 5400.8, "valid_targets_min": 2651 }, { "epoch": 5.938303341902314, "grad_norm": 0.7710764345542876, "learning_rate": 2.7425039956455113e-06, "loss": 0.1451, "loss_nan_ranks": 0, "loss_rank_avg": 0.08280148357152939, "step": 6930, "valid_targets_mean": 5259.6, "valid_targets_min": 1085 }, { "epoch": 5.942587832047987, "grad_norm": 0.49364547735421227, "learning_rate": 2.720946330757972e-06, "loss": 0.137, "loss_nan_ranks": 0, "loss_rank_avg": 0.06348837912082672, "step": 6935, "valid_targets_mean": 5807.9, "valid_targets_min": 3536 }, { "epoch": 5.946872322193659, "grad_norm": 0.6205905188458044, "learning_rate": 2.699467542536498e-06, "loss": 0.1357, "loss_nan_ranks": 0, "loss_rank_avg": 0.11586824059486389, "step": 6940, "valid_targets_mean": 6235.1, "valid_targets_min": 2918 }, { "epoch": 5.951156812339332, "grad_norm": 0.6084874967670024, "learning_rate": 2.678067729028999e-06, "loss": 0.1437, "loss_nan_ranks": 0, "loss_rank_avg": 0.0647452175617218, "step": 6945, "valid_targets_mean": 3589.9, "valid_targets_min": 505 }, { "epoch": 5.955441302485005, "grad_norm": 0.5973192224285923, "learning_rate": 2.6567469879228824e-06, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.07049669325351715, "step": 6950, "valid_targets_mean": 4123.8, "valid_targets_min": 1399 }, { "epoch": 5.959725792630677, "grad_norm": 0.6208232920444805, "learning_rate": 2.635505416544595e-06, "loss": 0.1364, "loss_nan_ranks": 0, "loss_rank_avg": 0.0627826675772667, "step": 6955, "valid_targets_mean": 4860.9, "valid_targets_min": 1282 }, { "epoch": 5.96401028277635, "grad_norm": 0.5267484487748498, "learning_rate": 2.6143431118591967e-06, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.08430700749158859, "step": 6960, "valid_targets_mean": 5536.1, "valid_targets_min": 4115 }, { "epoch": 5.968294772922023, "grad_norm": 0.5496591230529959, "learning_rate": 2.593260170469891e-06, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.0636175125837326, "step": 6965, "valid_targets_mean": 5769.9, "valid_targets_min": 2399 }, { "epoch": 5.972579263067695, "grad_norm": 0.4920257881440762, "learning_rate": 2.5722566886176047e-06, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.054918207228183746, "step": 6970, "valid_targets_mean": 5959.6, "valid_targets_min": 2296 }, { "epoch": 5.976863753213368, "grad_norm": 0.6577430899430436, "learning_rate": 2.5513327621805473e-06, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.07874983549118042, "step": 6975, "valid_targets_mean": 4578.1, "valid_targets_min": 1934 }, { "epoch": 5.981148243359041, "grad_norm": 0.5192838115792693, "learning_rate": 2.530488486673757e-06, "loss": 0.1368, "loss_nan_ranks": 0, "loss_rank_avg": 0.06696130335330963, "step": 6980, "valid_targets_mean": 5333.2, "valid_targets_min": 2213 }, { "epoch": 5.985432733504713, "grad_norm": 0.5527558283403213, "learning_rate": 2.50972395724868e-06, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.0464884415268898, "step": 6985, "valid_targets_mean": 4953.5, "valid_targets_min": 988 }, { "epoch": 5.989717223650386, "grad_norm": 0.5352427081717313, "learning_rate": 2.48903926869273e-06, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.0705413892865181, "step": 6990, "valid_targets_mean": 5753.9, "valid_targets_min": 4252 }, { "epoch": 5.994001713796059, "grad_norm": 0.5714701782964342, "learning_rate": 2.468434515428868e-06, "loss": 0.1581, "loss_nan_ranks": 0, "loss_rank_avg": 0.07364567369222641, "step": 6995, "valid_targets_mean": 4093.5, "valid_targets_min": 2187 }, { "epoch": 5.998286203941731, "grad_norm": 0.5603266143505143, "learning_rate": 2.4479097915151438e-06, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.0819477066397667, "step": 7000, "valid_targets_mean": 5255.8, "valid_targets_min": 2270 }, { "epoch": 6.002570694087404, "grad_norm": 0.5617902857898495, "learning_rate": 2.4274651906443026e-06, "loss": 0.1349, "loss_nan_ranks": 0, "loss_rank_avg": 0.07298682630062103, "step": 7005, "valid_targets_mean": 6007.9, "valid_targets_min": 3138 }, { "epoch": 6.006855184233077, "grad_norm": 0.5590701329433548, "learning_rate": 2.407100806143321e-06, "loss": 0.1307, "loss_nan_ranks": 0, "loss_rank_avg": 0.056523799896240234, "step": 7010, "valid_targets_mean": 4618.4, "valid_targets_min": 2404 }, { "epoch": 6.011139674378749, "grad_norm": 0.5314159056896909, "learning_rate": 2.386816730973005e-06, "loss": 0.1347, "loss_nan_ranks": 0, "loss_rank_avg": 0.05974011868238449, "step": 7015, "valid_targets_mean": 5098.0, "valid_targets_min": 2011 }, { "epoch": 6.015424164524422, "grad_norm": 0.5636771573961143, "learning_rate": 2.3666130577275604e-06, "loss": 0.1422, "loss_nan_ranks": 0, "loss_rank_avg": 0.07339408248662949, "step": 7020, "valid_targets_mean": 4734.5, "valid_targets_min": 1748 }, { "epoch": 6.019708654670095, "grad_norm": 0.5435129863456174, "learning_rate": 2.3464898786341615e-06, "loss": 0.1258, "loss_nan_ranks": 0, "loss_rank_avg": 0.06307528913021088, "step": 7025, "valid_targets_mean": 4226.4, "valid_targets_min": 2028 }, { "epoch": 6.023993144815767, "grad_norm": 0.5315069862433984, "learning_rate": 2.3264472855525532e-06, "loss": 0.123, "loss_nan_ranks": 0, "loss_rank_avg": 0.06738060712814331, "step": 7030, "valid_targets_mean": 5815.2, "valid_targets_min": 3714 }, { "epoch": 6.02827763496144, "grad_norm": 0.4855041602382719, "learning_rate": 2.3064853699745936e-06, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.05301181226968765, "step": 7035, "valid_targets_mean": 6482.8, "valid_targets_min": 3550 }, { "epoch": 6.032562125107113, "grad_norm": 0.5294378234912969, "learning_rate": 2.2866042230238804e-06, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.061131253838539124, "step": 7040, "valid_targets_mean": 6033.4, "valid_targets_min": 3134 }, { "epoch": 6.036846615252785, "grad_norm": 0.5273015137391548, "learning_rate": 2.266803935455295e-06, "loss": 0.1227, "loss_nan_ranks": 0, "loss_rank_avg": 0.0604885071516037, "step": 7045, "valid_targets_mean": 5655.1, "valid_targets_min": 1845 }, { "epoch": 6.041131105398458, "grad_norm": 0.5952816902680278, "learning_rate": 2.2470845976546163e-06, "loss": 0.1244, "loss_nan_ranks": 0, "loss_rank_avg": 0.06316784024238586, "step": 7050, "valid_targets_mean": 5000.8, "valid_targets_min": 1318 }, { "epoch": 6.045415595544131, "grad_norm": 0.5949149831620895, "learning_rate": 2.227446299638092e-06, "loss": 0.136, "loss_nan_ranks": 0, "loss_rank_avg": 0.08699578046798706, "step": 7055, "valid_targets_mean": 5022.2, "valid_targets_min": 2303 }, { "epoch": 6.049700085689803, "grad_norm": 0.5432610582498822, "learning_rate": 2.2078891310520346e-06, "loss": 0.1278, "loss_nan_ranks": 0, "loss_rank_avg": 0.05387689173221588, "step": 7060, "valid_targets_mean": 3837.4, "valid_targets_min": 1804 }, { "epoch": 6.053984575835476, "grad_norm": 0.5661465570912795, "learning_rate": 2.188413181172415e-06, "loss": 0.1377, "loss_nan_ranks": 0, "loss_rank_avg": 0.06640972197055817, "step": 7065, "valid_targets_mean": 3869.1, "valid_targets_min": 1786 }, { "epoch": 6.058269065981149, "grad_norm": 0.5711416361143601, "learning_rate": 2.169018538904455e-06, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.0669720321893692, "step": 7070, "valid_targets_mean": 6166.6, "valid_targets_min": 2563 }, { "epoch": 6.062553556126821, "grad_norm": 0.6060473922843284, "learning_rate": 2.149705292782205e-06, "loss": 0.1329, "loss_nan_ranks": 0, "loss_rank_avg": 0.06459236145019531, "step": 7075, "valid_targets_mean": 4371.8, "valid_targets_min": 2106 }, { "epoch": 6.066838046272494, "grad_norm": 0.5258787232106485, "learning_rate": 2.13047353096816e-06, "loss": 0.1369, "loss_nan_ranks": 0, "loss_rank_avg": 0.05734770745038986, "step": 7080, "valid_targets_mean": 4410.9, "valid_targets_min": 1790 }, { "epoch": 6.071122536418166, "grad_norm": 0.5835317414829356, "learning_rate": 2.111323341252851e-06, "loss": 0.128, "loss_nan_ranks": 0, "loss_rank_avg": 0.07886640727519989, "step": 7085, "valid_targets_mean": 4713.9, "valid_targets_min": 1312 }, { "epoch": 6.075407026563839, "grad_norm": 0.5824598357112564, "learning_rate": 2.092254811054437e-06, "loss": 0.1277, "loss_nan_ranks": 0, "loss_rank_avg": 0.07371959835290909, "step": 7090, "valid_targets_mean": 5103.1, "valid_targets_min": 1558 }, { "epoch": 6.079691516709511, "grad_norm": 0.5772979309118111, "learning_rate": 2.073268027418314e-06, "loss": 0.1186, "loss_nan_ranks": 0, "loss_rank_avg": 0.07025423645973206, "step": 7095, "valid_targets_mean": 4879.0, "valid_targets_min": 1787 }, { "epoch": 6.083976006855184, "grad_norm": 0.5759877981086569, "learning_rate": 2.0543630770167166e-06, "loss": 0.1285, "loss_nan_ranks": 0, "loss_rank_avg": 0.09002973884344101, "step": 7100, "valid_targets_mean": 5280.8, "valid_targets_min": 2574 }, { "epoch": 6.0882604970008565, "grad_norm": 0.5319451711483659, "learning_rate": 2.0355400461483278e-06, "loss": 0.1439, "loss_nan_ranks": 0, "loss_rank_avg": 0.057267673313617706, "step": 7105, "valid_targets_mean": 4528.5, "valid_targets_min": 1902 }, { "epoch": 6.092544987146529, "grad_norm": 0.5722236613500173, "learning_rate": 2.0167990207378696e-06, "loss": 0.1355, "loss_nan_ranks": 0, "loss_rank_avg": 0.06940978765487671, "step": 7110, "valid_targets_mean": 4825.8, "valid_targets_min": 793 }, { "epoch": 6.096829477292202, "grad_norm": 0.5990088640600807, "learning_rate": 1.998140086335718e-06, "loss": 0.134, "loss_nan_ranks": 0, "loss_rank_avg": 0.0675596296787262, "step": 7115, "valid_targets_mean": 4574.1, "valid_targets_min": 797 }, { "epoch": 6.1011139674378745, "grad_norm": 0.5801047706770528, "learning_rate": 1.97956332811752e-06, "loss": 0.1155, "loss_nan_ranks": 0, "loss_rank_avg": 0.055842798203229904, "step": 7120, "valid_targets_mean": 4754.4, "valid_targets_min": 1071 }, { "epoch": 6.105398457583547, "grad_norm": 0.6048377130053119, "learning_rate": 1.96106883088379e-06, "loss": 0.1395, "loss_nan_ranks": 0, "loss_rank_avg": 0.07217507064342499, "step": 7125, "valid_targets_mean": 4534.0, "valid_targets_min": 2138 }, { "epoch": 6.10968294772922, "grad_norm": 0.520549717902676, "learning_rate": 1.942656679059547e-06, "loss": 0.1219, "loss_nan_ranks": 0, "loss_rank_avg": 0.06939978897571564, "step": 7130, "valid_targets_mean": 5840.8, "valid_targets_min": 2292 }, { "epoch": 6.1139674378748925, "grad_norm": 0.570791137709158, "learning_rate": 1.924326956693905e-06, "loss": 0.1274, "loss_nan_ranks": 0, "loss_rank_avg": 0.07258065789937973, "step": 7135, "valid_targets_mean": 4443.1, "valid_targets_min": 1876 }, { "epoch": 6.118251928020565, "grad_norm": 0.49546155449057244, "learning_rate": 1.906079747459695e-06, "loss": 0.1355, "loss_nan_ranks": 0, "loss_rank_avg": 0.05577601492404938, "step": 7140, "valid_targets_mean": 5838.4, "valid_targets_min": 3043 }, { "epoch": 6.122536418166238, "grad_norm": 0.6098928236472626, "learning_rate": 1.8879151346530889e-06, "loss": 0.138, "loss_nan_ranks": 0, "loss_rank_avg": 0.07786683738231659, "step": 7145, "valid_targets_mean": 4605.0, "valid_targets_min": 671 }, { "epoch": 6.1268209083119105, "grad_norm": 0.5765047245134982, "learning_rate": 1.8698332011932164e-06, "loss": 0.1327, "loss_nan_ranks": 0, "loss_rank_avg": 0.053650569170713425, "step": 7150, "valid_targets_mean": 4318.0, "valid_targets_min": 1250 }, { "epoch": 6.131105398457583, "grad_norm": 1.6491384383257206, "learning_rate": 1.8518340296217907e-06, "loss": 0.1362, "loss_nan_ranks": 0, "loss_rank_avg": 0.05434166640043259, "step": 7155, "valid_targets_mean": 5819.2, "valid_targets_min": 2102 }, { "epoch": 6.135389888603256, "grad_norm": 0.5471148417542772, "learning_rate": 1.8339177021027144e-06, "loss": 0.1332, "loss_nan_ranks": 0, "loss_rank_avg": 0.07945186644792557, "step": 7160, "valid_targets_mean": 5115.5, "valid_targets_min": 1679 }, { "epoch": 6.1396743787489285, "grad_norm": 0.6043050620509512, "learning_rate": 1.8160843004217344e-06, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.06661148369312286, "step": 7165, "valid_targets_mean": 4373.0, "valid_targets_min": 1373 }, { "epoch": 6.143958868894601, "grad_norm": 0.5942375631504286, "learning_rate": 1.7983339059860472e-06, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.0706518292427063, "step": 7170, "valid_targets_mean": 4559.2, "valid_targets_min": 3384 }, { "epoch": 6.148243359040274, "grad_norm": 0.6161555629304948, "learning_rate": 1.780666599823926e-06, "loss": 0.1361, "loss_nan_ranks": 0, "loss_rank_avg": 0.06862369924783707, "step": 7175, "valid_targets_mean": 4812.8, "valid_targets_min": 2162 }, { "epoch": 6.1525278491859465, "grad_norm": 0.5570310289376202, "learning_rate": 1.7630824625843579e-06, "loss": 0.1262, "loss_nan_ranks": 0, "loss_rank_avg": 0.05563248693943024, "step": 7180, "valid_targets_mean": 5118.5, "valid_targets_min": 1578 }, { "epoch": 6.156812339331619, "grad_norm": 0.5565818568350045, "learning_rate": 1.745581574536679e-06, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.07531631737947464, "step": 7185, "valid_targets_mean": 5362.5, "valid_targets_min": 1126 }, { "epoch": 6.161096829477292, "grad_norm": 0.5474402626627962, "learning_rate": 1.728164015570195e-06, "loss": 0.1267, "loss_nan_ranks": 0, "loss_rank_avg": 0.05338769778609276, "step": 7190, "valid_targets_mean": 5042.5, "valid_targets_min": 2566 }, { "epoch": 6.1653813196229645, "grad_norm": 0.5006188609732733, "learning_rate": 1.7108298651938393e-06, "loss": 0.134, "loss_nan_ranks": 0, "loss_rank_avg": 0.04690549895167351, "step": 7195, "valid_targets_mean": 6448.0, "valid_targets_min": 4129 }, { "epoch": 6.169665809768637, "grad_norm": 0.6054830426470936, "learning_rate": 1.69357920253578e-06, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.052494410425424576, "step": 7200, "valid_targets_mean": 3395.1, "valid_targets_min": 1208 }, { "epoch": 6.17395029991431, "grad_norm": 0.5458160886088905, "learning_rate": 1.6764121063430882e-06, "loss": 0.1354, "loss_nan_ranks": 0, "loss_rank_avg": 0.06598511338233948, "step": 7205, "valid_targets_mean": 6574.4, "valid_targets_min": 1931 }, { "epoch": 6.1782347900599826, "grad_norm": 0.5511129685150017, "learning_rate": 1.659328654981356e-06, "loss": 0.1365, "loss_nan_ranks": 0, "loss_rank_avg": 0.06158352270722389, "step": 7210, "valid_targets_mean": 6243.9, "valid_targets_min": 4428 }, { "epoch": 6.182519280205655, "grad_norm": 0.5721224946813679, "learning_rate": 1.642328926434349e-06, "loss": 0.1266, "loss_nan_ranks": 0, "loss_rank_avg": 0.052804622799158096, "step": 7215, "valid_targets_mean": 4807.4, "valid_targets_min": 2000 }, { "epoch": 6.186803770351328, "grad_norm": 0.5187633332938161, "learning_rate": 1.6254129983036504e-06, "loss": 0.1288, "loss_nan_ranks": 0, "loss_rank_avg": 0.06331296265125275, "step": 7220, "valid_targets_mean": 5979.9, "valid_targets_min": 3483 }, { "epoch": 6.191088260497001, "grad_norm": 0.5538859237064832, "learning_rate": 1.6085809478083025e-06, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.08845791220664978, "step": 7225, "valid_targets_mean": 4928.2, "valid_targets_min": 1834 }, { "epoch": 6.195372750642673, "grad_norm": 0.5971124365145998, "learning_rate": 1.5918328517844628e-06, "loss": 0.1367, "loss_nan_ranks": 0, "loss_rank_avg": 0.0702032819390297, "step": 7230, "valid_targets_mean": 4869.4, "valid_targets_min": 1197 }, { "epoch": 6.199657240788346, "grad_norm": 0.5376800060207101, "learning_rate": 1.5751687866850396e-06, "loss": 0.1383, "loss_nan_ranks": 0, "loss_rank_avg": 0.04543754830956459, "step": 7235, "valid_targets_mean": 5223.5, "valid_targets_min": 1531 }, { "epoch": 6.203941730934019, "grad_norm": 0.52362958791206, "learning_rate": 1.5585888285793616e-06, "loss": 0.1195, "loss_nan_ranks": 0, "loss_rank_avg": 0.056802961975336075, "step": 7240, "valid_targets_mean": 5973.1, "valid_targets_min": 4700 }, { "epoch": 6.208226221079691, "grad_norm": 0.5787165339346138, "learning_rate": 1.542093053152809e-06, "loss": 0.1362, "loss_nan_ranks": 0, "loss_rank_avg": 0.06048420071601868, "step": 7245, "valid_targets_mean": 5055.2, "valid_targets_min": 2931 }, { "epoch": 6.212510711225364, "grad_norm": 0.522957992600429, "learning_rate": 1.5256815357064825e-06, "loss": 0.1277, "loss_nan_ranks": 0, "loss_rank_avg": 0.04589177295565605, "step": 7250, "valid_targets_mean": 5997.5, "valid_targets_min": 3531 }, { "epoch": 6.216795201371037, "grad_norm": 0.5811695311496623, "learning_rate": 1.5093543511568531e-06, "loss": 0.1271, "loss_nan_ranks": 0, "loss_rank_avg": 0.054738134145736694, "step": 7255, "valid_targets_mean": 4873.9, "valid_targets_min": 2125 }, { "epoch": 6.221079691516709, "grad_norm": 0.5878951744890861, "learning_rate": 1.4931115740354352e-06, "loss": 0.1428, "loss_nan_ranks": 0, "loss_rank_avg": 0.0675361156463623, "step": 7260, "valid_targets_mean": 5341.0, "valid_targets_min": 2498 }, { "epoch": 6.225364181662382, "grad_norm": 0.5239516616418894, "learning_rate": 1.4769532784884199e-06, "loss": 0.1266, "loss_nan_ranks": 0, "loss_rank_avg": 0.054139237850904465, "step": 7265, "valid_targets_mean": 6078.6, "valid_targets_min": 505 }, { "epoch": 6.229648671808055, "grad_norm": 0.6125674704012837, "learning_rate": 1.4608795382763519e-06, "loss": 0.1384, "loss_nan_ranks": 0, "loss_rank_avg": 0.09281733632087708, "step": 7270, "valid_targets_mean": 3341.8, "valid_targets_min": 1937 }, { "epoch": 6.233933161953727, "grad_norm": 0.5802810544979863, "learning_rate": 1.4448904267738062e-06, "loss": 0.1419, "loss_nan_ranks": 0, "loss_rank_avg": 0.05857785418629646, "step": 7275, "valid_targets_mean": 4161.6, "valid_targets_min": 1381 }, { "epoch": 6.2382176520994, "grad_norm": 0.6228348827694725, "learning_rate": 1.4289860169690206e-06, "loss": 0.1334, "loss_nan_ranks": 0, "loss_rank_avg": 0.06603018939495087, "step": 7280, "valid_targets_mean": 3769.4, "valid_targets_min": 1893 }, { "epoch": 6.242502142245073, "grad_norm": 0.5606682274420252, "learning_rate": 1.4131663814635888e-06, "loss": 0.1367, "loss_nan_ranks": 0, "loss_rank_avg": 0.07488321512937546, "step": 7285, "valid_targets_mean": 4953.9, "valid_targets_min": 3753 }, { "epoch": 6.246786632390745, "grad_norm": 0.5681033905864885, "learning_rate": 1.3974315924721182e-06, "loss": 0.1335, "loss_nan_ranks": 0, "loss_rank_avg": 0.054232463240623474, "step": 7290, "valid_targets_mean": 4851.4, "valid_targets_min": 2171 }, { "epoch": 6.251071122536418, "grad_norm": 0.5528862655721212, "learning_rate": 1.381781721821911e-06, "loss": 0.1243, "loss_nan_ranks": 0, "loss_rank_avg": 0.0710495263338089, "step": 7295, "valid_targets_mean": 5688.9, "valid_targets_min": 4264 }, { "epoch": 6.255355612682091, "grad_norm": 0.5967193988030114, "learning_rate": 1.3662168409526167e-06, "loss": 0.1256, "loss_nan_ranks": 0, "loss_rank_avg": 0.11634612828493118, "step": 7300, "valid_targets_mean": 6235.5, "valid_targets_min": 2655 }, { "epoch": 6.259640102827763, "grad_norm": 0.5821630227786284, "learning_rate": 1.350737020915922e-06, "loss": 0.139, "loss_nan_ranks": 0, "loss_rank_avg": 0.052662041038274765, "step": 7305, "valid_targets_mean": 4289.1, "valid_targets_min": 1202 }, { "epoch": 6.263924592973436, "grad_norm": 0.6765553432922821, "learning_rate": 1.3353423323752246e-06, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.09214189648628235, "step": 7310, "valid_targets_mean": 4074.9, "valid_targets_min": 2281 }, { "epoch": 6.268209083119109, "grad_norm": 0.5044662591051317, "learning_rate": 1.3200328456053036e-06, "loss": 0.1136, "loss_nan_ranks": 0, "loss_rank_avg": 0.04478124529123306, "step": 7315, "valid_targets_mean": 6636.9, "valid_targets_min": 3794 }, { "epoch": 6.272493573264781, "grad_norm": 0.566414312062377, "learning_rate": 1.3048086304920026e-06, "loss": 0.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.06308507919311523, "step": 7320, "valid_targets_mean": 5068.5, "valid_targets_min": 1538 }, { "epoch": 6.276778063410454, "grad_norm": 0.6515762665691374, "learning_rate": 1.289669756531917e-06, "loss": 0.1269, "loss_nan_ranks": 0, "loss_rank_avg": 0.0729881301522255, "step": 7325, "valid_targets_mean": 4246.6, "valid_targets_min": 1436 }, { "epoch": 6.281062553556127, "grad_norm": 0.5517482213898717, "learning_rate": 1.2746162928320649e-06, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.08301884680986404, "step": 7330, "valid_targets_mean": 5955.0, "valid_targets_min": 1822 }, { "epoch": 6.285347043701799, "grad_norm": 0.5523007068091895, "learning_rate": 1.2596483081095778e-06, "loss": 0.1229, "loss_nan_ranks": 0, "loss_rank_avg": 0.06908877938985825, "step": 7335, "valid_targets_mean": 5983.0, "valid_targets_min": 3720 }, { "epoch": 6.289631533847472, "grad_norm": 0.5601682429843172, "learning_rate": 1.2447658706913868e-06, "loss": 0.1297, "loss_nan_ranks": 0, "loss_rank_avg": 0.05858379602432251, "step": 7340, "valid_targets_mean": 5157.9, "valid_targets_min": 1599 }, { "epoch": 6.293916023993145, "grad_norm": 0.5981781004239811, "learning_rate": 1.2299690485139193e-06, "loss": 0.138, "loss_nan_ranks": 0, "loss_rank_avg": 0.07124894857406616, "step": 7345, "valid_targets_mean": 4882.2, "valid_targets_min": 2014 }, { "epoch": 6.298200514138817, "grad_norm": 0.5628953258224636, "learning_rate": 1.2152579091227668e-06, "loss": 0.1378, "loss_nan_ranks": 0, "loss_rank_avg": 0.07427423447370529, "step": 7350, "valid_targets_mean": 5157.0, "valid_targets_min": 2189 }, { "epoch": 6.30248500428449, "grad_norm": 0.5264402145565338, "learning_rate": 1.2006325196723933e-06, "loss": 0.1407, "loss_nan_ranks": 0, "loss_rank_avg": 0.06821203231811523, "step": 7355, "valid_targets_mean": 5412.6, "valid_targets_min": 1866 }, { "epoch": 6.306769494430163, "grad_norm": 0.5815500627748932, "learning_rate": 1.1860929469258341e-06, "loss": 0.1269, "loss_nan_ranks": 0, "loss_rank_avg": 0.052492864429950714, "step": 7360, "valid_targets_mean": 4367.4, "valid_targets_min": 512 }, { "epoch": 6.311053984575835, "grad_norm": 0.5825385511943423, "learning_rate": 1.1716392572543732e-06, "loss": 0.1382, "loss_nan_ranks": 0, "loss_rank_avg": 0.07757897675037384, "step": 7365, "valid_targets_mean": 5754.5, "valid_targets_min": 4385 }, { "epoch": 6.315338474721508, "grad_norm": 0.6110286527146042, "learning_rate": 1.1572715166372506e-06, "loss": 0.1323, "loss_nan_ranks": 0, "loss_rank_avg": 0.06084147468209267, "step": 7370, "valid_targets_mean": 3635.0, "valid_targets_min": 1439 }, { "epoch": 6.319622964867181, "grad_norm": 0.5483459534045897, "learning_rate": 1.1429897906613596e-06, "loss": 0.1416, "loss_nan_ranks": 0, "loss_rank_avg": 0.050404250621795654, "step": 7375, "valid_targets_mean": 4962.5, "valid_targets_min": 1736 }, { "epoch": 6.323907455012853, "grad_norm": 0.5642870717751584, "learning_rate": 1.128794144520955e-06, "loss": 0.1265, "loss_nan_ranks": 0, "loss_rank_avg": 0.05563634634017944, "step": 7380, "valid_targets_mean": 4469.4, "valid_targets_min": 1883 }, { "epoch": 6.328191945158526, "grad_norm": 0.5588183190716616, "learning_rate": 1.1146846430173385e-06, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.08249536901712418, "step": 7385, "valid_targets_mean": 5998.8, "valid_targets_min": 2795 }, { "epoch": 6.332476435304199, "grad_norm": 0.5731674436370081, "learning_rate": 1.1006613505585783e-06, "loss": 0.1345, "loss_nan_ranks": 0, "loss_rank_avg": 0.06888927519321442, "step": 7390, "valid_targets_mean": 4352.9, "valid_targets_min": 1884 }, { "epoch": 6.336760925449871, "grad_norm": 0.5123918560667162, "learning_rate": 1.0867243311592079e-06, "loss": 0.1336, "loss_nan_ranks": 0, "loss_rank_avg": 0.05763709917664528, "step": 7395, "valid_targets_mean": 6003.0, "valid_targets_min": 2829 }, { "epoch": 6.341045415595544, "grad_norm": 0.5100597503907828, "learning_rate": 1.072873648439936e-06, "loss": 0.1375, "loss_nan_ranks": 0, "loss_rank_avg": 0.05623047798871994, "step": 7400, "valid_targets_mean": 5028.2, "valid_targets_min": 2742 }, { "epoch": 6.345329905741217, "grad_norm": 0.5811807929396194, "learning_rate": 1.059109365627351e-06, "loss": 0.1332, "loss_nan_ranks": 0, "loss_rank_avg": 0.07150489836931229, "step": 7405, "valid_targets_mean": 5120.2, "valid_targets_min": 3356 }, { "epoch": 6.349614395886889, "grad_norm": 0.4895410328153705, "learning_rate": 1.0454315455536436e-06, "loss": 0.1159, "loss_nan_ranks": 0, "loss_rank_avg": 0.05738158896565437, "step": 7410, "valid_targets_mean": 5229.6, "valid_targets_min": 2671 }, { "epoch": 6.353898886032562, "grad_norm": 0.5404284191963216, "learning_rate": 1.0318402506563062e-06, "loss": 0.1253, "loss_nan_ranks": 0, "loss_rank_avg": 0.0597027949988842, "step": 7415, "valid_targets_mean": 5363.9, "valid_targets_min": 1530 }, { "epoch": 6.358183376178235, "grad_norm": 0.5501116303269473, "learning_rate": 1.0183355429778595e-06, "loss": 0.1313, "loss_nan_ranks": 0, "loss_rank_avg": 0.06805878132581711, "step": 7420, "valid_targets_mean": 5213.6, "valid_targets_min": 3005 }, { "epoch": 6.362467866323907, "grad_norm": 0.5576493461479655, "learning_rate": 1.0049174841655685e-06, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.07751034200191498, "step": 7425, "valid_targets_mean": 5268.6, "valid_targets_min": 3439 }, { "epoch": 6.36675235646958, "grad_norm": 0.5548633392053545, "learning_rate": 9.915861354711498e-07, "loss": 0.1399, "loss_nan_ranks": 0, "loss_rank_avg": 0.07571675628423691, "step": 7430, "valid_targets_mean": 6207.0, "valid_targets_min": 1883 }, { "epoch": 6.371036846615253, "grad_norm": 0.526980009994755, "learning_rate": 9.783415577505018e-07, "loss": 0.134, "loss_nan_ranks": 0, "loss_rank_avg": 0.053638383746147156, "step": 7435, "valid_targets_mean": 6888.4, "valid_targets_min": 4719 }, { "epoch": 6.375321336760925, "grad_norm": 0.5729456153802657, "learning_rate": 9.651838114634216e-07, "loss": 0.1249, "loss_nan_ranks": 0, "loss_rank_avg": 0.06362077593803406, "step": 7440, "valid_targets_mean": 4871.2, "valid_targets_min": 1490 }, { "epoch": 6.379605826906598, "grad_norm": 0.5184410617626088, "learning_rate": 9.521129566733389e-07, "loss": 0.117, "loss_nan_ranks": 0, "loss_rank_avg": 0.06541168689727783, "step": 7445, "valid_targets_mean": 5580.0, "valid_targets_min": 3229 }, { "epoch": 6.383890317052271, "grad_norm": 0.6255470828970859, "learning_rate": 9.391290530470277e-07, "loss": 0.1332, "loss_nan_ranks": 0, "loss_rank_avg": 0.07521027326583862, "step": 7450, "valid_targets_mean": 5401.9, "valid_targets_min": 1524 }, { "epoch": 6.388174807197943, "grad_norm": 0.5194885483403754, "learning_rate": 9.2623215985435e-07, "loss": 0.1269, "loss_nan_ranks": 0, "loss_rank_avg": 0.09347446262836456, "step": 7455, "valid_targets_mean": 5763.8, "valid_targets_min": 1737 }, { "epoch": 6.392459297343616, "grad_norm": 0.5600928570709444, "learning_rate": 9.134223359679683e-07, "loss": 0.1305, "loss_nan_ranks": 0, "loss_rank_avg": 0.06300924718379974, "step": 7460, "valid_targets_mean": 4393.2, "valid_targets_min": 2933 }, { "epoch": 6.396743787489289, "grad_norm": 0.5369824063885026, "learning_rate": 9.006996398630851e-07, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.0863390564918518, "step": 7465, "valid_targets_mean": 6428.6, "valid_targets_min": 2124 }, { "epoch": 6.401028277634961, "grad_norm": 0.5773689496250954, "learning_rate": 8.88064129617181e-07, "loss": 0.1394, "loss_nan_ranks": 0, "loss_rank_avg": 0.05433430150151253, "step": 7470, "valid_targets_mean": 5142.5, "valid_targets_min": 2347 }, { "epoch": 6.405312767780634, "grad_norm": 0.5256807129221563, "learning_rate": 8.755158629097393e-07, "loss": 0.1281, "loss_nan_ranks": 0, "loss_rank_avg": 0.07254520058631897, "step": 7475, "valid_targets_mean": 6583.0, "valid_targets_min": 3019 }, { "epoch": 6.409597257926307, "grad_norm": 0.5655039871931183, "learning_rate": 8.630548970219888e-07, "loss": 0.1327, "loss_nan_ranks": 0, "loss_rank_avg": 0.08246055990457535, "step": 7480, "valid_targets_mean": 7249.6, "valid_targets_min": 3680 }, { "epoch": 6.413881748071979, "grad_norm": 0.5463016827169638, "learning_rate": 8.506812888366412e-07, "loss": 0.1291, "loss_nan_ranks": 0, "loss_rank_avg": 0.059731028974056244, "step": 7485, "valid_targets_mean": 5100.2, "valid_targets_min": 2494 }, { "epoch": 6.418166238217652, "grad_norm": 0.5832410787055895, "learning_rate": 8.383950948376385e-07, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.09012992680072784, "step": 7490, "valid_targets_mean": 4581.4, "valid_targets_min": 1210 }, { "epoch": 6.422450728363325, "grad_norm": 0.5373271133685443, "learning_rate": 8.261963711098798e-07, "loss": 0.1163, "loss_nan_ranks": 0, "loss_rank_avg": 0.05034567415714264, "step": 7495, "valid_targets_mean": 5593.4, "valid_targets_min": 3512 }, { "epoch": 6.426735218508997, "grad_norm": 0.49924700407085665, "learning_rate": 8.140851733389743e-07, "loss": 0.1332, "loss_nan_ranks": 0, "loss_rank_avg": 0.05929369851946831, "step": 7500, "valid_targets_mean": 5676.0, "valid_targets_min": 3019 }, { "epoch": 6.43101970865467, "grad_norm": 0.5566287946269606, "learning_rate": 8.020615568109868e-07, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.07680325210094452, "step": 7505, "valid_targets_mean": 4787.9, "valid_targets_min": 3468 }, { "epoch": 6.435304198800343, "grad_norm": 0.5718185055108692, "learning_rate": 7.901255764121862e-07, "loss": 0.1159, "loss_nan_ranks": 0, "loss_rank_avg": 0.049524642527103424, "step": 7510, "valid_targets_mean": 5347.8, "valid_targets_min": 2413 }, { "epoch": 6.439588688946015, "grad_norm": 0.5617952603517002, "learning_rate": 7.782772866287968e-07, "loss": 0.1312, "loss_nan_ranks": 0, "loss_rank_avg": 0.07754452526569366, "step": 7515, "valid_targets_mean": 4205.2, "valid_targets_min": 746 }, { "epoch": 6.443873179091688, "grad_norm": 0.5382909893432877, "learning_rate": 7.66516741546739e-07, "loss": 0.1203, "loss_nan_ranks": 0, "loss_rank_avg": 0.06745108962059021, "step": 7520, "valid_targets_mean": 5163.9, "valid_targets_min": 3205 }, { "epoch": 6.448157669237361, "grad_norm": 0.6324837900871627, "learning_rate": 7.548439948514019e-07, "loss": 0.1268, "loss_nan_ranks": 0, "loss_rank_avg": 0.09697423875331879, "step": 7525, "valid_targets_mean": 5868.6, "valid_targets_min": 2030 }, { "epoch": 6.4524421593830334, "grad_norm": 0.6297388208752188, "learning_rate": 7.432590998273714e-07, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.05477753281593323, "step": 7530, "valid_targets_mean": 4286.4, "valid_targets_min": 484 }, { "epoch": 6.456726649528706, "grad_norm": 0.6145786549613212, "learning_rate": 7.317621093582117e-07, "loss": 0.1334, "loss_nan_ranks": 0, "loss_rank_avg": 0.07500009983778, "step": 7535, "valid_targets_mean": 3922.9, "valid_targets_min": 977 }, { "epoch": 6.461011139674379, "grad_norm": 0.5521848259032168, "learning_rate": 7.2035307592621e-07, "loss": 0.1234, "loss_nan_ranks": 0, "loss_rank_avg": 0.06406620144844055, "step": 7540, "valid_targets_mean": 4464.2, "valid_targets_min": 1828 }, { "epoch": 6.4652956298200515, "grad_norm": 0.5833023790742793, "learning_rate": 7.090320516121418e-07, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.06913968175649643, "step": 7545, "valid_targets_mean": 5600.9, "valid_targets_min": 1182 }, { "epoch": 6.469580119965724, "grad_norm": 0.6100203970157438, "learning_rate": 6.977990880950348e-07, "loss": 0.1265, "loss_nan_ranks": 0, "loss_rank_avg": 0.06103619933128357, "step": 7550, "valid_targets_mean": 4139.6, "valid_targets_min": 1295 }, { "epoch": 6.473864610111397, "grad_norm": 0.5633400073336338, "learning_rate": 6.866542366519247e-07, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.06431341916322708, "step": 7555, "valid_targets_mean": 5054.8, "valid_targets_min": 2696 }, { "epoch": 6.4781491002570695, "grad_norm": 0.6041224027325699, "learning_rate": 6.755975481576338e-07, "loss": 0.1346, "loss_nan_ranks": 0, "loss_rank_avg": 0.0816982090473175, "step": 7560, "valid_targets_mean": 4527.1, "valid_targets_min": 1576 }, { "epoch": 6.482433590402742, "grad_norm": 0.5881212273674449, "learning_rate": 6.646290730845285e-07, "loss": 0.1303, "loss_nan_ranks": 0, "loss_rank_avg": 0.07361535727977753, "step": 7565, "valid_targets_mean": 5084.4, "valid_targets_min": 2417 }, { "epoch": 6.486718080548415, "grad_norm": 0.6028451231337074, "learning_rate": 6.537488615022902e-07, "loss": 0.1324, "loss_nan_ranks": 0, "loss_rank_avg": 0.06748676300048828, "step": 7570, "valid_targets_mean": 4147.8, "valid_targets_min": 2788 }, { "epoch": 6.4910025706940875, "grad_norm": 0.6049291595728633, "learning_rate": 6.429569630776899e-07, "loss": 0.1281, "loss_nan_ranks": 0, "loss_rank_avg": 0.07137708365917206, "step": 7575, "valid_targets_mean": 6559.4, "valid_targets_min": 3194 }, { "epoch": 6.49528706083976, "grad_norm": 0.5724152711580965, "learning_rate": 6.322534270743653e-07, "loss": 0.1409, "loss_nan_ranks": 0, "loss_rank_avg": 0.04908524081110954, "step": 7580, "valid_targets_mean": 5618.8, "valid_targets_min": 2020 }, { "epoch": 6.499571550985433, "grad_norm": 0.5284775742025518, "learning_rate": 6.216383023525829e-07, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.06110971421003342, "step": 7585, "valid_targets_mean": 6379.1, "valid_targets_min": 3952 }, { "epoch": 6.5038560411311055, "grad_norm": 0.5412105324257526, "learning_rate": 6.111116373690262e-07, "loss": 0.1302, "loss_nan_ranks": 0, "loss_rank_avg": 0.06972099840641022, "step": 7590, "valid_targets_mean": 5871.4, "valid_targets_min": 2694 }, { "epoch": 6.508140531276778, "grad_norm": 0.5803291024390985, "learning_rate": 6.006734801765746e-07, "loss": 0.1218, "loss_nan_ranks": 0, "loss_rank_avg": 0.05369029939174652, "step": 7595, "valid_targets_mean": 4633.1, "valid_targets_min": 571 }, { "epoch": 6.512425021422451, "grad_norm": 0.5703864930855584, "learning_rate": 5.903238784240794e-07, "loss": 0.1373, "loss_nan_ranks": 0, "loss_rank_avg": 0.07159294188022614, "step": 7600, "valid_targets_mean": 5685.8, "valid_targets_min": 3429 }, { "epoch": 6.5167095115681235, "grad_norm": 0.5489229421473321, "learning_rate": 5.800628793561447e-07, "loss": 0.1196, "loss_nan_ranks": 0, "loss_rank_avg": 0.06936562061309814, "step": 7605, "valid_targets_mean": 5826.9, "valid_targets_min": 3011 }, { "epoch": 6.520994001713796, "grad_norm": 0.5421183921246827, "learning_rate": 5.698905298129154e-07, "loss": 0.122, "loss_nan_ranks": 0, "loss_rank_avg": 0.07958382368087769, "step": 7610, "valid_targets_mean": 6062.5, "valid_targets_min": 3845 }, { "epoch": 6.525278491859469, "grad_norm": 0.5649633947170538, "learning_rate": 5.598068762298647e-07, "loss": 0.1366, "loss_nan_ranks": 0, "loss_rank_avg": 0.06852822005748749, "step": 7615, "valid_targets_mean": 5788.6, "valid_targets_min": 1353 }, { "epoch": 6.5295629820051415, "grad_norm": 0.5844565816018681, "learning_rate": 5.49811964637581e-07, "loss": 0.1385, "loss_nan_ranks": 0, "loss_rank_avg": 0.07468803226947784, "step": 7620, "valid_targets_mean": 4700.9, "valid_targets_min": 2566 }, { "epoch": 6.533847472150814, "grad_norm": 0.5759158172395592, "learning_rate": 5.399058406615498e-07, "loss": 0.1364, "loss_nan_ranks": 0, "loss_rank_avg": 0.09095199406147003, "step": 7625, "valid_targets_mean": 4950.9, "valid_targets_min": 2768 }, { "epoch": 6.538131962296487, "grad_norm": 0.6098207410965979, "learning_rate": 5.300885495219654e-07, "loss": 0.1172, "loss_nan_ranks": 0, "loss_rank_avg": 0.07239219546318054, "step": 7630, "valid_targets_mean": 6228.8, "valid_targets_min": 2836 }, { "epoch": 6.5424164524421595, "grad_norm": 0.6448334666116833, "learning_rate": 5.203601360334998e-07, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.0904010683298111, "step": 7635, "valid_targets_mean": 4510.2, "valid_targets_min": 1861 }, { "epoch": 6.546700942587832, "grad_norm": 0.6303612947945207, "learning_rate": 5.107206446051138e-07, "loss": 0.1387, "loss_nan_ranks": 0, "loss_rank_avg": 0.07945692539215088, "step": 7640, "valid_targets_mean": 4986.5, "valid_targets_min": 1948 }, { "epoch": 6.550985432733505, "grad_norm": 0.6436318797393943, "learning_rate": 5.01170119239851e-07, "loss": 0.1278, "loss_nan_ranks": 0, "loss_rank_avg": 0.07079534232616425, "step": 7645, "valid_targets_mean": 4854.4, "valid_targets_min": 1728 }, { "epoch": 6.5552699228791775, "grad_norm": 0.5134784672643112, "learning_rate": 4.917086035346374e-07, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.05049274116754532, "step": 7650, "valid_targets_mean": 6183.4, "valid_targets_min": 3825 }, { "epoch": 6.55955441302485, "grad_norm": 0.5325514964818551, "learning_rate": 4.823361406800775e-07, "loss": 0.1288, "loss_nan_ranks": 0, "loss_rank_avg": 0.06300629675388336, "step": 7655, "valid_targets_mean": 5562.2, "valid_targets_min": 2461 }, { "epoch": 6.563838903170523, "grad_norm": 0.5355193257799574, "learning_rate": 4.7305277346026523e-07, "loss": 0.1205, "loss_nan_ranks": 0, "loss_rank_avg": 0.06088012084364891, "step": 7660, "valid_targets_mean": 6078.8, "valid_targets_min": 3357 }, { "epoch": 6.5681233933161955, "grad_norm": 0.5743674784749225, "learning_rate": 4.6385854425258225e-07, "loss": 0.1328, "loss_nan_ranks": 0, "loss_rank_avg": 0.06708808243274689, "step": 7665, "valid_targets_mean": 4031.1, "valid_targets_min": 2246 }, { "epoch": 6.572407883461868, "grad_norm": 0.48895775992421786, "learning_rate": 4.5475349502750675e-07, "loss": 0.1214, "loss_nan_ranks": 0, "loss_rank_avg": 0.04776772856712341, "step": 7670, "valid_targets_mean": 5182.9, "valid_targets_min": 2608 }, { "epoch": 6.576692373607541, "grad_norm": 0.5923442658960232, "learning_rate": 4.457376673484204e-07, "loss": 0.1274, "loss_nan_ranks": 0, "loss_rank_avg": 0.06151628866791725, "step": 7675, "valid_targets_mean": 4924.8, "valid_targets_min": 2762 }, { "epoch": 6.580976863753214, "grad_norm": 0.6082249406191534, "learning_rate": 4.3681110237142165e-07, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.06975458562374115, "step": 7680, "valid_targets_mean": 4497.1, "valid_targets_min": 1832 }, { "epoch": 6.585261353898886, "grad_norm": 0.5650799881285941, "learning_rate": 4.279738408451395e-07, "loss": 0.1496, "loss_nan_ranks": 0, "loss_rank_avg": 0.06257934868335724, "step": 7685, "valid_targets_mean": 4092.9, "valid_targets_min": 904 }, { "epoch": 6.589545844044559, "grad_norm": 0.655822224913595, "learning_rate": 4.1922592311053776e-07, "loss": 0.1273, "loss_nan_ranks": 0, "loss_rank_avg": 0.06709827482700348, "step": 7690, "valid_targets_mean": 5060.4, "valid_targets_min": 1415 }, { "epoch": 6.593830334190232, "grad_norm": 0.5030085090665306, "learning_rate": 4.105673891007378e-07, "loss": 0.1216, "loss_nan_ranks": 0, "loss_rank_avg": 0.049611542373895645, "step": 7695, "valid_targets_mean": 6162.4, "valid_targets_min": 2679 }, { "epoch": 6.598114824335904, "grad_norm": 0.6102081049129495, "learning_rate": 4.0199827834084047e-07, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.09663502871990204, "step": 7700, "valid_targets_mean": 4532.8, "valid_targets_min": 2484 }, { "epoch": 6.602399314481577, "grad_norm": 0.5895159499997753, "learning_rate": 3.9351862994774e-07, "loss": 0.1126, "loss_nan_ranks": 0, "loss_rank_avg": 0.07301288843154907, "step": 7705, "valid_targets_mean": 4698.4, "valid_targets_min": 1504 }, { "epoch": 6.60668380462725, "grad_norm": 0.5314397820314964, "learning_rate": 3.8512848262994175e-07, "loss": 0.1278, "loss_nan_ranks": 0, "loss_rank_avg": 0.07113306224346161, "step": 7710, "valid_targets_mean": 5652.4, "valid_targets_min": 4421 }, { "epoch": 6.610968294772922, "grad_norm": 0.5677507631274338, "learning_rate": 3.7682787468739544e-07, "loss": 0.1345, "loss_nan_ranks": 0, "loss_rank_avg": 0.07104374468326569, "step": 7715, "valid_targets_mean": 4550.2, "valid_targets_min": 2510 }, { "epoch": 6.615252784918595, "grad_norm": 0.6096034474741296, "learning_rate": 3.6861684401131135e-07, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.09399035573005676, "step": 7720, "valid_targets_mean": 6537.1, "valid_targets_min": 3034 }, { "epoch": 6.619537275064268, "grad_norm": 0.5217524607050796, "learning_rate": 3.604954280839934e-07, "loss": 0.1228, "loss_nan_ranks": 0, "loss_rank_avg": 0.06967628002166748, "step": 7725, "valid_targets_mean": 5787.9, "valid_targets_min": 3968 }, { "epoch": 6.62382176520994, "grad_norm": 0.6152416458895353, "learning_rate": 3.524636639786616e-07, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.059186115860939026, "step": 7730, "valid_targets_mean": 4107.1, "valid_targets_min": 2620 }, { "epoch": 6.628106255355613, "grad_norm": 0.5668561641800082, "learning_rate": 3.445215883592945e-07, "loss": 0.1346, "loss_nan_ranks": 0, "loss_rank_avg": 0.0830339565873146, "step": 7735, "valid_targets_mean": 6530.4, "valid_targets_min": 2104 }, { "epoch": 6.632390745501286, "grad_norm": 0.6248303748819045, "learning_rate": 3.36669237480447e-07, "loss": 0.1382, "loss_nan_ranks": 0, "loss_rank_avg": 0.08806224167346954, "step": 7740, "valid_targets_mean": 5062.6, "valid_targets_min": 3322 }, { "epoch": 6.636675235646958, "grad_norm": 0.537812883564012, "learning_rate": 3.289066471870972e-07, "loss": 0.1432, "loss_nan_ranks": 0, "loss_rank_avg": 0.06440138071775436, "step": 7745, "valid_targets_mean": 6161.6, "valid_targets_min": 1091 }, { "epoch": 6.640959725792631, "grad_norm": 0.6367096859599471, "learning_rate": 3.2123385291447315e-07, "loss": 0.1396, "loss_nan_ranks": 0, "loss_rank_avg": 0.06297184526920319, "step": 7750, "valid_targets_mean": 5560.1, "valid_targets_min": 2408 }, { "epoch": 6.645244215938304, "grad_norm": 0.5174128452501829, "learning_rate": 3.136508896878976e-07, "loss": 0.1249, "loss_nan_ranks": 0, "loss_rank_avg": 0.046948693692684174, "step": 7755, "valid_targets_mean": 5429.2, "valid_targets_min": 2134 }, { "epoch": 6.649528706083976, "grad_norm": 0.5502673569976809, "learning_rate": 3.0615779212262773e-07, "loss": 0.1377, "loss_nan_ranks": 0, "loss_rank_avg": 0.054427504539489746, "step": 7760, "valid_targets_mean": 5898.8, "valid_targets_min": 1897 }, { "epoch": 6.653813196229649, "grad_norm": 0.5942641291785041, "learning_rate": 2.9875459442368915e-07, "loss": 0.1272, "loss_nan_ranks": 0, "loss_rank_avg": 0.06269437074661255, "step": 7765, "valid_targets_mean": 5309.4, "valid_targets_min": 3817 }, { "epoch": 6.658097686375322, "grad_norm": 0.5808692095958206, "learning_rate": 2.914413303857377e-07, "loss": 0.1389, "loss_nan_ranks": 0, "loss_rank_avg": 0.06568677723407745, "step": 7770, "valid_targets_mean": 4647.8, "valid_targets_min": 2544 }, { "epoch": 6.662382176520994, "grad_norm": 0.557804612223383, "learning_rate": 2.8421803339288236e-07, "loss": 0.1392, "loss_nan_ranks": 0, "loss_rank_avg": 0.06331031024456024, "step": 7775, "valid_targets_mean": 5791.6, "valid_targets_min": 3055 }, { "epoch": 6.666666666666667, "grad_norm": 0.5493010270576719, "learning_rate": 2.7708473641854917e-07, "loss": 0.1169, "loss_nan_ranks": 0, "loss_rank_avg": 0.05088922753930092, "step": 7780, "valid_targets_mean": 4945.6, "valid_targets_min": 1712 }, { "epoch": 6.67095115681234, "grad_norm": 0.538355272547983, "learning_rate": 2.7004147202532416e-07, "loss": 0.1355, "loss_nan_ranks": 0, "loss_rank_avg": 0.07455355674028397, "step": 7785, "valid_targets_mean": 5992.4, "valid_targets_min": 3400 }, { "epoch": 6.675235646958012, "grad_norm": 0.5608671946650889, "learning_rate": 2.630882723648087e-07, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.04839465022087097, "step": 7790, "valid_targets_mean": 4834.1, "valid_targets_min": 1084 }, { "epoch": 6.679520137103685, "grad_norm": 0.5725307968184742, "learning_rate": 2.5622516917746644e-07, "loss": 0.1424, "loss_nan_ranks": 0, "loss_rank_avg": 0.06177856773138046, "step": 7795, "valid_targets_mean": 4075.1, "valid_targets_min": 1885 }, { "epoch": 6.683804627249358, "grad_norm": 0.5668999443014117, "learning_rate": 2.494521937924854e-07, "loss": 0.1361, "loss_nan_ranks": 0, "loss_rank_avg": 0.07443411648273468, "step": 7800, "valid_targets_mean": 5455.5, "valid_targets_min": 3160 }, { "epoch": 6.68808911739503, "grad_norm": 0.5604181051156855, "learning_rate": 2.427693771276274e-07, "loss": 0.1218, "loss_nan_ranks": 0, "loss_rank_avg": 0.0571829155087471, "step": 7805, "valid_targets_mean": 5181.1, "valid_targets_min": 1670 }, { "epoch": 6.692373607540703, "grad_norm": 0.5947177144498428, "learning_rate": 2.3617674968909876e-07, "loss": 0.1339, "loss_nan_ranks": 0, "loss_rank_avg": 0.09753529727458954, "step": 7810, "valid_targets_mean": 4709.2, "valid_targets_min": 2501 }, { "epoch": 6.696658097686376, "grad_norm": 0.5618804740404388, "learning_rate": 2.2967434157139756e-07, "loss": 0.1118, "loss_nan_ranks": 0, "loss_rank_avg": 0.0628480538725853, "step": 7815, "valid_targets_mean": 4900.4, "valid_targets_min": 2355 }, { "epoch": 6.700942587832048, "grad_norm": 0.5927186775042097, "learning_rate": 2.2326218245718455e-07, "loss": 0.1358, "loss_nan_ranks": 0, "loss_rank_avg": 0.07199184596538544, "step": 7820, "valid_targets_mean": 4698.0, "valid_targets_min": 1902 }, { "epoch": 6.705227077977721, "grad_norm": 0.6156643349117058, "learning_rate": 2.1694030161714118e-07, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.055360130965709686, "step": 7825, "valid_targets_mean": 4293.8, "valid_targets_min": 1427 }, { "epoch": 6.709511568123394, "grad_norm": 0.6098212433325052, "learning_rate": 2.107087279098452e-07, "loss": 0.1353, "loss_nan_ranks": 0, "loss_rank_avg": 0.08166077733039856, "step": 7830, "valid_targets_mean": 5018.5, "valid_targets_min": 2294 }, { "epoch": 6.713796058269066, "grad_norm": 0.5356389161718971, "learning_rate": 2.0456748978163299e-07, "loss": 0.127, "loss_nan_ranks": 0, "loss_rank_avg": 0.05675205588340759, "step": 7835, "valid_targets_mean": 4544.2, "valid_targets_min": 2282 }, { "epoch": 6.718080548414739, "grad_norm": 0.5858343176283142, "learning_rate": 1.9851661526646638e-07, "loss": 0.1318, "loss_nan_ranks": 0, "loss_rank_avg": 0.08815167844295502, "step": 7840, "valid_targets_mean": 4550.6, "valid_targets_min": 2884 }, { "epoch": 6.722365038560412, "grad_norm": 0.5595700704199968, "learning_rate": 1.9255613198581934e-07, "loss": 0.1318, "loss_nan_ranks": 0, "loss_rank_avg": 0.060909878462553024, "step": 7845, "valid_targets_mean": 5540.4, "valid_targets_min": 2807 }, { "epoch": 6.726649528706084, "grad_norm": 0.5191269758152909, "learning_rate": 1.866860671485271e-07, "loss": 0.1229, "loss_nan_ranks": 0, "loss_rank_avg": 0.06576729565858841, "step": 7850, "valid_targets_mean": 5806.9, "valid_targets_min": 2533 }, { "epoch": 6.730934018851757, "grad_norm": 0.5758310377261832, "learning_rate": 1.809064475506883e-07, "loss": 0.1265, "loss_nan_ranks": 0, "loss_rank_avg": 0.07471377402544022, "step": 7855, "valid_targets_mean": 5287.5, "valid_targets_min": 2978 }, { "epoch": 6.73521850899743, "grad_norm": 0.5278397932305886, "learning_rate": 1.7521729957552302e-07, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.06098167225718498, "step": 7860, "valid_targets_mean": 5044.8, "valid_targets_min": 2857 }, { "epoch": 6.739502999143102, "grad_norm": 0.5395419129018436, "learning_rate": 1.6961864919326166e-07, "loss": 0.1412, "loss_nan_ranks": 0, "loss_rank_avg": 0.05927133187651634, "step": 7865, "valid_targets_mean": 5738.5, "valid_targets_min": 2026 }, { "epoch": 6.743787489288774, "grad_norm": 0.5304905943053638, "learning_rate": 1.641105219610295e-07, "loss": 0.1284, "loss_nan_ranks": 0, "loss_rank_avg": 0.07619032263755798, "step": 7870, "valid_targets_mean": 6232.8, "valid_targets_min": 2850 }, { "epoch": 6.748071979434448, "grad_norm": 0.5553095352748566, "learning_rate": 1.586929430227202e-07, "loss": 0.1322, "loss_nan_ranks": 0, "loss_rank_avg": 0.06535205990076065, "step": 7875, "valid_targets_mean": 4887.5, "valid_targets_min": 1439 }, { "epoch": 6.7523564695801195, "grad_norm": 0.5534113588647671, "learning_rate": 1.5336593710888914e-07, "loss": 0.1276, "loss_nan_ranks": 0, "loss_rank_avg": 0.06758899241685867, "step": 7880, "valid_targets_mean": 4739.1, "valid_targets_min": 2091 }, { "epoch": 6.756640959725793, "grad_norm": 0.5601728067274346, "learning_rate": 1.4812952853663132e-07, "loss": 0.1251, "loss_nan_ranks": 0, "loss_rank_avg": 0.05526921898126602, "step": 7885, "valid_targets_mean": 3589.0, "valid_targets_min": 1466 }, { "epoch": 6.760925449871465, "grad_norm": 0.5724487101335303, "learning_rate": 1.4298374120948588e-07, "loss": 0.126, "loss_nan_ranks": 0, "loss_rank_avg": 0.07227601855993271, "step": 7890, "valid_targets_mean": 6033.5, "valid_targets_min": 1545 }, { "epoch": 6.765209940017138, "grad_norm": 0.5629625045477072, "learning_rate": 1.3792859861730955e-07, "loss": 0.1273, "loss_nan_ranks": 0, "loss_rank_avg": 0.06101224198937416, "step": 7895, "valid_targets_mean": 5031.9, "valid_targets_min": 2327 }, { "epoch": 6.76949443016281, "grad_norm": 0.5682786914829596, "learning_rate": 1.3296412383617896e-07, "loss": 0.1246, "loss_nan_ranks": 0, "loss_rank_avg": 0.06303523480892181, "step": 7900, "valid_targets_mean": 5499.0, "valid_targets_min": 3762 }, { "epoch": 6.773778920308484, "grad_norm": 0.53063945226954, "learning_rate": 1.2809033952829065e-07, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.06398984789848328, "step": 7905, "valid_targets_mean": 6115.8, "valid_targets_min": 3463 }, { "epoch": 6.7780634104541555, "grad_norm": 0.5683228046451378, "learning_rate": 1.2330726794184124e-07, "loss": 0.1296, "loss_nan_ranks": 0, "loss_rank_avg": 0.06533034145832062, "step": 7910, "valid_targets_mean": 4878.9, "valid_targets_min": 537 }, { "epoch": 6.782347900599829, "grad_norm": 0.6162313267351365, "learning_rate": 1.1861493091094078e-07, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.05130893737077713, "step": 7915, "valid_targets_mean": 3761.9, "valid_targets_min": 1588 }, { "epoch": 6.786632390745501, "grad_norm": 0.5364938112255343, "learning_rate": 1.1401334985550849e-07, "loss": 0.1333, "loss_nan_ranks": 0, "loss_rank_avg": 0.05069788917899132, "step": 7920, "valid_targets_mean": 4648.5, "valid_targets_min": 1284 }, { "epoch": 6.790916880891174, "grad_norm": 0.6759019110702623, "learning_rate": 1.0950254578117047e-07, "loss": 0.1393, "loss_nan_ranks": 0, "loss_rank_avg": 0.08072400093078613, "step": 7925, "valid_targets_mean": 4252.4, "valid_targets_min": 2091 }, { "epoch": 6.795201371036846, "grad_norm": 0.6010547033753089, "learning_rate": 1.0508253927916878e-07, "loss": 0.1215, "loss_nan_ranks": 0, "loss_rank_avg": 0.07396875321865082, "step": 7930, "valid_targets_mean": 4642.6, "valid_targets_min": 2359 }, { "epoch": 6.79948586118252, "grad_norm": 0.5306208560777944, "learning_rate": 1.0075335052626811e-07, "loss": 0.1277, "loss_nan_ranks": 0, "loss_rank_avg": 0.09541085362434387, "step": 7935, "valid_targets_mean": 4518.5, "valid_targets_min": 1451 }, { "epoch": 6.8037703513281915, "grad_norm": 0.5503742533160736, "learning_rate": 9.651499928465812e-08, "loss": 0.1182, "loss_nan_ranks": 0, "loss_rank_avg": 0.045133013278245926, "step": 7940, "valid_targets_mean": 5171.4, "valid_targets_min": 2204 }, { "epoch": 6.808054841473865, "grad_norm": 0.6369200662485703, "learning_rate": 9.23675049018713e-08, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.08669963479042053, "step": 7945, "valid_targets_mean": 5398.8, "valid_targets_min": 2923 }, { "epoch": 6.812339331619537, "grad_norm": 0.5797105544129365, "learning_rate": 8.831088631068962e-08, "loss": 0.1296, "loss_nan_ranks": 0, "loss_rank_avg": 0.08598867058753967, "step": 7950, "valid_targets_mean": 5427.9, "valid_targets_min": 1720 }, { "epoch": 6.81662382176521, "grad_norm": 0.5892362865899328, "learning_rate": 8.434516202905585e-08, "loss": 0.1138, "loss_nan_ranks": 0, "loss_rank_avg": 0.04355989396572113, "step": 7955, "valid_targets_mean": 4668.5, "valid_targets_min": 1787 }, { "epoch": 6.820908311910882, "grad_norm": 0.5259449130439358, "learning_rate": 8.047035015999127e-08, "loss": 0.1293, "loss_nan_ranks": 0, "loss_rank_avg": 0.062147438526153564, "step": 7960, "valid_targets_mean": 6266.0, "valid_targets_min": 3304 }, { "epoch": 6.825192802056556, "grad_norm": 0.5980788196035809, "learning_rate": 7.668646839151584e-08, "loss": 0.1342, "loss_nan_ranks": 0, "loss_rank_avg": 0.07914112508296967, "step": 7965, "valid_targets_mean": 4330.0, "valid_targets_min": 2088 }, { "epoch": 6.8294772922022275, "grad_norm": 0.5679019198989551, "learning_rate": 7.299353399656817e-08, "loss": 0.1343, "loss_nan_ranks": 0, "loss_rank_avg": 0.06378501653671265, "step": 7970, "valid_targets_mean": 5255.6, "valid_targets_min": 2568 }, { "epoch": 6.8337617823479, "grad_norm": 0.5466815453187154, "learning_rate": 6.939156383291679e-08, "loss": 0.1113, "loss_nan_ranks": 0, "loss_rank_avg": 0.0462757870554924, "step": 7975, "valid_targets_mean": 6509.4, "valid_targets_min": 2957 }, { "epoch": 6.838046272493573, "grad_norm": 0.5441314114108987, "learning_rate": 6.58805743430957e-08, "loss": 0.137, "loss_nan_ranks": 0, "loss_rank_avg": 0.07762189954519272, "step": 7980, "valid_targets_mean": 6555.9, "valid_targets_min": 1836 }, { "epoch": 6.842330762639246, "grad_norm": 0.50096448496228, "learning_rate": 6.246058155432444e-08, "loss": 0.1205, "loss_nan_ranks": 0, "loss_rank_avg": 0.04757378250360489, "step": 7985, "valid_targets_mean": 5298.4, "valid_targets_min": 1479 }, { "epoch": 6.846615252784918, "grad_norm": 0.4878422198549988, "learning_rate": 5.913160107842819e-08, "loss": 0.1132, "loss_nan_ranks": 0, "loss_rank_avg": 0.0475429967045784, "step": 7990, "valid_targets_mean": 5907.8, "valid_targets_min": 1951 }, { "epoch": 6.850899742930591, "grad_norm": 0.49936103592353775, "learning_rate": 5.5893648111777774e-08, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.0695628896355629, "step": 7995, "valid_targets_mean": 6045.9, "valid_targets_min": 3008 }, { "epoch": 6.855184233076264, "grad_norm": 0.5665138724150077, "learning_rate": 5.274673743521197e-08, "loss": 0.1142, "loss_nan_ranks": 0, "loss_rank_avg": 0.05693498253822327, "step": 8000, "valid_targets_mean": 4705.0, "valid_targets_min": 887 }, { "epoch": 6.859468723221936, "grad_norm": 0.5203110760122742, "learning_rate": 4.969088341397976e-08, "loss": 0.1291, "loss_nan_ranks": 0, "loss_rank_avg": 0.04779854789376259, "step": 8005, "valid_targets_mean": 4978.9, "valid_targets_min": 1267 }, { "epoch": 6.863753213367609, "grad_norm": 0.5627332408917793, "learning_rate": 4.6726099997655985e-08, "loss": 0.1203, "loss_nan_ranks": 0, "loss_rank_avg": 0.06360907107591629, "step": 8010, "valid_targets_mean": 4355.4, "valid_targets_min": 1548 }, { "epoch": 6.868037703513282, "grad_norm": 0.6210799134015753, "learning_rate": 4.385240072010355e-08, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.07875913381576538, "step": 8015, "valid_targets_mean": 5311.0, "valid_targets_min": 2297 }, { "epoch": 6.872322193658954, "grad_norm": 0.6250033404142441, "learning_rate": 4.1069798699389094e-08, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.06782643496990204, "step": 8020, "valid_targets_mean": 4566.6, "valid_targets_min": 2102 }, { "epoch": 6.876606683804627, "grad_norm": 0.5422644649871644, "learning_rate": 3.83783066377319e-08, "loss": 0.1243, "loss_nan_ranks": 0, "loss_rank_avg": 0.0571243017911911, "step": 8025, "valid_targets_mean": 4521.6, "valid_targets_min": 1140 }, { "epoch": 6.8808911739503, "grad_norm": 0.5636592346059632, "learning_rate": 3.5777936821450584e-08, "loss": 0.113, "loss_nan_ranks": 0, "loss_rank_avg": 0.07804582267999649, "step": 8030, "valid_targets_mean": 6277.8, "valid_targets_min": 2562 }, { "epoch": 6.885175664095972, "grad_norm": 0.5444328936008808, "learning_rate": 3.326870112090097e-08, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.060951389372348785, "step": 8035, "valid_targets_mean": 5473.1, "valid_targets_min": 2419 }, { "epoch": 6.889460154241645, "grad_norm": 0.5365253336459935, "learning_rate": 3.0850610990422745e-08, "loss": 0.1285, "loss_nan_ranks": 0, "loss_rank_avg": 0.06827065348625183, "step": 8040, "valid_targets_mean": 6299.4, "valid_targets_min": 3425 }, { "epoch": 6.893744644387318, "grad_norm": 0.5234285669194776, "learning_rate": 2.8523677468286216e-08, "loss": 0.1143, "loss_nan_ranks": 0, "loss_rank_avg": 0.051526255905628204, "step": 8045, "valid_targets_mean": 5121.8, "valid_targets_min": 3038 }, { "epoch": 6.89802913453299, "grad_norm": 0.6361279161031459, "learning_rate": 2.6287911176643422e-08, "loss": 0.1321, "loss_nan_ranks": 0, "loss_rank_avg": 0.07987803220748901, "step": 8050, "valid_targets_mean": 4748.1, "valid_targets_min": 1969 }, { "epoch": 6.902313624678663, "grad_norm": 0.5639544639534764, "learning_rate": 2.414332232148375e-08, "loss": 0.1341, "loss_nan_ranks": 0, "loss_rank_avg": 0.056079618632793427, "step": 8055, "valid_targets_mean": 3328.0, "valid_targets_min": 1312 }, { "epoch": 6.906598114824336, "grad_norm": 0.5270526838763586, "learning_rate": 2.2089920692578427e-08, "loss": 0.1377, "loss_nan_ranks": 0, "loss_rank_avg": 0.062460094690322876, "step": 8060, "valid_targets_mean": 6072.0, "valid_targets_min": 3614 }, { "epoch": 6.910882604970008, "grad_norm": 0.5623331773457231, "learning_rate": 2.0127715663442737e-08, "loss": 0.1054, "loss_nan_ranks": 0, "loss_rank_avg": 0.04031980037689209, "step": 8065, "valid_targets_mean": 4893.9, "valid_targets_min": 1076 }, { "epoch": 6.915167095115681, "grad_norm": 0.5722152732120999, "learning_rate": 1.8256716191293876e-08, "loss": 0.1319, "loss_nan_ranks": 0, "loss_rank_avg": 0.07477788627147675, "step": 8070, "valid_targets_mean": 4832.0, "valid_targets_min": 2439 }, { "epoch": 6.919451585261354, "grad_norm": 0.6020483180818025, "learning_rate": 1.647693081700208e-08, "loss": 0.1211, "loss_nan_ranks": 0, "loss_rank_avg": 0.04321936517953873, "step": 8075, "valid_targets_mean": 4835.4, "valid_targets_min": 1616 }, { "epoch": 6.923736075407026, "grad_norm": 0.5670456675857146, "learning_rate": 1.4788367665061753e-08, "loss": 0.1236, "loss_nan_ranks": 0, "loss_rank_avg": 0.07685419917106628, "step": 8080, "valid_targets_mean": 5860.4, "valid_targets_min": 2446 }, { "epoch": 6.928020565552699, "grad_norm": 0.4939827002011384, "learning_rate": 1.3191034443544859e-08, "loss": 0.1101, "loss_nan_ranks": 0, "loss_rank_avg": 0.049323923885822296, "step": 8085, "valid_targets_mean": 4900.1, "valid_targets_min": 3089 }, { "epoch": 6.932305055698372, "grad_norm": 0.5775169071638229, "learning_rate": 1.1684938444074256e-08, "loss": 0.1327, "loss_nan_ranks": 0, "loss_rank_avg": 0.0588383711874485, "step": 8090, "valid_targets_mean": 4254.9, "valid_targets_min": 2406 }, { "epoch": 6.936589545844044, "grad_norm": 0.5629445712235375, "learning_rate": 1.0270086541785961e-08, "loss": 0.1158, "loss_nan_ranks": 0, "loss_rank_avg": 0.0664314329624176, "step": 8095, "valid_targets_mean": 4874.4, "valid_targets_min": 1914 }, { "epoch": 6.940874035989717, "grad_norm": 0.5038614919165475, "learning_rate": 8.946485195295839e-09, "loss": 0.1226, "loss_nan_ranks": 0, "loss_rank_avg": 0.05850938707590103, "step": 8100, "valid_targets_mean": 6217.1, "valid_targets_min": 2366 }, { "epoch": 6.94515852613539, "grad_norm": 0.5841112429555259, "learning_rate": 7.714140446677399e-09, "loss": 0.1251, "loss_nan_ranks": 0, "loss_rank_avg": 0.06938346475362778, "step": 8105, "valid_targets_mean": 5006.5, "valid_targets_min": 1629 }, { "epoch": 6.949443016281062, "grad_norm": 0.5950489578435784, "learning_rate": 6.573057921421821e-09, "loss": 0.1265, "loss_nan_ranks": 0, "loss_rank_avg": 0.07542908191680908, "step": 8110, "valid_targets_mean": 4854.5, "valid_targets_min": 2653 }, { "epoch": 6.953727506426735, "grad_norm": 0.5433367260843878, "learning_rate": 5.523242828429087e-09, "loss": 0.1228, "loss_nan_ranks": 0, "loss_rank_avg": 0.05837767571210861, "step": 8115, "valid_targets_mean": 5498.1, "valid_targets_min": 3257 }, { "epoch": 6.958011996572408, "grad_norm": 0.5579267091216227, "learning_rate": 4.5646999599657795e-09, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.047898173332214355, "step": 8120, "valid_targets_mean": 3744.8, "valid_targets_min": 993 }, { "epoch": 6.96229648671808, "grad_norm": 0.5502801957973467, "learning_rate": 3.697433691662866e-09, "loss": 0.1208, "loss_nan_ranks": 0, "loss_rank_avg": 0.04671556502580643, "step": 8125, "valid_targets_mean": 5065.5, "valid_targets_min": 1893 }, { "epoch": 6.966580976863753, "grad_norm": 0.6715401391059547, "learning_rate": 2.9214479824757336e-09, "loss": 0.1338, "loss_nan_ranks": 0, "loss_rank_avg": 0.0737813264131546, "step": 8130, "valid_targets_mean": 3978.1, "valid_targets_min": 2252 }, { "epoch": 6.970865467009426, "grad_norm": 0.5572764767170948, "learning_rate": 2.236746374681964e-09, "loss": 0.1351, "loss_nan_ranks": 0, "loss_rank_avg": 0.06324169039726257, "step": 8135, "valid_targets_mean": 4121.8, "valid_targets_min": 767 }, { "epoch": 6.975149957155098, "grad_norm": 0.6214094452567607, "learning_rate": 1.6433319938569115e-09, "loss": 0.125, "loss_nan_ranks": 0, "loss_rank_avg": 0.07531341910362244, "step": 8140, "valid_targets_mean": 4792.2, "valid_targets_min": 2175 }, { "epoch": 6.979434447300771, "grad_norm": 0.5631333769607573, "learning_rate": 1.1412075488581587e-09, "loss": 0.1255, "loss_nan_ranks": 0, "loss_rank_avg": 0.06048138439655304, "step": 8145, "valid_targets_mean": 4735.9, "valid_targets_min": 1720 }, { "epoch": 6.983718937446444, "grad_norm": 0.5522652498654058, "learning_rate": 7.303753318232964e-10, "loss": 0.1232, "loss_nan_ranks": 0, "loss_rank_avg": 0.06047441065311432, "step": 8150, "valid_targets_mean": 4334.2, "valid_targets_min": 2076 }, { "epoch": 6.988003427592116, "grad_norm": 0.5623147954093044, "learning_rate": 4.1083721814549893e-10, "loss": 0.1172, "loss_nan_ranks": 0, "loss_rank_avg": 0.07241150736808777, "step": 8155, "valid_targets_mean": 5543.4, "valid_targets_min": 2466 }, { "epoch": 6.992287917737789, "grad_norm": 0.5989116648786725, "learning_rate": 1.8259466647574386e-10, "loss": 0.1335, "loss_nan_ranks": 0, "loss_rank_avg": 0.07918166369199753, "step": 8160, "valid_targets_mean": 4510.2, "valid_targets_min": 2247 }, { "epoch": 6.996572407883462, "grad_norm": 0.5320669172153315, "learning_rate": 4.564871871393095e-11, "loss": 0.1217, "loss_nan_ranks": 0, "loss_rank_avg": 0.056516826152801514, "step": 8165, "valid_targets_mean": 4857.2, "valid_targets_min": 621 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.07527446001768112, "step": 8169, "total_flos": 4.1481371263550095e+18, "train_loss": 0.012115523323082897, "train_runtime": 26384.5271, "train_samples_per_second": 4.953, "train_steps_per_second": 0.31, "valid_targets_mean": 4146.9, "valid_targets_min": 1674 } ], "logging_steps": 5, "max_steps": 8169, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 200, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 4.1481371263550095e+18, "train_batch_size": 1, "trial_name": null, "trial_params": null }