{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 7.0, "eval_steps": 500, "global_step": 6664, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.005252100840336135, "grad_norm": 12.87344450799192, "learning_rate": 2.39880059970015e-07, "loss": 0.7749, "loss_nan_ranks": 0, "loss_rank_avg": 0.7653565406799316, "step": 5, "valid_targets_mean": 2484.8, "valid_targets_min": 784 }, { "epoch": 0.01050420168067227, "grad_norm": 12.707723147793125, "learning_rate": 5.397301349325338e-07, "loss": 0.7606, "loss_nan_ranks": 0, "loss_rank_avg": 0.7621961236000061, "step": 10, "valid_targets_mean": 2830.7, "valid_targets_min": 635 }, { "epoch": 0.015756302521008403, "grad_norm": 11.204400117593265, "learning_rate": 8.395802098950526e-07, "loss": 0.7482, "loss_nan_ranks": 0, "loss_rank_avg": 0.7473458051681519, "step": 15, "valid_targets_mean": 3091.0, "valid_targets_min": 1146 }, { "epoch": 0.02100840336134454, "grad_norm": 9.688069489628813, "learning_rate": 1.1394302848575713e-06, "loss": 0.7466, "loss_nan_ranks": 0, "loss_rank_avg": 0.7422138452529907, "step": 20, "valid_targets_mean": 2413.2, "valid_targets_min": 689 }, { "epoch": 0.026260504201680673, "grad_norm": 7.62742888265603, "learning_rate": 1.43928035982009e-06, "loss": 0.7287, "loss_nan_ranks": 0, "loss_rank_avg": 0.7463569045066833, "step": 25, "valid_targets_mean": 2688.5, "valid_targets_min": 1011 }, { "epoch": 0.031512605042016806, "grad_norm": 5.508936794357446, "learning_rate": 1.7391304347826088e-06, "loss": 0.6518, "loss_nan_ranks": 0, "loss_rank_avg": 0.6350823640823364, "step": 30, "valid_targets_mean": 2500.6, "valid_targets_min": 819 }, { "epoch": 0.03676470588235294, "grad_norm": 4.810314643948938, "learning_rate": 2.0389805097451275e-06, "loss": 0.6558, "loss_nan_ranks": 0, "loss_rank_avg": 0.6311067938804626, "step": 35, "valid_targets_mean": 2686.3, "valid_targets_min": 893 }, { "epoch": 0.04201680672268908, "grad_norm": 4.8557060388176545, "learning_rate": 2.3388305847076464e-06, "loss": 0.6284, "loss_nan_ranks": 0, "loss_rank_avg": 0.6066815257072449, "step": 40, "valid_targets_mean": 2177.2, "valid_targets_min": 1080 }, { "epoch": 0.04726890756302521, "grad_norm": 2.9119019293559685, "learning_rate": 2.6386806596701653e-06, "loss": 0.6094, "loss_nan_ranks": 0, "loss_rank_avg": 0.6400288343429565, "step": 45, "valid_targets_mean": 2633.9, "valid_targets_min": 963 }, { "epoch": 0.052521008403361345, "grad_norm": 2.5325988257181504, "learning_rate": 2.9385307346326843e-06, "loss": 0.5741, "loss_nan_ranks": 0, "loss_rank_avg": 0.5878869891166687, "step": 50, "valid_targets_mean": 2203.5, "valid_targets_min": 627 }, { "epoch": 0.05777310924369748, "grad_norm": 1.6332369639610234, "learning_rate": 3.2383808095952024e-06, "loss": 0.5072, "loss_nan_ranks": 0, "loss_rank_avg": 0.49458950757980347, "step": 55, "valid_targets_mean": 3035.3, "valid_targets_min": 830 }, { "epoch": 0.06302521008403361, "grad_norm": 1.2034100946296309, "learning_rate": 3.5382308845577213e-06, "loss": 0.5137, "loss_nan_ranks": 0, "loss_rank_avg": 0.4873230755329132, "step": 60, "valid_targets_mean": 2940.2, "valid_targets_min": 1009 }, { "epoch": 0.06827731092436974, "grad_norm": 1.1067968813199072, "learning_rate": 3.83808095952024e-06, "loss": 0.511, "loss_nan_ranks": 0, "loss_rank_avg": 0.4636586606502533, "step": 65, "valid_targets_mean": 2532.8, "valid_targets_min": 824 }, { "epoch": 0.07352941176470588, "grad_norm": 1.2850520360535964, "learning_rate": 4.137931034482759e-06, "loss": 0.4961, "loss_nan_ranks": 0, "loss_rank_avg": 0.4967666566371918, "step": 70, "valid_targets_mean": 1951.5, "valid_targets_min": 726 }, { "epoch": 0.07878151260504201, "grad_norm": 0.8971762854941586, "learning_rate": 4.437781109445278e-06, "loss": 0.4949, "loss_nan_ranks": 0, "loss_rank_avg": 0.43605613708496094, "step": 75, "valid_targets_mean": 2723.1, "valid_targets_min": 733 }, { "epoch": 0.08403361344537816, "grad_norm": 0.9430146035301179, "learning_rate": 4.737631184407796e-06, "loss": 0.4615, "loss_nan_ranks": 0, "loss_rank_avg": 0.4186355173587799, "step": 80, "valid_targets_mean": 2138.4, "valid_targets_min": 619 }, { "epoch": 0.08928571428571429, "grad_norm": 0.9397684354473573, "learning_rate": 5.037481259370315e-06, "loss": 0.4629, "loss_nan_ranks": 0, "loss_rank_avg": 0.447378933429718, "step": 85, "valid_targets_mean": 2195.4, "valid_targets_min": 985 }, { "epoch": 0.09453781512605042, "grad_norm": 0.9254373058058498, "learning_rate": 5.337331334332834e-06, "loss": 0.4579, "loss_nan_ranks": 0, "loss_rank_avg": 0.44608554244041443, "step": 90, "valid_targets_mean": 2305.1, "valid_targets_min": 1115 }, { "epoch": 0.09978991596638656, "grad_norm": 0.8895449710201235, "learning_rate": 5.6371814092953526e-06, "loss": 0.4429, "loss_nan_ranks": 0, "loss_rank_avg": 0.4577831029891968, "step": 95, "valid_targets_mean": 2365.8, "valid_targets_min": 1000 }, { "epoch": 0.10504201680672269, "grad_norm": 0.8582249839693272, "learning_rate": 5.937031484257871e-06, "loss": 0.4524, "loss_nan_ranks": 0, "loss_rank_avg": 0.43060487508773804, "step": 100, "valid_targets_mean": 2525.8, "valid_targets_min": 691 }, { "epoch": 0.11029411764705882, "grad_norm": 0.8328052594807136, "learning_rate": 6.2368815592203904e-06, "loss": 0.4351, "loss_nan_ranks": 0, "loss_rank_avg": 0.43569284677505493, "step": 105, "valid_targets_mean": 2433.1, "valid_targets_min": 681 }, { "epoch": 0.11554621848739496, "grad_norm": 0.8004894157898372, "learning_rate": 6.536731634182909e-06, "loss": 0.435, "loss_nan_ranks": 0, "loss_rank_avg": 0.4115639328956604, "step": 110, "valid_targets_mean": 2809.9, "valid_targets_min": 1462 }, { "epoch": 0.1207983193277311, "grad_norm": 0.8370123985640117, "learning_rate": 6.8365817091454274e-06, "loss": 0.4329, "loss_nan_ranks": 0, "loss_rank_avg": 0.40281569957733154, "step": 115, "valid_targets_mean": 2199.2, "valid_targets_min": 740 }, { "epoch": 0.12605042016806722, "grad_norm": 0.8695717739921266, "learning_rate": 7.136431784107947e-06, "loss": 0.4223, "loss_nan_ranks": 0, "loss_rank_avg": 0.4021134674549103, "step": 120, "valid_targets_mean": 2273.1, "valid_targets_min": 686 }, { "epoch": 0.13130252100840337, "grad_norm": 0.8006986968807501, "learning_rate": 7.436281859070465e-06, "loss": 0.4335, "loss_nan_ranks": 0, "loss_rank_avg": 0.4061618447303772, "step": 125, "valid_targets_mean": 2860.1, "valid_targets_min": 1215 }, { "epoch": 0.13655462184873948, "grad_norm": 0.8969789811481348, "learning_rate": 7.736131934032984e-06, "loss": 0.4152, "loss_nan_ranks": 0, "loss_rank_avg": 0.47167330980300903, "step": 130, "valid_targets_mean": 2499.8, "valid_targets_min": 1218 }, { "epoch": 0.14180672268907563, "grad_norm": 0.8068868280254967, "learning_rate": 8.035982008995503e-06, "loss": 0.4163, "loss_nan_ranks": 0, "loss_rank_avg": 0.4264189898967743, "step": 135, "valid_targets_mean": 2426.6, "valid_targets_min": 985 }, { "epoch": 0.14705882352941177, "grad_norm": 0.9031868308784958, "learning_rate": 8.335832083958023e-06, "loss": 0.4126, "loss_nan_ranks": 0, "loss_rank_avg": 0.4020998775959015, "step": 140, "valid_targets_mean": 2240.5, "valid_targets_min": 768 }, { "epoch": 0.15231092436974789, "grad_norm": 0.7811330017492059, "learning_rate": 8.63568215892054e-06, "loss": 0.3964, "loss_nan_ranks": 0, "loss_rank_avg": 0.4105680286884308, "step": 145, "valid_targets_mean": 2559.5, "valid_targets_min": 870 }, { "epoch": 0.15756302521008403, "grad_norm": 0.8087924248265574, "learning_rate": 8.93553223388306e-06, "loss": 0.4058, "loss_nan_ranks": 0, "loss_rank_avg": 0.4330301880836487, "step": 150, "valid_targets_mean": 2632.9, "valid_targets_min": 1231 }, { "epoch": 0.16281512605042017, "grad_norm": 0.7719589146187298, "learning_rate": 9.235382308845579e-06, "loss": 0.3981, "loss_nan_ranks": 0, "loss_rank_avg": 0.3908872604370117, "step": 155, "valid_targets_mean": 2874.4, "valid_targets_min": 730 }, { "epoch": 0.16806722689075632, "grad_norm": 0.8718120536448756, "learning_rate": 9.535232383808097e-06, "loss": 0.3981, "loss_nan_ranks": 0, "loss_rank_avg": 0.41889429092407227, "step": 160, "valid_targets_mean": 2393.1, "valid_targets_min": 737 }, { "epoch": 0.17331932773109243, "grad_norm": 0.8830904007290984, "learning_rate": 9.835082458770614e-06, "loss": 0.4037, "loss_nan_ranks": 0, "loss_rank_avg": 0.38836172223091125, "step": 165, "valid_targets_mean": 2164.8, "valid_targets_min": 819 }, { "epoch": 0.17857142857142858, "grad_norm": 0.8311418026284046, "learning_rate": 1.0134932533733135e-05, "loss": 0.3887, "loss_nan_ranks": 0, "loss_rank_avg": 0.3843948543071747, "step": 170, "valid_targets_mean": 2470.9, "valid_targets_min": 1080 }, { "epoch": 0.18382352941176472, "grad_norm": 0.8211185772584042, "learning_rate": 1.0434782608695653e-05, "loss": 0.4169, "loss_nan_ranks": 0, "loss_rank_avg": 0.4080219268798828, "step": 175, "valid_targets_mean": 2487.4, "valid_targets_min": 688 }, { "epoch": 0.18907563025210083, "grad_norm": 0.8630859100580258, "learning_rate": 1.0734632683658172e-05, "loss": 0.3844, "loss_nan_ranks": 0, "loss_rank_avg": 0.42095762491226196, "step": 180, "valid_targets_mean": 2252.2, "valid_targets_min": 744 }, { "epoch": 0.19432773109243698, "grad_norm": 0.7978994945119684, "learning_rate": 1.103448275862069e-05, "loss": 0.3844, "loss_nan_ranks": 0, "loss_rank_avg": 0.41790223121643066, "step": 185, "valid_targets_mean": 2912.1, "valid_targets_min": 940 }, { "epoch": 0.19957983193277312, "grad_norm": 0.8619777697515183, "learning_rate": 1.1334332833583211e-05, "loss": 0.3922, "loss_nan_ranks": 0, "loss_rank_avg": 0.4195566773414612, "step": 190, "valid_targets_mean": 2451.5, "valid_targets_min": 923 }, { "epoch": 0.20483193277310924, "grad_norm": 0.8075469823787889, "learning_rate": 1.1634182908545729e-05, "loss": 0.381, "loss_nan_ranks": 0, "loss_rank_avg": 0.3835638463497162, "step": 195, "valid_targets_mean": 2334.6, "valid_targets_min": 634 }, { "epoch": 0.21008403361344538, "grad_norm": 0.7886022090561562, "learning_rate": 1.1934032983508246e-05, "loss": 0.3732, "loss_nan_ranks": 0, "loss_rank_avg": 0.41375166177749634, "step": 200, "valid_targets_mean": 2972.5, "valid_targets_min": 1031 }, { "epoch": 0.21533613445378152, "grad_norm": 0.8061255296748036, "learning_rate": 1.2233883058470766e-05, "loss": 0.3888, "loss_nan_ranks": 0, "loss_rank_avg": 0.4238708019256592, "step": 205, "valid_targets_mean": 2525.8, "valid_targets_min": 625 }, { "epoch": 0.22058823529411764, "grad_norm": 0.8001397668970225, "learning_rate": 1.2533733133433283e-05, "loss": 0.3628, "loss_nan_ranks": 0, "loss_rank_avg": 0.3657309412956238, "step": 210, "valid_targets_mean": 2680.4, "valid_targets_min": 670 }, { "epoch": 0.22584033613445378, "grad_norm": 0.7848361664620995, "learning_rate": 1.2833583208395803e-05, "loss": 0.3762, "loss_nan_ranks": 0, "loss_rank_avg": 0.37307411432266235, "step": 215, "valid_targets_mean": 2759.8, "valid_targets_min": 748 }, { "epoch": 0.23109243697478993, "grad_norm": 0.9451943941703829, "learning_rate": 1.313343328335832e-05, "loss": 0.3721, "loss_nan_ranks": 0, "loss_rank_avg": 0.35972413420677185, "step": 220, "valid_targets_mean": 1986.0, "valid_targets_min": 1143 }, { "epoch": 0.23634453781512604, "grad_norm": 1.0257525942300505, "learning_rate": 1.3433283358320841e-05, "loss": 0.3903, "loss_nan_ranks": 0, "loss_rank_avg": 0.37196558713912964, "step": 225, "valid_targets_mean": 2237.6, "valid_targets_min": 1023 }, { "epoch": 0.2415966386554622, "grad_norm": 0.8450544047029999, "learning_rate": 1.3733133433283359e-05, "loss": 0.3774, "loss_nan_ranks": 0, "loss_rank_avg": 0.400920033454895, "step": 230, "valid_targets_mean": 2558.1, "valid_targets_min": 843 }, { "epoch": 0.24684873949579833, "grad_norm": 0.8081787234697447, "learning_rate": 1.4032983508245878e-05, "loss": 0.3585, "loss_nan_ranks": 0, "loss_rank_avg": 0.35195618867874146, "step": 235, "valid_targets_mean": 2621.5, "valid_targets_min": 749 }, { "epoch": 0.25210084033613445, "grad_norm": 0.8046828946061387, "learning_rate": 1.4332833583208396e-05, "loss": 0.3612, "loss_nan_ranks": 0, "loss_rank_avg": 0.340299516916275, "step": 240, "valid_targets_mean": 2374.2, "valid_targets_min": 1079 }, { "epoch": 0.25735294117647056, "grad_norm": 0.6971318909820771, "learning_rate": 1.4632683658170917e-05, "loss": 0.357, "loss_nan_ranks": 0, "loss_rank_avg": 0.3586806356906891, "step": 245, "valid_targets_mean": 3350.4, "valid_targets_min": 707 }, { "epoch": 0.26260504201680673, "grad_norm": 0.8055301071475804, "learning_rate": 1.4932533733133435e-05, "loss": 0.3433, "loss_nan_ranks": 0, "loss_rank_avg": 0.3433215320110321, "step": 250, "valid_targets_mean": 2368.8, "valid_targets_min": 640 }, { "epoch": 0.26785714285714285, "grad_norm": 0.8154286910342443, "learning_rate": 1.5232383808095954e-05, "loss": 0.358, "loss_nan_ranks": 0, "loss_rank_avg": 0.33199673891067505, "step": 255, "valid_targets_mean": 2458.3, "valid_targets_min": 867 }, { "epoch": 0.27310924369747897, "grad_norm": 0.8416573919590596, "learning_rate": 1.5532233883058472e-05, "loss": 0.3717, "loss_nan_ranks": 0, "loss_rank_avg": 0.3616263270378113, "step": 260, "valid_targets_mean": 2318.0, "valid_targets_min": 848 }, { "epoch": 0.27836134453781514, "grad_norm": 0.7678040770406672, "learning_rate": 1.5832083958020993e-05, "loss": 0.3621, "loss_nan_ranks": 0, "loss_rank_avg": 0.32790547609329224, "step": 265, "valid_targets_mean": 2317.4, "valid_targets_min": 597 }, { "epoch": 0.28361344537815125, "grad_norm": 0.8164391899177017, "learning_rate": 1.613193403298351e-05, "loss": 0.3392, "loss_nan_ranks": 0, "loss_rank_avg": 0.2930743098258972, "step": 270, "valid_targets_mean": 2118.6, "valid_targets_min": 692 }, { "epoch": 0.28886554621848737, "grad_norm": 0.8248688372806788, "learning_rate": 1.6431784107946028e-05, "loss": 0.3646, "loss_nan_ranks": 0, "loss_rank_avg": 0.3935636579990387, "step": 275, "valid_targets_mean": 2466.6, "valid_targets_min": 589 }, { "epoch": 0.29411764705882354, "grad_norm": 0.8270276632057298, "learning_rate": 1.6731634182908546e-05, "loss": 0.3683, "loss_nan_ranks": 0, "loss_rank_avg": 0.36888253688812256, "step": 280, "valid_targets_mean": 2239.0, "valid_targets_min": 765 }, { "epoch": 0.29936974789915966, "grad_norm": 0.8394101421073619, "learning_rate": 1.7031484257871064e-05, "loss": 0.3563, "loss_nan_ranks": 0, "loss_rank_avg": 0.3346269130706787, "step": 285, "valid_targets_mean": 2003.6, "valid_targets_min": 686 }, { "epoch": 0.30462184873949577, "grad_norm": 0.7147367181058835, "learning_rate": 1.7331334332833585e-05, "loss": 0.3588, "loss_nan_ranks": 0, "loss_rank_avg": 0.3740352988243103, "step": 290, "valid_targets_mean": 3159.9, "valid_targets_min": 1551 }, { "epoch": 0.30987394957983194, "grad_norm": 0.8491621210785679, "learning_rate": 1.7631184407796102e-05, "loss": 0.3563, "loss_nan_ranks": 0, "loss_rank_avg": 0.357749342918396, "step": 295, "valid_targets_mean": 2103.2, "valid_targets_min": 782 }, { "epoch": 0.31512605042016806, "grad_norm": 0.8318921687266874, "learning_rate": 1.7931034482758623e-05, "loss": 0.3319, "loss_nan_ranks": 0, "loss_rank_avg": 0.3408452868461609, "step": 300, "valid_targets_mean": 2045.0, "valid_targets_min": 534 }, { "epoch": 0.32037815126050423, "grad_norm": 0.8396347924881318, "learning_rate": 1.823088455772114e-05, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.3563663959503174, "step": 305, "valid_targets_mean": 2256.4, "valid_targets_min": 854 }, { "epoch": 0.32563025210084034, "grad_norm": 0.9205468135189474, "learning_rate": 1.853073463268366e-05, "loss": 0.3732, "loss_nan_ranks": 0, "loss_rank_avg": 0.39193105697631836, "step": 310, "valid_targets_mean": 2059.1, "valid_targets_min": 1011 }, { "epoch": 0.33088235294117646, "grad_norm": 0.9135710271321404, "learning_rate": 1.8830584707646176e-05, "loss": 0.3372, "loss_nan_ranks": 0, "loss_rank_avg": 0.3061055541038513, "step": 315, "valid_targets_mean": 1836.5, "valid_targets_min": 891 }, { "epoch": 0.33613445378151263, "grad_norm": 0.913185572728451, "learning_rate": 1.9130434782608697e-05, "loss": 0.3472, "loss_nan_ranks": 0, "loss_rank_avg": 0.3164549171924591, "step": 320, "valid_targets_mean": 2192.6, "valid_targets_min": 594 }, { "epoch": 0.34138655462184875, "grad_norm": 0.7411966725143038, "learning_rate": 1.9430284857571215e-05, "loss": 0.3551, "loss_nan_ranks": 0, "loss_rank_avg": 0.34439602494239807, "step": 325, "valid_targets_mean": 2740.4, "valid_targets_min": 926 }, { "epoch": 0.34663865546218486, "grad_norm": 0.7141106760577947, "learning_rate": 1.9730134932533736e-05, "loss": 0.3467, "loss_nan_ranks": 0, "loss_rank_avg": 0.3687133193016052, "step": 330, "valid_targets_mean": 2977.1, "valid_targets_min": 885 }, { "epoch": 0.35189075630252103, "grad_norm": 0.8006543236123854, "learning_rate": 2.0029985007496254e-05, "loss": 0.3435, "loss_nan_ranks": 0, "loss_rank_avg": 0.3490038514137268, "step": 335, "valid_targets_mean": 2345.1, "valid_targets_min": 733 }, { "epoch": 0.35714285714285715, "grad_norm": 0.7847814844972669, "learning_rate": 2.0329835082458775e-05, "loss": 0.3439, "loss_nan_ranks": 0, "loss_rank_avg": 0.3197982609272003, "step": 340, "valid_targets_mean": 2583.3, "valid_targets_min": 758 }, { "epoch": 0.36239495798319327, "grad_norm": 0.9492857105812816, "learning_rate": 2.0629685157421292e-05, "loss": 0.3519, "loss_nan_ranks": 0, "loss_rank_avg": 0.3854501247406006, "step": 345, "valid_targets_mean": 2491.8, "valid_targets_min": 738 }, { "epoch": 0.36764705882352944, "grad_norm": 0.9063284452571975, "learning_rate": 2.092953523238381e-05, "loss": 0.3585, "loss_nan_ranks": 0, "loss_rank_avg": 0.3553091883659363, "step": 350, "valid_targets_mean": 1893.2, "valid_targets_min": 638 }, { "epoch": 0.37289915966386555, "grad_norm": 0.7830522409215324, "learning_rate": 2.1229385307346328e-05, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.35570859909057617, "step": 355, "valid_targets_mean": 2596.5, "valid_targets_min": 571 }, { "epoch": 0.37815126050420167, "grad_norm": 0.9034654728534351, "learning_rate": 2.152923538230885e-05, "loss": 0.3633, "loss_nan_ranks": 0, "loss_rank_avg": 0.3349594175815582, "step": 360, "valid_targets_mean": 1895.6, "valid_targets_min": 675 }, { "epoch": 0.38340336134453784, "grad_norm": 0.7718514232416079, "learning_rate": 2.1829085457271363e-05, "loss": 0.3499, "loss_nan_ranks": 0, "loss_rank_avg": 0.3692238926887512, "step": 365, "valid_targets_mean": 3021.2, "valid_targets_min": 743 }, { "epoch": 0.38865546218487396, "grad_norm": 0.7100879122429138, "learning_rate": 2.2128935532233884e-05, "loss": 0.3618, "loss_nan_ranks": 0, "loss_rank_avg": 0.38098081946372986, "step": 370, "valid_targets_mean": 3113.8, "valid_targets_min": 1343 }, { "epoch": 0.3939075630252101, "grad_norm": 0.9674664797223852, "learning_rate": 2.2428785607196405e-05, "loss": 0.3563, "loss_nan_ranks": 0, "loss_rank_avg": 0.335666298866272, "step": 375, "valid_targets_mean": 1930.9, "valid_targets_min": 656 }, { "epoch": 0.39915966386554624, "grad_norm": 0.9243345478210326, "learning_rate": 2.2728635682158923e-05, "loss": 0.3336, "loss_nan_ranks": 0, "loss_rank_avg": 0.33842527866363525, "step": 380, "valid_targets_mean": 2132.2, "valid_targets_min": 780 }, { "epoch": 0.40441176470588236, "grad_norm": 0.8789172880338919, "learning_rate": 2.302848575712144e-05, "loss": 0.3538, "loss_nan_ranks": 0, "loss_rank_avg": 0.3681184947490692, "step": 385, "valid_targets_mean": 2242.4, "valid_targets_min": 636 }, { "epoch": 0.4096638655462185, "grad_norm": 0.8586032021607275, "learning_rate": 2.3328335832083958e-05, "loss": 0.3611, "loss_nan_ranks": 0, "loss_rank_avg": 0.40162259340286255, "step": 390, "valid_targets_mean": 2104.2, "valid_targets_min": 1341 }, { "epoch": 0.41491596638655465, "grad_norm": 0.7759128620985057, "learning_rate": 2.362818590704648e-05, "loss": 0.3534, "loss_nan_ranks": 0, "loss_rank_avg": 0.30948907136917114, "step": 395, "valid_targets_mean": 2376.9, "valid_targets_min": 1305 }, { "epoch": 0.42016806722689076, "grad_norm": 0.8511116280560821, "learning_rate": 2.3928035982009e-05, "loss": 0.3428, "loss_nan_ranks": 0, "loss_rank_avg": 0.335288405418396, "step": 400, "valid_targets_mean": 2221.9, "valid_targets_min": 869 }, { "epoch": 0.4254201680672269, "grad_norm": 0.8282588416488064, "learning_rate": 2.4227886056971515e-05, "loss": 0.3246, "loss_nan_ranks": 0, "loss_rank_avg": 0.2992272973060608, "step": 405, "valid_targets_mean": 2456.8, "valid_targets_min": 797 }, { "epoch": 0.43067226890756305, "grad_norm": 0.8894895733438389, "learning_rate": 2.4527736131934036e-05, "loss": 0.3417, "loss_nan_ranks": 0, "loss_rank_avg": 0.3676615357398987, "step": 410, "valid_targets_mean": 2224.9, "valid_targets_min": 1024 }, { "epoch": 0.43592436974789917, "grad_norm": 0.6776249586308555, "learning_rate": 2.4827586206896553e-05, "loss": 0.3381, "loss_nan_ranks": 0, "loss_rank_avg": 0.3416297435760498, "step": 415, "valid_targets_mean": 3067.1, "valid_targets_min": 548 }, { "epoch": 0.4411764705882353, "grad_norm": 0.775573641251283, "learning_rate": 2.5127436281859074e-05, "loss": 0.3254, "loss_nan_ranks": 0, "loss_rank_avg": 0.33019617199897766, "step": 420, "valid_targets_mean": 2569.1, "valid_targets_min": 870 }, { "epoch": 0.44642857142857145, "grad_norm": 0.8373072328217271, "learning_rate": 2.542728635682159e-05, "loss": 0.3402, "loss_nan_ranks": 0, "loss_rank_avg": 0.33131086826324463, "step": 425, "valid_targets_mean": 2256.8, "valid_targets_min": 734 }, { "epoch": 0.45168067226890757, "grad_norm": 0.8453545100732337, "learning_rate": 2.572713643178411e-05, "loss": 0.3243, "loss_nan_ranks": 0, "loss_rank_avg": 0.3512518107891083, "step": 430, "valid_targets_mean": 2501.5, "valid_targets_min": 544 }, { "epoch": 0.4569327731092437, "grad_norm": 0.8253450678943121, "learning_rate": 2.602698650674663e-05, "loss": 0.3365, "loss_nan_ranks": 0, "loss_rank_avg": 0.3878710865974426, "step": 435, "valid_targets_mean": 2262.6, "valid_targets_min": 614 }, { "epoch": 0.46218487394957986, "grad_norm": 0.6830047934435176, "learning_rate": 2.632683658170915e-05, "loss": 0.3246, "loss_nan_ranks": 0, "loss_rank_avg": 0.32986515760421753, "step": 440, "valid_targets_mean": 2881.2, "valid_targets_min": 826 }, { "epoch": 0.46743697478991597, "grad_norm": 0.7176824990335685, "learning_rate": 2.6626686656671666e-05, "loss": 0.3396, "loss_nan_ranks": 0, "loss_rank_avg": 0.3406386971473694, "step": 445, "valid_targets_mean": 2875.5, "valid_targets_min": 716 }, { "epoch": 0.4726890756302521, "grad_norm": 0.8474215992592125, "learning_rate": 2.6926536731634184e-05, "loss": 0.3537, "loss_nan_ranks": 0, "loss_rank_avg": 0.3648040294647217, "step": 450, "valid_targets_mean": 2027.9, "valid_targets_min": 826 }, { "epoch": 0.47794117647058826, "grad_norm": 1.095403929365044, "learning_rate": 2.7226386806596705e-05, "loss": 0.3518, "loss_nan_ranks": 0, "loss_rank_avg": 0.33743467926979065, "step": 455, "valid_targets_mean": 2896.9, "valid_targets_min": 922 }, { "epoch": 0.4831932773109244, "grad_norm": 0.7470324162963815, "learning_rate": 2.752623688155922e-05, "loss": 0.3492, "loss_nan_ranks": 0, "loss_rank_avg": 0.322024405002594, "step": 460, "valid_targets_mean": 2677.2, "valid_targets_min": 1139 }, { "epoch": 0.4884453781512605, "grad_norm": 0.7287288163080067, "learning_rate": 2.782608695652174e-05, "loss": 0.3337, "loss_nan_ranks": 0, "loss_rank_avg": 0.3294079601764679, "step": 465, "valid_targets_mean": 2836.6, "valid_targets_min": 668 }, { "epoch": 0.49369747899159666, "grad_norm": 0.7571889256497794, "learning_rate": 2.812593703148426e-05, "loss": 0.3408, "loss_nan_ranks": 0, "loss_rank_avg": 0.3153488337993622, "step": 470, "valid_targets_mean": 2510.1, "valid_targets_min": 713 }, { "epoch": 0.4989495798319328, "grad_norm": 0.7390238171828771, "learning_rate": 2.8425787106446782e-05, "loss": 0.3346, "loss_nan_ranks": 0, "loss_rank_avg": 0.3535560965538025, "step": 475, "valid_targets_mean": 2723.5, "valid_targets_min": 1336 }, { "epoch": 0.5042016806722689, "grad_norm": 0.7519915733907849, "learning_rate": 2.8725637181409296e-05, "loss": 0.3336, "loss_nan_ranks": 0, "loss_rank_avg": 0.35906684398651123, "step": 480, "valid_targets_mean": 2768.1, "valid_targets_min": 906 }, { "epoch": 0.509453781512605, "grad_norm": 0.8835497372225222, "learning_rate": 2.9025487256371818e-05, "loss": 0.3071, "loss_nan_ranks": 0, "loss_rank_avg": 0.30021750926971436, "step": 485, "valid_targets_mean": 1918.7, "valid_targets_min": 595 }, { "epoch": 0.5147058823529411, "grad_norm": 0.7720200309244449, "learning_rate": 2.9325337331334335e-05, "loss": 0.3371, "loss_nan_ranks": 0, "loss_rank_avg": 0.2973299026489258, "step": 490, "valid_targets_mean": 2384.1, "valid_targets_min": 768 }, { "epoch": 0.5199579831932774, "grad_norm": 0.7920180853215862, "learning_rate": 2.9625187406296856e-05, "loss": 0.3357, "loss_nan_ranks": 0, "loss_rank_avg": 0.31775835156440735, "step": 495, "valid_targets_mean": 2716.2, "valid_targets_min": 732 }, { "epoch": 0.5252100840336135, "grad_norm": 0.8442161626685477, "learning_rate": 2.992503748125937e-05, "loss": 0.3404, "loss_nan_ranks": 0, "loss_rank_avg": 0.304614782333374, "step": 500, "valid_targets_mean": 1944.6, "valid_targets_min": 898 }, { "epoch": 0.5304621848739496, "grad_norm": 0.8063704786094186, "learning_rate": 3.022488755622189e-05, "loss": 0.324, "loss_nan_ranks": 0, "loss_rank_avg": 0.3063597083091736, "step": 505, "valid_targets_mean": 2314.1, "valid_targets_min": 655 }, { "epoch": 0.5357142857142857, "grad_norm": 0.8885170741957255, "learning_rate": 3.052473763118441e-05, "loss": 0.3186, "loss_nan_ranks": 0, "loss_rank_avg": 0.301100492477417, "step": 510, "valid_targets_mean": 1699.1, "valid_targets_min": 649 }, { "epoch": 0.5409663865546218, "grad_norm": 0.7707180348154409, "learning_rate": 3.0824587706146934e-05, "loss": 0.3444, "loss_nan_ranks": 0, "loss_rank_avg": 0.33862438797950745, "step": 515, "valid_targets_mean": 2648.4, "valid_targets_min": 850 }, { "epoch": 0.5462184873949579, "grad_norm": 0.7331236147987067, "learning_rate": 3.112443778110945e-05, "loss": 0.3572, "loss_nan_ranks": 0, "loss_rank_avg": 0.3474993109703064, "step": 520, "valid_targets_mean": 2870.6, "valid_targets_min": 843 }, { "epoch": 0.5514705882352942, "grad_norm": 0.9814672284053637, "learning_rate": 3.142428785607197e-05, "loss": 0.3307, "loss_nan_ranks": 0, "loss_rank_avg": 0.334958016872406, "step": 525, "valid_targets_mean": 2415.3, "valid_targets_min": 904 }, { "epoch": 0.5567226890756303, "grad_norm": 0.7379782030619627, "learning_rate": 3.172413793103448e-05, "loss": 0.3268, "loss_nan_ranks": 0, "loss_rank_avg": 0.29642948508262634, "step": 530, "valid_targets_mean": 2672.1, "valid_targets_min": 733 }, { "epoch": 0.5619747899159664, "grad_norm": 0.7091140893245311, "learning_rate": 3.2023988005997004e-05, "loss": 0.3153, "loss_nan_ranks": 0, "loss_rank_avg": 0.28314292430877686, "step": 535, "valid_targets_mean": 2483.3, "valid_targets_min": 845 }, { "epoch": 0.5672268907563025, "grad_norm": 0.7575431351825522, "learning_rate": 3.2323838080959525e-05, "loss": 0.324, "loss_nan_ranks": 0, "loss_rank_avg": 0.33548930287361145, "step": 540, "valid_targets_mean": 2529.8, "valid_targets_min": 789 }, { "epoch": 0.5724789915966386, "grad_norm": 0.7600622983828266, "learning_rate": 3.262368815592204e-05, "loss": 0.3395, "loss_nan_ranks": 0, "loss_rank_avg": 0.3454827666282654, "step": 545, "valid_targets_mean": 2808.9, "valid_targets_min": 914 }, { "epoch": 0.5777310924369747, "grad_norm": 0.8183170811821894, "learning_rate": 3.292353823088456e-05, "loss": 0.3224, "loss_nan_ranks": 0, "loss_rank_avg": 0.35002923011779785, "step": 550, "valid_targets_mean": 2794.5, "valid_targets_min": 617 }, { "epoch": 0.582983193277311, "grad_norm": 0.8057355550873148, "learning_rate": 3.3223388305847075e-05, "loss": 0.3333, "loss_nan_ranks": 0, "loss_rank_avg": 0.3431859612464905, "step": 555, "valid_targets_mean": 2285.7, "valid_targets_min": 557 }, { "epoch": 0.5882352941176471, "grad_norm": 0.6311718548224762, "learning_rate": 3.3523238380809596e-05, "loss": 0.3372, "loss_nan_ranks": 0, "loss_rank_avg": 0.3158794641494751, "step": 560, "valid_targets_mean": 3329.5, "valid_targets_min": 1114 }, { "epoch": 0.5934873949579832, "grad_norm": 0.7483509818624398, "learning_rate": 3.382308845577212e-05, "loss": 0.3101, "loss_nan_ranks": 0, "loss_rank_avg": 0.312336266040802, "step": 565, "valid_targets_mean": 2451.1, "valid_targets_min": 692 }, { "epoch": 0.5987394957983193, "grad_norm": 0.8180747042153188, "learning_rate": 3.412293853073464e-05, "loss": 0.3288, "loss_nan_ranks": 0, "loss_rank_avg": 0.32389289140701294, "step": 570, "valid_targets_mean": 2601.9, "valid_targets_min": 658 }, { "epoch": 0.6039915966386554, "grad_norm": 0.7501508192177901, "learning_rate": 3.442278860569715e-05, "loss": 0.3178, "loss_nan_ranks": 0, "loss_rank_avg": 0.3347775936126709, "step": 575, "valid_targets_mean": 2365.9, "valid_targets_min": 795 }, { "epoch": 0.6092436974789915, "grad_norm": 0.8986962858297536, "learning_rate": 3.4722638680659673e-05, "loss": 0.3175, "loss_nan_ranks": 0, "loss_rank_avg": 0.2883639931678772, "step": 580, "valid_targets_mean": 2002.2, "valid_targets_min": 1167 }, { "epoch": 0.6144957983193278, "grad_norm": 0.7802444960510159, "learning_rate": 3.5022488755622194e-05, "loss": 0.3346, "loss_nan_ranks": 0, "loss_rank_avg": 0.32042810320854187, "step": 585, "valid_targets_mean": 2517.3, "valid_targets_min": 782 }, { "epoch": 0.6197478991596639, "grad_norm": 0.8123611572368629, "learning_rate": 3.5322338830584716e-05, "loss": 0.3421, "loss_nan_ranks": 0, "loss_rank_avg": 0.3365861773490906, "step": 590, "valid_targets_mean": 2191.0, "valid_targets_min": 741 }, { "epoch": 0.625, "grad_norm": 0.7007108414732764, "learning_rate": 3.562218890554723e-05, "loss": 0.3405, "loss_nan_ranks": 0, "loss_rank_avg": 0.3454342484474182, "step": 595, "valid_targets_mean": 2924.4, "valid_targets_min": 1165 }, { "epoch": 0.6302521008403361, "grad_norm": 0.730987978325978, "learning_rate": 3.592203898050975e-05, "loss": 0.3132, "loss_nan_ranks": 0, "loss_rank_avg": 0.29325562715530396, "step": 600, "valid_targets_mean": 2913.4, "valid_targets_min": 812 }, { "epoch": 0.6355042016806722, "grad_norm": 0.7733724038568615, "learning_rate": 3.6221889055472265e-05, "loss": 0.3195, "loss_nan_ranks": 0, "loss_rank_avg": 0.3013491928577423, "step": 605, "valid_targets_mean": 2295.1, "valid_targets_min": 850 }, { "epoch": 0.6407563025210085, "grad_norm": 0.8343650173831091, "learning_rate": 3.6521739130434786e-05, "loss": 0.3194, "loss_nan_ranks": 0, "loss_rank_avg": 0.29321059584617615, "step": 610, "valid_targets_mean": 1838.8, "valid_targets_min": 1024 }, { "epoch": 0.6460084033613446, "grad_norm": 0.8241043537661473, "learning_rate": 3.68215892053973e-05, "loss": 0.3207, "loss_nan_ranks": 0, "loss_rank_avg": 0.32989972829818726, "step": 615, "valid_targets_mean": 2260.1, "valid_targets_min": 611 }, { "epoch": 0.6512605042016807, "grad_norm": 0.8204056966498567, "learning_rate": 3.712143928035982e-05, "loss": 0.3318, "loss_nan_ranks": 0, "loss_rank_avg": 0.32474619150161743, "step": 620, "valid_targets_mean": 2229.6, "valid_targets_min": 738 }, { "epoch": 0.6565126050420168, "grad_norm": 0.7119267457996982, "learning_rate": 3.742128935532234e-05, "loss": 0.3374, "loss_nan_ranks": 0, "loss_rank_avg": 0.3413497507572174, "step": 625, "valid_targets_mean": 2606.0, "valid_targets_min": 886 }, { "epoch": 0.6617647058823529, "grad_norm": 0.8282736254561877, "learning_rate": 3.772113943028486e-05, "loss": 0.3145, "loss_nan_ranks": 0, "loss_rank_avg": 0.30755430459976196, "step": 630, "valid_targets_mean": 1902.6, "valid_targets_min": 933 }, { "epoch": 0.667016806722689, "grad_norm": 0.7523816591845006, "learning_rate": 3.802098950524738e-05, "loss": 0.3373, "loss_nan_ranks": 0, "loss_rank_avg": 0.34018948674201965, "step": 635, "valid_targets_mean": 2412.2, "valid_targets_min": 727 }, { "epoch": 0.6722689075630253, "grad_norm": 0.762541870874189, "learning_rate": 3.83208395802099e-05, "loss": 0.3223, "loss_nan_ranks": 0, "loss_rank_avg": 0.3180159330368042, "step": 640, "valid_targets_mean": 2287.2, "valid_targets_min": 994 }, { "epoch": 0.6775210084033614, "grad_norm": 1.0029207465299363, "learning_rate": 3.862068965517242e-05, "loss": 0.3572, "loss_nan_ranks": 0, "loss_rank_avg": 0.33629217743873596, "step": 645, "valid_targets_mean": 2997.9, "valid_targets_min": 1170 }, { "epoch": 0.6827731092436975, "grad_norm": 0.7213964566380182, "learning_rate": 3.8920539730134934e-05, "loss": 0.3128, "loss_nan_ranks": 0, "loss_rank_avg": 0.2845936417579651, "step": 650, "valid_targets_mean": 2431.8, "valid_targets_min": 657 }, { "epoch": 0.6880252100840336, "grad_norm": 0.8519735795162455, "learning_rate": 3.9220389805097455e-05, "loss": 0.3433, "loss_nan_ranks": 0, "loss_rank_avg": 0.3487856984138489, "step": 655, "valid_targets_mean": 2218.6, "valid_targets_min": 954 }, { "epoch": 0.6932773109243697, "grad_norm": 0.7046220956008892, "learning_rate": 3.9520239880059976e-05, "loss": 0.3199, "loss_nan_ranks": 0, "loss_rank_avg": 0.3212737441062927, "step": 660, "valid_targets_mean": 2970.2, "valid_targets_min": 1285 }, { "epoch": 0.6985294117647058, "grad_norm": 0.7336185220602566, "learning_rate": 3.982008995502249e-05, "loss": 0.3157, "loss_nan_ranks": 0, "loss_rank_avg": 0.3486784100532532, "step": 665, "valid_targets_mean": 2758.5, "valid_targets_min": 924 }, { "epoch": 0.7037815126050421, "grad_norm": 0.8287435711662308, "learning_rate": 3.9999989022799437e-05, "loss": 0.3279, "loss_nan_ranks": 0, "loss_rank_avg": 0.3096350431442261, "step": 670, "valid_targets_mean": 1968.1, "valid_targets_min": 890 }, { "epoch": 0.7090336134453782, "grad_norm": 0.8202847564434639, "learning_rate": 3.9999865529431466e-05, "loss": 0.3302, "loss_nan_ranks": 0, "loss_rank_avg": 0.3207584023475647, "step": 675, "valid_targets_mean": 2397.3, "valid_targets_min": 792 }, { "epoch": 0.7142857142857143, "grad_norm": 0.6219543558575774, "learning_rate": 3.9999604822044886e-05, "loss": 0.3056, "loss_nan_ranks": 0, "loss_rank_avg": 0.2984098196029663, "step": 680, "valid_targets_mean": 3388.2, "valid_targets_min": 1117 }, { "epoch": 0.7195378151260504, "grad_norm": 0.7173660798726208, "learning_rate": 3.999920690242835e-05, "loss": 0.304, "loss_nan_ranks": 0, "loss_rank_avg": 0.29944783449172974, "step": 685, "valid_targets_mean": 2623.8, "valid_targets_min": 768 }, { "epoch": 0.7247899159663865, "grad_norm": 0.6960902757404932, "learning_rate": 3.999867177331189e-05, "loss": 0.3217, "loss_nan_ranks": 0, "loss_rank_avg": 0.3305845856666565, "step": 690, "valid_targets_mean": 3031.8, "valid_targets_min": 1091 }, { "epoch": 0.7300420168067226, "grad_norm": 0.9054223785892286, "learning_rate": 3.9997999438366895e-05, "loss": 0.3396, "loss_nan_ranks": 0, "loss_rank_avg": 0.33356064558029175, "step": 695, "valid_targets_mean": 2308.3, "valid_targets_min": 989 }, { "epoch": 0.7352941176470589, "grad_norm": 0.7885273248848218, "learning_rate": 3.9997189902206065e-05, "loss": 0.3376, "loss_nan_ranks": 0, "loss_rank_avg": 0.35361307859420776, "step": 700, "valid_targets_mean": 2145.7, "valid_targets_min": 732 }, { "epoch": 0.740546218487395, "grad_norm": 0.7007173394110273, "learning_rate": 3.999624317038344e-05, "loss": 0.3054, "loss_nan_ranks": 0, "loss_rank_avg": 0.3023601770401001, "step": 705, "valid_targets_mean": 3050.5, "valid_targets_min": 677 }, { "epoch": 0.7457983193277311, "grad_norm": 0.6606567930836675, "learning_rate": 3.9995159249394303e-05, "loss": 0.3167, "loss_nan_ranks": 0, "loss_rank_avg": 0.34521594643592834, "step": 710, "valid_targets_mean": 2787.5, "valid_targets_min": 657 }, { "epoch": 0.7510504201680672, "grad_norm": 0.7674014202376552, "learning_rate": 3.999393814667517e-05, "loss": 0.3251, "loss_nan_ranks": 0, "loss_rank_avg": 0.3120829164981842, "step": 715, "valid_targets_mean": 2107.4, "valid_targets_min": 771 }, { "epoch": 0.7563025210084033, "grad_norm": 0.778065171637885, "learning_rate": 3.9992579870603695e-05, "loss": 0.3154, "loss_nan_ranks": 0, "loss_rank_avg": 0.3578265905380249, "step": 720, "valid_targets_mean": 2320.1, "valid_targets_min": 881 }, { "epoch": 0.7615546218487395, "grad_norm": 0.6597642723911712, "learning_rate": 3.999108443049869e-05, "loss": 0.3072, "loss_nan_ranks": 0, "loss_rank_avg": 0.3022955656051636, "step": 725, "valid_targets_mean": 2848.9, "valid_targets_min": 1035 }, { "epoch": 0.7668067226890757, "grad_norm": 0.7875093632298531, "learning_rate": 3.998945183661997e-05, "loss": 0.3373, "loss_nan_ranks": 0, "loss_rank_avg": 0.2969299256801605, "step": 730, "valid_targets_mean": 2284.4, "valid_targets_min": 783 }, { "epoch": 0.7720588235294118, "grad_norm": 0.718806100635945, "learning_rate": 3.9987682100168376e-05, "loss": 0.314, "loss_nan_ranks": 0, "loss_rank_avg": 0.30758941173553467, "step": 735, "valid_targets_mean": 3248.9, "valid_targets_min": 888 }, { "epoch": 0.7773109243697479, "grad_norm": 0.6716380195670248, "learning_rate": 3.99857752332856e-05, "loss": 0.3062, "loss_nan_ranks": 0, "loss_rank_avg": 0.29802027344703674, "step": 740, "valid_targets_mean": 2760.8, "valid_targets_min": 917 }, { "epoch": 0.782563025210084, "grad_norm": 0.7048509390731609, "learning_rate": 3.998373124905418e-05, "loss": 0.3266, "loss_nan_ranks": 0, "loss_rank_avg": 0.346552312374115, "step": 745, "valid_targets_mean": 2789.3, "valid_targets_min": 778 }, { "epoch": 0.7878151260504201, "grad_norm": 0.6889434405961281, "learning_rate": 3.9981550161497375e-05, "loss": 0.3285, "loss_nan_ranks": 0, "loss_rank_avg": 0.30958837270736694, "step": 750, "valid_targets_mean": 2730.2, "valid_targets_min": 815 }, { "epoch": 0.7930672268907563, "grad_norm": 0.830218274291599, "learning_rate": 3.9979231985579074e-05, "loss": 0.3098, "loss_nan_ranks": 0, "loss_rank_avg": 0.29535311460494995, "step": 755, "valid_targets_mean": 2651.5, "valid_targets_min": 750 }, { "epoch": 0.7983193277310925, "grad_norm": 0.869991526672995, "learning_rate": 3.99767767372037e-05, "loss": 0.3155, "loss_nan_ranks": 0, "loss_rank_avg": 0.2807968854904175, "step": 760, "valid_targets_mean": 1711.4, "valid_targets_min": 699 }, { "epoch": 0.8035714285714286, "grad_norm": 0.7081493643105407, "learning_rate": 3.997418443321609e-05, "loss": 0.3097, "loss_nan_ranks": 0, "loss_rank_avg": 0.32702767848968506, "step": 765, "valid_targets_mean": 2585.1, "valid_targets_min": 572 }, { "epoch": 0.8088235294117647, "grad_norm": 0.8332144275405594, "learning_rate": 3.997145509140138e-05, "loss": 0.3095, "loss_nan_ranks": 0, "loss_rank_avg": 0.31555208563804626, "step": 770, "valid_targets_mean": 2041.9, "valid_targets_min": 785 }, { "epoch": 0.8140756302521008, "grad_norm": 0.6009347239627268, "learning_rate": 3.9968588730484896e-05, "loss": 0.3284, "loss_nan_ranks": 0, "loss_rank_avg": 0.34607839584350586, "step": 775, "valid_targets_mean": 3614.8, "valid_targets_min": 1437 }, { "epoch": 0.819327731092437, "grad_norm": 0.7137919217562437, "learning_rate": 3.9965585370132013e-05, "loss": 0.314, "loss_nan_ranks": 0, "loss_rank_avg": 0.30686646699905396, "step": 780, "valid_targets_mean": 2493.3, "valid_targets_min": 893 }, { "epoch": 0.8245798319327731, "grad_norm": 0.921127052828424, "learning_rate": 3.996244503094804e-05, "loss": 0.3143, "loss_nan_ranks": 0, "loss_rank_avg": 0.29819056391716003, "step": 785, "valid_targets_mean": 1954.9, "valid_targets_min": 880 }, { "epoch": 0.8298319327731093, "grad_norm": 0.7650761079657684, "learning_rate": 3.995916773447804e-05, "loss": 0.3196, "loss_nan_ranks": 0, "loss_rank_avg": 0.2871814966201782, "step": 790, "valid_targets_mean": 2216.4, "valid_targets_min": 746 }, { "epoch": 0.8350840336134454, "grad_norm": 0.7916639791964368, "learning_rate": 3.995575350320671e-05, "loss": 0.3237, "loss_nan_ranks": 0, "loss_rank_avg": 0.3441137373447418, "step": 795, "valid_targets_mean": 2616.8, "valid_targets_min": 848 }, { "epoch": 0.8403361344537815, "grad_norm": 0.6287517180487977, "learning_rate": 3.995220236055824e-05, "loss": 0.3135, "loss_nan_ranks": 0, "loss_rank_avg": 0.31627726554870605, "step": 800, "valid_targets_mean": 3041.9, "valid_targets_min": 744 }, { "epoch": 0.8455882352941176, "grad_norm": 0.6231303563829806, "learning_rate": 3.99485143308961e-05, "loss": 0.3099, "loss_nan_ranks": 0, "loss_rank_avg": 0.3036961853504181, "step": 805, "valid_targets_mean": 3131.9, "valid_targets_min": 974 }, { "epoch": 0.8508403361344538, "grad_norm": 0.7183070177297722, "learning_rate": 3.994468943952296e-05, "loss": 0.3272, "loss_nan_ranks": 0, "loss_rank_avg": 0.32938453555107117, "step": 810, "valid_targets_mean": 2472.3, "valid_targets_min": 867 }, { "epoch": 0.8560924369747899, "grad_norm": 0.7681753001830797, "learning_rate": 3.994072771268041e-05, "loss": 0.3195, "loss_nan_ranks": 0, "loss_rank_avg": 0.3146156072616577, "step": 815, "valid_targets_mean": 2485.6, "valid_targets_min": 903 }, { "epoch": 0.8613445378151261, "grad_norm": 0.6508689610348719, "learning_rate": 3.993662917754885e-05, "loss": 0.3127, "loss_nan_ranks": 0, "loss_rank_avg": 0.32557421922683716, "step": 820, "valid_targets_mean": 2845.4, "valid_targets_min": 692 }, { "epoch": 0.8665966386554622, "grad_norm": 0.7108824995997928, "learning_rate": 3.993239386224732e-05, "loss": 0.3082, "loss_nan_ranks": 0, "loss_rank_avg": 0.27090033888816833, "step": 825, "valid_targets_mean": 2473.5, "valid_targets_min": 734 }, { "epoch": 0.8718487394957983, "grad_norm": 0.7733012632993366, "learning_rate": 3.992802179583322e-05, "loss": 0.3199, "loss_nan_ranks": 0, "loss_rank_avg": 0.32703638076782227, "step": 830, "valid_targets_mean": 2476.1, "valid_targets_min": 773 }, { "epoch": 0.8771008403361344, "grad_norm": 0.725543154459089, "learning_rate": 3.9923513008302204e-05, "loss": 0.3169, "loss_nan_ranks": 0, "loss_rank_avg": 0.34420400857925415, "step": 835, "valid_targets_mean": 2456.4, "valid_targets_min": 1279 }, { "epoch": 0.8823529411764706, "grad_norm": 0.6577502601354023, "learning_rate": 3.991886753058792e-05, "loss": 0.3014, "loss_nan_ranks": 0, "loss_rank_avg": 0.27701324224472046, "step": 840, "valid_targets_mean": 2375.6, "valid_targets_min": 692 }, { "epoch": 0.8876050420168067, "grad_norm": 0.6971018819451299, "learning_rate": 3.991408539456182e-05, "loss": 0.3292, "loss_nan_ranks": 0, "loss_rank_avg": 0.29996004700660706, "step": 845, "valid_targets_mean": 2597.3, "valid_targets_min": 1058 }, { "epoch": 0.8928571428571429, "grad_norm": 0.6864026260317219, "learning_rate": 3.990916663303293e-05, "loss": 0.3211, "loss_nan_ranks": 0, "loss_rank_avg": 0.3099818229675293, "step": 850, "valid_targets_mean": 2555.9, "valid_targets_min": 1232 }, { "epoch": 0.898109243697479, "grad_norm": 0.6612404353720289, "learning_rate": 3.990411127974762e-05, "loss": 0.2985, "loss_nan_ranks": 0, "loss_rank_avg": 0.32130175828933716, "step": 855, "valid_targets_mean": 3308.6, "valid_targets_min": 727 }, { "epoch": 0.9033613445378151, "grad_norm": 0.8109760616029387, "learning_rate": 3.989891936938939e-05, "loss": 0.297, "loss_nan_ranks": 0, "loss_rank_avg": 0.30671462416648865, "step": 860, "valid_targets_mean": 1730.1, "valid_targets_min": 635 }, { "epoch": 0.9086134453781513, "grad_norm": 0.7674061973927943, "learning_rate": 3.9893590937578634e-05, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.35476604104042053, "step": 865, "valid_targets_mean": 1927.0, "valid_targets_min": 882 }, { "epoch": 0.9138655462184874, "grad_norm": 0.8917074057700859, "learning_rate": 3.9888126020872375e-05, "loss": 0.3193, "loss_nan_ranks": 0, "loss_rank_avg": 0.3417109251022339, "step": 870, "valid_targets_mean": 2367.9, "valid_targets_min": 956 }, { "epoch": 0.9191176470588235, "grad_norm": 0.7447344177878483, "learning_rate": 3.988252465676401e-05, "loss": 0.332, "loss_nan_ranks": 0, "loss_rank_avg": 0.3013457655906677, "step": 875, "valid_targets_mean": 2151.2, "valid_targets_min": 715 }, { "epoch": 0.9243697478991597, "grad_norm": 0.6389313482178219, "learning_rate": 3.98767868836831e-05, "loss": 0.2987, "loss_nan_ranks": 0, "loss_rank_avg": 0.3207515478134155, "step": 880, "valid_targets_mean": 3044.4, "valid_targets_min": 698 }, { "epoch": 0.9296218487394958, "grad_norm": 0.7460485228221652, "learning_rate": 3.987091274099504e-05, "loss": 0.3008, "loss_nan_ranks": 0, "loss_rank_avg": 0.298840194940567, "step": 885, "valid_targets_mean": 2523.6, "valid_targets_min": 750 }, { "epoch": 0.9348739495798319, "grad_norm": 0.7123957413614789, "learning_rate": 3.986490226900084e-05, "loss": 0.2958, "loss_nan_ranks": 0, "loss_rank_avg": 0.3151017725467682, "step": 890, "valid_targets_mean": 2639.6, "valid_targets_min": 856 }, { "epoch": 0.9401260504201681, "grad_norm": 0.8425889968517829, "learning_rate": 3.985875550893684e-05, "loss": 0.3007, "loss_nan_ranks": 0, "loss_rank_avg": 0.3078573942184448, "step": 895, "valid_targets_mean": 2052.1, "valid_targets_min": 634 }, { "epoch": 0.9453781512605042, "grad_norm": 0.6910638587235646, "learning_rate": 3.9852472502974386e-05, "loss": 0.2981, "loss_nan_ranks": 0, "loss_rank_avg": 0.3093729019165039, "step": 900, "valid_targets_mean": 2373.8, "valid_targets_min": 919 }, { "epoch": 0.9506302521008403, "grad_norm": 0.67274771832946, "learning_rate": 3.984605329421961e-05, "loss": 0.3064, "loss_nan_ranks": 0, "loss_rank_avg": 0.3389376997947693, "step": 905, "valid_targets_mean": 2981.9, "valid_targets_min": 822 }, { "epoch": 0.9558823529411765, "grad_norm": 0.7287563442852749, "learning_rate": 3.983949792671307e-05, "loss": 0.2871, "loss_nan_ranks": 0, "loss_rank_avg": 0.29178452491760254, "step": 910, "valid_targets_mean": 2206.9, "valid_targets_min": 953 }, { "epoch": 0.9611344537815126, "grad_norm": 0.6697336132699603, "learning_rate": 3.9832806445429486e-05, "loss": 0.3059, "loss_nan_ranks": 0, "loss_rank_avg": 0.2787833511829376, "step": 915, "valid_targets_mean": 2421.2, "valid_targets_min": 1033 }, { "epoch": 0.9663865546218487, "grad_norm": 0.7721239770788888, "learning_rate": 3.982597889627742e-05, "loss": 0.3084, "loss_nan_ranks": 0, "loss_rank_avg": 0.3243314027786255, "step": 920, "valid_targets_mean": 2458.9, "valid_targets_min": 713 }, { "epoch": 0.9716386554621849, "grad_norm": 0.6890378426610851, "learning_rate": 3.981901532609896e-05, "loss": 0.313, "loss_nan_ranks": 0, "loss_rank_avg": 0.3086700439453125, "step": 925, "valid_targets_mean": 2401.8, "valid_targets_min": 926 }, { "epoch": 0.976890756302521, "grad_norm": 0.7281226712845131, "learning_rate": 3.9811915782669406e-05, "loss": 0.3124, "loss_nan_ranks": 0, "loss_rank_avg": 0.27539515495300293, "step": 930, "valid_targets_mean": 2145.1, "valid_targets_min": 725 }, { "epoch": 0.9821428571428571, "grad_norm": 0.7223280692952256, "learning_rate": 3.980468031469691e-05, "loss": 0.3144, "loss_nan_ranks": 0, "loss_rank_avg": 0.2952006459236145, "step": 935, "valid_targets_mean": 2334.9, "valid_targets_min": 1055 }, { "epoch": 0.9873949579831933, "grad_norm": 0.7460709191349191, "learning_rate": 3.9797308971822206e-05, "loss": 0.3175, "loss_nan_ranks": 0, "loss_rank_avg": 0.3261488676071167, "step": 940, "valid_targets_mean": 2191.4, "valid_targets_min": 684 }, { "epoch": 0.9926470588235294, "grad_norm": 0.6186791687377395, "learning_rate": 3.978980180461821e-05, "loss": 0.3292, "loss_nan_ranks": 0, "loss_rank_avg": 0.33339810371398926, "step": 945, "valid_targets_mean": 3133.6, "valid_targets_min": 816 }, { "epoch": 0.9978991596638656, "grad_norm": 0.8177731068661213, "learning_rate": 3.9782158864589696e-05, "loss": 0.3013, "loss_nan_ranks": 0, "loss_rank_avg": 0.27547362446784973, "step": 950, "valid_targets_mean": 1856.8, "valid_targets_min": 736 }, { "epoch": 1.0031512605042017, "grad_norm": 0.7256412516546766, "learning_rate": 3.977438020417293e-05, "loss": 0.2844, "loss_nan_ranks": 0, "loss_rank_avg": 0.305136114358902, "step": 955, "valid_targets_mean": 2359.5, "valid_targets_min": 734 }, { "epoch": 1.0084033613445378, "grad_norm": 0.7379697373188653, "learning_rate": 3.9766465876735354e-05, "loss": 0.2853, "loss_nan_ranks": 0, "loss_rank_avg": 0.2883484661579132, "step": 960, "valid_targets_mean": 2517.8, "valid_targets_min": 723 }, { "epoch": 1.013655462184874, "grad_norm": 0.7450004669339628, "learning_rate": 3.9758415936575155e-05, "loss": 0.2694, "loss_nan_ranks": 0, "loss_rank_avg": 0.2624656856060028, "step": 965, "valid_targets_mean": 2335.6, "valid_targets_min": 697 }, { "epoch": 1.01890756302521, "grad_norm": 0.8213378024423946, "learning_rate": 3.975023043892094e-05, "loss": 0.2998, "loss_nan_ranks": 0, "loss_rank_avg": 0.3582037091255188, "step": 970, "valid_targets_mean": 2665.7, "valid_targets_min": 730 }, { "epoch": 1.0241596638655461, "grad_norm": 1.1203862991152767, "learning_rate": 3.974190943993133e-05, "loss": 0.2855, "loss_nan_ranks": 0, "loss_rank_avg": 0.2818828821182251, "step": 975, "valid_targets_mean": 1555.1, "valid_targets_min": 668 }, { "epoch": 1.0294117647058822, "grad_norm": 0.5968672236493667, "learning_rate": 3.973345299669461e-05, "loss": 0.2909, "loss_nan_ranks": 0, "loss_rank_avg": 0.24849054217338562, "step": 980, "valid_targets_mean": 3073.6, "valid_targets_min": 745 }, { "epoch": 1.0346638655462186, "grad_norm": 0.6412679780590781, "learning_rate": 3.972486116722828e-05, "loss": 0.2966, "loss_nan_ranks": 0, "loss_rank_avg": 0.270571231842041, "step": 985, "valid_targets_mean": 2620.9, "valid_targets_min": 1058 }, { "epoch": 1.0399159663865547, "grad_norm": 0.658674789610642, "learning_rate": 3.971613401047872e-05, "loss": 0.2928, "loss_nan_ranks": 0, "loss_rank_avg": 0.28596004843711853, "step": 990, "valid_targets_mean": 2736.1, "valid_targets_min": 696 }, { "epoch": 1.0451680672268908, "grad_norm": 0.708522171289682, "learning_rate": 3.970727158632075e-05, "loss": 0.2791, "loss_nan_ranks": 0, "loss_rank_avg": 0.25710612535476685, "step": 995, "valid_targets_mean": 2025.1, "valid_targets_min": 742 }, { "epoch": 1.050420168067227, "grad_norm": 0.8163565196188108, "learning_rate": 3.969827395555721e-05, "loss": 0.2842, "loss_nan_ranks": 0, "loss_rank_avg": 0.3168991506099701, "step": 1000, "valid_targets_mean": 2106.7, "valid_targets_min": 901 }, { "epoch": 1.055672268907563, "grad_norm": 0.7814582268431446, "learning_rate": 3.968914117991857e-05, "loss": 0.2953, "loss_nan_ranks": 0, "loss_rank_avg": 0.269026517868042, "step": 1005, "valid_targets_mean": 2927.3, "valid_targets_min": 936 }, { "epoch": 1.0609243697478992, "grad_norm": 0.7483470353521008, "learning_rate": 3.967987332206249e-05, "loss": 0.2864, "loss_nan_ranks": 0, "loss_rank_avg": 0.2755717635154724, "step": 1010, "valid_targets_mean": 2053.3, "valid_targets_min": 857 }, { "epoch": 1.0661764705882353, "grad_norm": 0.6950043296063686, "learning_rate": 3.967047044557341e-05, "loss": 0.2927, "loss_nan_ranks": 0, "loss_rank_avg": 0.2624019682407379, "step": 1015, "valid_targets_mean": 2560.6, "valid_targets_min": 918 }, { "epoch": 1.0714285714285714, "grad_norm": 0.7326135503168667, "learning_rate": 3.966093261496208e-05, "loss": 0.2827, "loss_nan_ranks": 0, "loss_rank_avg": 0.2939094305038452, "step": 1020, "valid_targets_mean": 2364.4, "valid_targets_min": 780 }, { "epoch": 1.0766806722689075, "grad_norm": 0.7595424312977608, "learning_rate": 3.9651259895665146e-05, "loss": 0.303, "loss_nan_ranks": 0, "loss_rank_avg": 0.32039862871170044, "step": 1025, "valid_targets_mean": 2230.6, "valid_targets_min": 614 }, { "epoch": 1.0819327731092436, "grad_norm": 0.745092373926396, "learning_rate": 3.9641452354044687e-05, "loss": 0.2933, "loss_nan_ranks": 0, "loss_rank_avg": 0.30866172909736633, "step": 1030, "valid_targets_mean": 2336.8, "valid_targets_min": 1140 }, { "epoch": 1.0871848739495797, "grad_norm": 0.7617543273247012, "learning_rate": 3.9631510057387765e-05, "loss": 0.2765, "loss_nan_ranks": 0, "loss_rank_avg": 0.2596009075641632, "step": 1035, "valid_targets_mean": 2062.8, "valid_targets_min": 785 }, { "epoch": 1.092436974789916, "grad_norm": 0.8286121150834354, "learning_rate": 3.962143307390596e-05, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.2832181453704834, "step": 1040, "valid_targets_mean": 2286.1, "valid_targets_min": 1170 }, { "epoch": 1.0976890756302522, "grad_norm": 0.8421971274176083, "learning_rate": 3.961122147273491e-05, "loss": 0.28, "loss_nan_ranks": 0, "loss_rank_avg": 0.31647855043411255, "step": 1045, "valid_targets_mean": 2367.7, "valid_targets_min": 1091 }, { "epoch": 1.1029411764705883, "grad_norm": 0.7098338434234529, "learning_rate": 3.9600875323933826e-05, "loss": 0.2787, "loss_nan_ranks": 0, "loss_rank_avg": 0.30434438586235046, "step": 1050, "valid_targets_mean": 2628.7, "valid_targets_min": 1227 }, { "epoch": 1.1081932773109244, "grad_norm": 0.6866219477953722, "learning_rate": 3.959039469848502e-05, "loss": 0.2878, "loss_nan_ranks": 0, "loss_rank_avg": 0.29877203702926636, "step": 1055, "valid_targets_mean": 2690.5, "valid_targets_min": 666 }, { "epoch": 1.1134453781512605, "grad_norm": 0.6372603497209481, "learning_rate": 3.9579779668293416e-05, "loss": 0.3004, "loss_nan_ranks": 0, "loss_rank_avg": 0.28999483585357666, "step": 1060, "valid_targets_mean": 2948.1, "valid_targets_min": 652 }, { "epoch": 1.1186974789915967, "grad_norm": 0.6799822940846726, "learning_rate": 3.956903030618605e-05, "loss": 0.2797, "loss_nan_ranks": 0, "loss_rank_avg": 0.27467814087867737, "step": 1065, "valid_targets_mean": 2615.4, "valid_targets_min": 777 }, { "epoch": 1.1239495798319328, "grad_norm": 0.7809972116466566, "learning_rate": 3.955814668591156e-05, "loss": 0.2837, "loss_nan_ranks": 0, "loss_rank_avg": 0.27500802278518677, "step": 1070, "valid_targets_mean": 2294.4, "valid_targets_min": 725 }, { "epoch": 1.129201680672269, "grad_norm": 0.7524552269972444, "learning_rate": 3.9547128882139735e-05, "loss": 0.274, "loss_nan_ranks": 0, "loss_rank_avg": 0.2802833616733551, "step": 1075, "valid_targets_mean": 2288.1, "valid_targets_min": 802 }, { "epoch": 1.134453781512605, "grad_norm": 0.6658052832741743, "learning_rate": 3.9535976970460925e-05, "loss": 0.3048, "loss_nan_ranks": 0, "loss_rank_avg": 0.3079906702041626, "step": 1080, "valid_targets_mean": 3495.8, "valid_targets_min": 1241 }, { "epoch": 1.1397058823529411, "grad_norm": 0.7347104088170611, "learning_rate": 3.9524691027385585e-05, "loss": 0.2912, "loss_nan_ranks": 0, "loss_rank_avg": 0.31090694665908813, "step": 1085, "valid_targets_mean": 2511.8, "valid_targets_min": 849 }, { "epoch": 1.1449579831932772, "grad_norm": 0.6724112220847397, "learning_rate": 3.95132711303437e-05, "loss": 0.2997, "loss_nan_ranks": 0, "loss_rank_avg": 0.30762532353401184, "step": 1090, "valid_targets_mean": 2850.2, "valid_targets_min": 922 }, { "epoch": 1.1502100840336134, "grad_norm": 0.8334744080367508, "learning_rate": 3.9501717357684315e-05, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.28743976354599, "step": 1095, "valid_targets_mean": 2099.1, "valid_targets_min": 744 }, { "epoch": 1.1554621848739495, "grad_norm": 0.7032590588711007, "learning_rate": 3.9490029788674934e-05, "loss": 0.2917, "loss_nan_ranks": 0, "loss_rank_avg": 0.2826242446899414, "step": 1100, "valid_targets_mean": 2369.9, "valid_targets_min": 1013 }, { "epoch": 1.1607142857142858, "grad_norm": 1.221702121249645, "learning_rate": 3.9478208503501e-05, "loss": 0.288, "loss_nan_ranks": 0, "loss_rank_avg": 0.2712562680244446, "step": 1105, "valid_targets_mean": 2393.2, "valid_targets_min": 756 }, { "epoch": 1.165966386554622, "grad_norm": 0.7494443041520203, "learning_rate": 3.946625358326538e-05, "loss": 0.266, "loss_nan_ranks": 0, "loss_rank_avg": 0.2519804835319519, "step": 1110, "valid_targets_mean": 1945.5, "valid_targets_min": 637 }, { "epoch": 1.171218487394958, "grad_norm": 0.5997164956764384, "learning_rate": 3.945416510998775e-05, "loss": 0.2959, "loss_nan_ranks": 0, "loss_rank_avg": 0.2693081498146057, "step": 1115, "valid_targets_mean": 3155.6, "valid_targets_min": 738 }, { "epoch": 1.1764705882352942, "grad_norm": 0.6293715830721176, "learning_rate": 3.944194316660406e-05, "loss": 0.2876, "loss_nan_ranks": 0, "loss_rank_avg": 0.2860058546066284, "step": 1120, "valid_targets_mean": 2777.3, "valid_targets_min": 955 }, { "epoch": 1.1817226890756303, "grad_norm": 0.7097668355853033, "learning_rate": 3.942958783696598e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.2959762215614319, "step": 1125, "valid_targets_mean": 2465.1, "valid_targets_min": 670 }, { "epoch": 1.1869747899159664, "grad_norm": 0.6825216992106221, "learning_rate": 3.94170992058403e-05, "loss": 0.2773, "loss_nan_ranks": 0, "loss_rank_avg": 0.27206242084503174, "step": 1130, "valid_targets_mean": 2581.8, "valid_targets_min": 922 }, { "epoch": 1.1922268907563025, "grad_norm": 0.6192081356673204, "learning_rate": 3.9404477358908354e-05, "loss": 0.264, "loss_nan_ranks": 0, "loss_rank_avg": 0.25278788805007935, "step": 1135, "valid_targets_mean": 2664.7, "valid_targets_min": 790 }, { "epoch": 1.1974789915966386, "grad_norm": 0.811292426338912, "learning_rate": 3.9391722382765445e-05, "loss": 0.2948, "loss_nan_ranks": 0, "loss_rank_avg": 0.29716646671295166, "step": 1140, "valid_targets_mean": 1980.2, "valid_targets_min": 914 }, { "epoch": 1.2027310924369747, "grad_norm": 0.7668088242832095, "learning_rate": 3.937883436492025e-05, "loss": 0.2877, "loss_nan_ranks": 0, "loss_rank_avg": 0.27448099851608276, "step": 1145, "valid_targets_mean": 1986.5, "valid_targets_min": 826 }, { "epoch": 1.2079831932773109, "grad_norm": 0.7413211114263699, "learning_rate": 3.9365813393794186e-05, "loss": 0.2983, "loss_nan_ranks": 0, "loss_rank_avg": 0.2899211049079895, "step": 1150, "valid_targets_mean": 2858.4, "valid_targets_min": 826 }, { "epoch": 1.213235294117647, "grad_norm": 0.7546705832538436, "learning_rate": 3.9352659558720836e-05, "loss": 0.2826, "loss_nan_ranks": 0, "loss_rank_avg": 0.2793716490268707, "step": 1155, "valid_targets_mean": 2138.5, "valid_targets_min": 820 }, { "epoch": 1.2184873949579833, "grad_norm": 0.782588277733481, "learning_rate": 3.933937294994535e-05, "loss": 0.2912, "loss_nan_ranks": 0, "loss_rank_avg": 0.2977146804332733, "step": 1160, "valid_targets_mean": 2275.8, "valid_targets_min": 669 }, { "epoch": 1.2237394957983194, "grad_norm": 0.8153448615714938, "learning_rate": 3.932595365862379e-05, "loss": 0.2974, "loss_nan_ranks": 0, "loss_rank_avg": 0.3228553533554077, "step": 1165, "valid_targets_mean": 2634.8, "valid_targets_min": 720 }, { "epoch": 1.2289915966386555, "grad_norm": 0.792990263276749, "learning_rate": 3.9312401776822504e-05, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.26295557618141174, "step": 1170, "valid_targets_mean": 1794.0, "valid_targets_min": 746 }, { "epoch": 1.2342436974789917, "grad_norm": 0.6797271279062665, "learning_rate": 3.9298717397517546e-05, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.27940213680267334, "step": 1175, "valid_targets_mean": 2708.9, "valid_targets_min": 1078 }, { "epoch": 1.2394957983193278, "grad_norm": 0.6849285603022243, "learning_rate": 3.928490061459396e-05, "loss": 0.2776, "loss_nan_ranks": 0, "loss_rank_avg": 0.2747243046760559, "step": 1180, "valid_targets_mean": 2251.1, "valid_targets_min": 888 }, { "epoch": 1.2447478991596639, "grad_norm": 0.7245761997254816, "learning_rate": 3.927095152284521e-05, "loss": 0.2924, "loss_nan_ranks": 0, "loss_rank_avg": 0.3488772511482239, "step": 1185, "valid_targets_mean": 3074.4, "valid_targets_min": 789 }, { "epoch": 1.25, "grad_norm": 0.7010066220238207, "learning_rate": 3.925687021797249e-05, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.29797542095184326, "step": 1190, "valid_targets_mean": 2721.6, "valid_targets_min": 867 }, { "epoch": 1.2552521008403361, "grad_norm": 1.0179359955088225, "learning_rate": 3.924265679658407e-05, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.27947139739990234, "step": 1195, "valid_targets_mean": 1642.1, "valid_targets_min": 722 }, { "epoch": 1.2605042016806722, "grad_norm": 0.7149247912396931, "learning_rate": 3.922831135619462e-05, "loss": 0.2831, "loss_nan_ranks": 0, "loss_rank_avg": 0.2821911573410034, "step": 1200, "valid_targets_mean": 2422.2, "valid_targets_min": 761 }, { "epoch": 1.2657563025210083, "grad_norm": 0.7243464387956448, "learning_rate": 3.9213833995224605e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.2676169276237488, "step": 1205, "valid_targets_mean": 2188.3, "valid_targets_min": 699 }, { "epoch": 1.2710084033613445, "grad_norm": 0.7370679575877426, "learning_rate": 3.919922481299952e-05, "loss": 0.3017, "loss_nan_ranks": 0, "loss_rank_avg": 0.32717978954315186, "step": 1210, "valid_targets_mean": 2311.9, "valid_targets_min": 713 }, { "epoch": 1.2762605042016806, "grad_norm": 0.6894289625236196, "learning_rate": 3.918448390974928e-05, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.26075074076652527, "step": 1215, "valid_targets_mean": 2090.9, "valid_targets_min": 615 }, { "epoch": 1.2815126050420167, "grad_norm": 0.8026290889025559, "learning_rate": 3.9169611386607476e-05, "loss": 0.2928, "loss_nan_ranks": 0, "loss_rank_avg": 0.30541282892227173, "step": 1220, "valid_targets_mean": 2121.8, "valid_targets_min": 722 }, { "epoch": 1.2867647058823528, "grad_norm": 0.7771870350210088, "learning_rate": 3.9154607345610746e-05, "loss": 0.273, "loss_nan_ranks": 0, "loss_rank_avg": 0.2856689691543579, "step": 1225, "valid_targets_mean": 2416.0, "valid_targets_min": 1196 }, { "epoch": 1.2920168067226891, "grad_norm": 0.673563167861582, "learning_rate": 3.913947188969801e-05, "loss": 0.3009, "loss_nan_ranks": 0, "loss_rank_avg": 0.2647175192832947, "step": 1230, "valid_targets_mean": 2471.2, "valid_targets_min": 849 }, { "epoch": 1.2972689075630253, "grad_norm": 0.6531080612213936, "learning_rate": 3.912420512270981e-05, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.22836507856845856, "step": 1235, "valid_targets_mean": 2253.1, "valid_targets_min": 922 }, { "epoch": 1.3025210084033614, "grad_norm": 0.7035585449641938, "learning_rate": 3.910880714938757e-05, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.3099633455276489, "step": 1240, "valid_targets_mean": 2499.9, "valid_targets_min": 841 }, { "epoch": 1.3077731092436975, "grad_norm": 0.5567277712502462, "learning_rate": 3.909327807537288e-05, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.28143376111984253, "step": 1245, "valid_targets_mean": 3603.4, "valid_targets_min": 1081 }, { "epoch": 1.3130252100840336, "grad_norm": 0.7110770433202822, "learning_rate": 3.90776180072068e-05, "loss": 0.2744, "loss_nan_ranks": 0, "loss_rank_avg": 0.2797868251800537, "step": 1250, "valid_targets_mean": 2393.1, "valid_targets_min": 804 }, { "epoch": 1.3182773109243697, "grad_norm": 0.5586358952592809, "learning_rate": 3.906182705232909e-05, "loss": 0.2778, "loss_nan_ranks": 0, "loss_rank_avg": 0.2782168388366699, "step": 1255, "valid_targets_mean": 4218.8, "valid_targets_min": 891 }, { "epoch": 1.3235294117647058, "grad_norm": 0.7634189610982803, "learning_rate": 3.904590531907751e-05, "loss": 0.286, "loss_nan_ranks": 0, "loss_rank_avg": 0.30689549446105957, "step": 1260, "valid_targets_mean": 2308.6, "valid_targets_min": 881 }, { "epoch": 1.328781512605042, "grad_norm": 0.660398552740273, "learning_rate": 3.9029852916687034e-05, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.29954206943511963, "step": 1265, "valid_targets_mean": 2645.9, "valid_targets_min": 777 }, { "epoch": 1.334033613445378, "grad_norm": 0.674497976039509, "learning_rate": 3.9013669955289136e-05, "loss": 0.2945, "loss_nan_ranks": 0, "loss_rank_avg": 0.2616213858127594, "step": 1270, "valid_targets_mean": 2590.4, "valid_targets_min": 578 }, { "epoch": 1.3392857142857144, "grad_norm": 0.6745461538720665, "learning_rate": 3.899735654591101e-05, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.2934377193450928, "step": 1275, "valid_targets_mean": 2654.6, "valid_targets_min": 788 }, { "epoch": 1.3445378151260505, "grad_norm": 0.6298474437654481, "learning_rate": 3.898091280047486e-05, "loss": 0.2907, "loss_nan_ranks": 0, "loss_rank_avg": 0.26556211709976196, "step": 1280, "valid_targets_mean": 3061.3, "valid_targets_min": 905 }, { "epoch": 1.3497899159663866, "grad_norm": 0.6789724693265738, "learning_rate": 3.896433883179703e-05, "loss": 0.2797, "loss_nan_ranks": 0, "loss_rank_avg": 0.24146893620491028, "step": 1285, "valid_targets_mean": 2094.8, "valid_targets_min": 1109 }, { "epoch": 1.3550420168067228, "grad_norm": 0.7300952923000248, "learning_rate": 3.894763475358736e-05, "loss": 0.2687, "loss_nan_ranks": 0, "loss_rank_avg": 0.2770267724990845, "step": 1290, "valid_targets_mean": 2336.6, "valid_targets_min": 706 }, { "epoch": 1.3602941176470589, "grad_norm": 0.8086297463249519, "learning_rate": 3.8930800680448275e-05, "loss": 0.2713, "loss_nan_ranks": 0, "loss_rank_avg": 0.26473838090896606, "step": 1295, "valid_targets_mean": 1924.0, "valid_targets_min": 1099 }, { "epoch": 1.365546218487395, "grad_norm": 0.6977529571217691, "learning_rate": 3.891383672787411e-05, "loss": 0.2761, "loss_nan_ranks": 0, "loss_rank_avg": 0.2646206021308899, "step": 1300, "valid_targets_mean": 2431.1, "valid_targets_min": 818 }, { "epoch": 1.370798319327731, "grad_norm": 0.7033155019588632, "learning_rate": 3.889674301225025e-05, "loss": 0.2746, "loss_nan_ranks": 0, "loss_rank_avg": 0.27550557255744934, "step": 1305, "valid_targets_mean": 2446.4, "valid_targets_min": 776 }, { "epoch": 1.3760504201680672, "grad_norm": 0.7011256224002429, "learning_rate": 3.8879519650852356e-05, "loss": 0.2798, "loss_nan_ranks": 0, "loss_rank_avg": 0.29224735498428345, "step": 1310, "valid_targets_mean": 2337.5, "valid_targets_min": 724 }, { "epoch": 1.3813025210084033, "grad_norm": 0.7551918929706497, "learning_rate": 3.886216676184555e-05, "loss": 0.2786, "loss_nan_ranks": 0, "loss_rank_avg": 0.25635597109794617, "step": 1315, "valid_targets_mean": 1767.4, "valid_targets_min": 903 }, { "epoch": 1.3865546218487395, "grad_norm": 0.841773127497859, "learning_rate": 3.8844684464283614e-05, "loss": 0.2729, "loss_nan_ranks": 0, "loss_rank_avg": 0.28463175892829895, "step": 1320, "valid_targets_mean": 2054.4, "valid_targets_min": 1058 }, { "epoch": 1.3918067226890756, "grad_norm": 0.714138459758691, "learning_rate": 3.882707287810817e-05, "loss": 0.2829, "loss_nan_ranks": 0, "loss_rank_avg": 0.3063795566558838, "step": 1325, "valid_targets_mean": 2356.1, "valid_targets_min": 980 }, { "epoch": 1.3970588235294117, "grad_norm": 0.7951782867715268, "learning_rate": 3.880933212414786e-05, "loss": 0.2791, "loss_nan_ranks": 0, "loss_rank_avg": 0.31758105754852295, "step": 1330, "valid_targets_mean": 2118.9, "valid_targets_min": 685 }, { "epoch": 1.4023109243697478, "grad_norm": 0.6803907534201502, "learning_rate": 3.87914623241175e-05, "loss": 0.2774, "loss_nan_ranks": 0, "loss_rank_avg": 0.2610444724559784, "step": 1335, "valid_targets_mean": 2595.9, "valid_targets_min": 636 }, { "epoch": 1.407563025210084, "grad_norm": 0.7146731724902138, "learning_rate": 3.877346360061728e-05, "loss": 0.2903, "loss_nan_ranks": 0, "loss_rank_avg": 0.2991168200969696, "step": 1340, "valid_targets_mean": 2701.4, "valid_targets_min": 931 }, { "epoch": 1.41281512605042, "grad_norm": 0.7591356155611764, "learning_rate": 3.8755336077131894e-05, "loss": 0.2835, "loss_nan_ranks": 0, "loss_rank_avg": 0.2531967759132385, "step": 1345, "valid_targets_mean": 1822.8, "valid_targets_min": 673 }, { "epoch": 1.4180672268907564, "grad_norm": 0.6930387851247973, "learning_rate": 3.873707987802967e-05, "loss": 0.2775, "loss_nan_ranks": 0, "loss_rank_avg": 0.2844356298446655, "step": 1350, "valid_targets_mean": 2694.1, "valid_targets_min": 657 }, { "epoch": 1.4233193277310925, "grad_norm": 0.6030534452348743, "learning_rate": 3.871869512856179e-05, "loss": 0.2738, "loss_nan_ranks": 0, "loss_rank_avg": 0.2641228139400482, "step": 1355, "valid_targets_mean": 3138.3, "valid_targets_min": 916 }, { "epoch": 1.4285714285714286, "grad_norm": 0.5730393066215059, "learning_rate": 3.870018195486138e-05, "loss": 0.2695, "loss_nan_ranks": 0, "loss_rank_avg": 0.24910803139209747, "step": 1360, "valid_targets_mean": 3588.1, "valid_targets_min": 1099 }, { "epoch": 1.4338235294117647, "grad_norm": 0.7755395352301468, "learning_rate": 3.868154048394262e-05, "loss": 0.276, "loss_nan_ranks": 0, "loss_rank_avg": 0.2994786202907562, "step": 1365, "valid_targets_mean": 2700.9, "valid_targets_min": 1110 }, { "epoch": 1.4390756302521008, "grad_norm": 0.7005171055078728, "learning_rate": 3.8662770843699944e-05, "loss": 0.2938, "loss_nan_ranks": 0, "loss_rank_avg": 0.3116563558578491, "step": 1370, "valid_targets_mean": 2591.6, "valid_targets_min": 591 }, { "epoch": 1.444327731092437, "grad_norm": 0.7295296113213054, "learning_rate": 3.8643873162907086e-05, "loss": 0.2858, "loss_nan_ranks": 0, "loss_rank_avg": 0.2686575651168823, "step": 1375, "valid_targets_mean": 2169.4, "valid_targets_min": 690 }, { "epoch": 1.449579831932773, "grad_norm": 0.728303365746196, "learning_rate": 3.862484757121627e-05, "loss": 0.3071, "loss_nan_ranks": 0, "loss_rank_avg": 0.343506395816803, "step": 1380, "valid_targets_mean": 2436.4, "valid_targets_min": 859 }, { "epoch": 1.4548319327731092, "grad_norm": 0.7264219557451437, "learning_rate": 3.860569419915727e-05, "loss": 0.2952, "loss_nan_ranks": 0, "loss_rank_avg": 0.27744126319885254, "step": 1385, "valid_targets_mean": 2069.1, "valid_targets_min": 682 }, { "epoch": 1.4600840336134453, "grad_norm": 0.7451210015033147, "learning_rate": 3.858641317813653e-05, "loss": 0.2592, "loss_nan_ranks": 0, "loss_rank_avg": 0.264180064201355, "step": 1390, "valid_targets_mean": 2131.1, "valid_targets_min": 530 }, { "epoch": 1.4653361344537816, "grad_norm": 0.7180216886659947, "learning_rate": 3.8567004640436234e-05, "loss": 0.2864, "loss_nan_ranks": 0, "loss_rank_avg": 0.28325045108795166, "step": 1395, "valid_targets_mean": 2150.3, "valid_targets_min": 1239 }, { "epoch": 1.4705882352941178, "grad_norm": 0.6005140811506897, "learning_rate": 3.8547468719213476e-05, "loss": 0.291, "loss_nan_ranks": 0, "loss_rank_avg": 0.2805612087249756, "step": 1400, "valid_targets_mean": 2986.0, "valid_targets_min": 549 }, { "epoch": 1.4758403361344539, "grad_norm": 0.6701734829120335, "learning_rate": 3.852780554849925e-05, "loss": 0.2713, "loss_nan_ranks": 0, "loss_rank_avg": 0.2722683250904083, "step": 1405, "valid_targets_mean": 2545.0, "valid_targets_min": 957 }, { "epoch": 1.48109243697479, "grad_norm": 0.7156588483612103, "learning_rate": 3.850801526319761e-05, "loss": 0.2917, "loss_nan_ranks": 0, "loss_rank_avg": 0.3095453381538391, "step": 1410, "valid_targets_mean": 2583.2, "valid_targets_min": 739 }, { "epoch": 1.486344537815126, "grad_norm": 0.6515593357765462, "learning_rate": 3.84880979990847e-05, "loss": 0.278, "loss_nan_ranks": 0, "loss_rank_avg": 0.2939472198486328, "step": 1415, "valid_targets_mean": 2874.5, "valid_targets_min": 1405 }, { "epoch": 1.4915966386554622, "grad_norm": 0.6808237094478136, "learning_rate": 3.846805389280782e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.29528388381004333, "step": 1420, "valid_targets_mean": 2692.4, "valid_targets_min": 704 }, { "epoch": 1.4968487394957983, "grad_norm": 0.6429218218943833, "learning_rate": 3.844788308188452e-05, "loss": 0.2749, "loss_nan_ranks": 0, "loss_rank_avg": 0.24127134680747986, "step": 1425, "valid_targets_mean": 2371.2, "valid_targets_min": 765 }, { "epoch": 1.5021008403361344, "grad_norm": 0.7293161414772861, "learning_rate": 3.8427585704701634e-05, "loss": 0.289, "loss_nan_ranks": 0, "loss_rank_avg": 0.32644128799438477, "step": 1430, "valid_targets_mean": 2395.9, "valid_targets_min": 885 }, { "epoch": 1.5073529411764706, "grad_norm": 0.6776284586447868, "learning_rate": 3.840716190051433e-05, "loss": 0.2978, "loss_nan_ranks": 0, "loss_rank_avg": 0.2834451198577881, "step": 1435, "valid_targets_mean": 2865.2, "valid_targets_min": 726 }, { "epoch": 1.5126050420168067, "grad_norm": 0.7065935410256674, "learning_rate": 3.8386611809445155e-05, "loss": 0.2874, "loss_nan_ranks": 0, "loss_rank_avg": 0.2767036557197571, "step": 1440, "valid_targets_mean": 2116.9, "valid_targets_min": 1347 }, { "epoch": 1.5178571428571428, "grad_norm": 0.6875344935274045, "learning_rate": 3.8365935572483095e-05, "loss": 0.2797, "loss_nan_ranks": 0, "loss_rank_avg": 0.25539255142211914, "step": 1445, "valid_targets_mean": 2034.7, "valid_targets_min": 807 }, { "epoch": 1.523109243697479, "grad_norm": 0.6114420882513082, "learning_rate": 3.834513333148258e-05, "loss": 0.2925, "loss_nan_ranks": 0, "loss_rank_avg": 0.3040091097354889, "step": 1450, "valid_targets_mean": 3394.8, "valid_targets_min": 835 }, { "epoch": 1.528361344537815, "grad_norm": 0.7351299306831928, "learning_rate": 3.832420522916252e-05, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.29218441247940063, "step": 1455, "valid_targets_mean": 2289.6, "valid_targets_min": 659 }, { "epoch": 1.5336134453781511, "grad_norm": 0.6742529951804918, "learning_rate": 3.830315140910534e-05, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.27924418449401855, "step": 1460, "valid_targets_mean": 2554.1, "valid_targets_min": 728 }, { "epoch": 1.5388655462184873, "grad_norm": 0.642103371520459, "learning_rate": 3.8281972015755965e-05, "loss": 0.2912, "loss_nan_ranks": 0, "loss_rank_avg": 0.28389638662338257, "step": 1465, "valid_targets_mean": 2878.4, "valid_targets_min": 768 }, { "epoch": 1.5441176470588234, "grad_norm": 0.6652065712153472, "learning_rate": 3.826066719442086e-05, "loss": 0.3033, "loss_nan_ranks": 0, "loss_rank_avg": 0.28304386138916016, "step": 1470, "valid_targets_mean": 3034.9, "valid_targets_min": 1390 }, { "epoch": 1.5493697478991597, "grad_norm": 0.6732297614547262, "learning_rate": 3.823923709126701e-05, "loss": 0.2739, "loss_nan_ranks": 0, "loss_rank_avg": 0.27302515506744385, "step": 1475, "valid_targets_mean": 2630.1, "valid_targets_min": 661 }, { "epoch": 1.5546218487394958, "grad_norm": 0.7977790582505264, "learning_rate": 3.821768185332095e-05, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.23856990039348602, "step": 1480, "valid_targets_mean": 1874.7, "valid_targets_min": 895 }, { "epoch": 1.559873949579832, "grad_norm": 0.6416684613994287, "learning_rate": 3.81960016284677e-05, "loss": 0.2789, "loss_nan_ranks": 0, "loss_rank_avg": 0.2834779918193817, "step": 1485, "valid_targets_mean": 2730.8, "valid_targets_min": 742 }, { "epoch": 1.565126050420168, "grad_norm": 0.7215663679705727, "learning_rate": 3.817419656544979e-05, "loss": 0.2713, "loss_nan_ranks": 0, "loss_rank_avg": 0.28470200300216675, "step": 1490, "valid_targets_mean": 2297.9, "valid_targets_min": 741 }, { "epoch": 1.5703781512605042, "grad_norm": 0.7210848118654766, "learning_rate": 3.815226681386626e-05, "loss": 0.3029, "loss_nan_ranks": 0, "loss_rank_avg": 0.30118465423583984, "step": 1495, "valid_targets_mean": 2422.6, "valid_targets_min": 672 }, { "epoch": 1.5756302521008403, "grad_norm": 0.7318400772244765, "learning_rate": 3.8130212524171576e-05, "loss": 0.2871, "loss_nan_ranks": 0, "loss_rank_avg": 0.3544023036956787, "step": 1500, "valid_targets_mean": 2730.2, "valid_targets_min": 662 }, { "epoch": 1.5808823529411766, "grad_norm": 0.764194530000509, "learning_rate": 3.810803384767465e-05, "loss": 0.2668, "loss_nan_ranks": 0, "loss_rank_avg": 0.22156544029712677, "step": 1505, "valid_targets_mean": 1869.6, "valid_targets_min": 629 }, { "epoch": 1.5861344537815127, "grad_norm": 0.7198936509540297, "learning_rate": 3.808573093653777e-05, "loss": 0.2803, "loss_nan_ranks": 0, "loss_rank_avg": 0.29135745763778687, "step": 1510, "valid_targets_mean": 2092.8, "valid_targets_min": 756 }, { "epoch": 1.5913865546218489, "grad_norm": 0.664810251317532, "learning_rate": 3.806330394377556e-05, "loss": 0.2671, "loss_nan_ranks": 0, "loss_rank_avg": 0.2656877934932709, "step": 1515, "valid_targets_mean": 2300.4, "valid_targets_min": 684 }, { "epoch": 1.596638655462185, "grad_norm": 0.7873381808170635, "learning_rate": 3.8040753023253956e-05, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.2537113130092621, "step": 1520, "valid_targets_mean": 2188.1, "valid_targets_min": 776 }, { "epoch": 1.601890756302521, "grad_norm": 0.8013762972275075, "learning_rate": 3.801807832968912e-05, "loss": 0.2911, "loss_nan_ranks": 0, "loss_rank_avg": 0.28357455134391785, "step": 1525, "valid_targets_mean": 1841.9, "valid_targets_min": 765 }, { "epoch": 1.6071428571428572, "grad_norm": 0.6363572479336133, "learning_rate": 3.799528001864637e-05, "loss": 0.2632, "loss_nan_ranks": 0, "loss_rank_avg": 0.28672128915786743, "step": 1530, "valid_targets_mean": 2678.1, "valid_targets_min": 804 }, { "epoch": 1.6123949579831933, "grad_norm": 0.626675259486661, "learning_rate": 3.797235824653918e-05, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.2521238327026367, "step": 1535, "valid_targets_mean": 2923.1, "valid_targets_min": 727 }, { "epoch": 1.6176470588235294, "grad_norm": 0.7719429167065398, "learning_rate": 3.7949313170628006e-05, "loss": 0.2855, "loss_nan_ranks": 0, "loss_rank_avg": 0.26524102687835693, "step": 1540, "valid_targets_mean": 2188.1, "valid_targets_min": 889 }, { "epoch": 1.6228991596638656, "grad_norm": 0.6140414130735539, "learning_rate": 3.79261449490193e-05, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.28398892283439636, "step": 1545, "valid_targets_mean": 2975.3, "valid_targets_min": 870 }, { "epoch": 1.6281512605042017, "grad_norm": 0.6333512043620656, "learning_rate": 3.7902853740664356e-05, "loss": 0.2777, "loss_nan_ranks": 0, "loss_rank_avg": 0.25651031732559204, "step": 1550, "valid_targets_mean": 2676.1, "valid_targets_min": 885 }, { "epoch": 1.6334033613445378, "grad_norm": 0.7945225853691145, "learning_rate": 3.7879439705358286e-05, "loss": 0.2886, "loss_nan_ranks": 0, "loss_rank_avg": 0.28769397735595703, "step": 1555, "valid_targets_mean": 2333.7, "valid_targets_min": 1012 }, { "epoch": 1.638655462184874, "grad_norm": 0.6613578680004154, "learning_rate": 3.785590300373884e-05, "loss": 0.2963, "loss_nan_ranks": 0, "loss_rank_avg": 0.2788962423801422, "step": 1560, "valid_targets_mean": 2716.4, "valid_targets_min": 1120 }, { "epoch": 1.64390756302521, "grad_norm": 0.6200210594873011, "learning_rate": 3.7832243797285385e-05, "loss": 0.2742, "loss_nan_ranks": 0, "loss_rank_avg": 0.30993425846099854, "step": 1565, "valid_targets_mean": 3246.9, "valid_targets_min": 704 }, { "epoch": 1.6491596638655461, "grad_norm": 0.6841959383278441, "learning_rate": 3.780846224831775e-05, "loss": 0.2795, "loss_nan_ranks": 0, "loss_rank_avg": 0.29545074701309204, "step": 1570, "valid_targets_mean": 2656.0, "valid_targets_min": 1143 }, { "epoch": 1.6544117647058822, "grad_norm": 0.646661736839655, "learning_rate": 3.7784558519995135e-05, "loss": 0.2807, "loss_nan_ranks": 0, "loss_rank_avg": 0.2950468063354492, "step": 1575, "valid_targets_mean": 2778.9, "valid_targets_min": 830 }, { "epoch": 1.6596638655462184, "grad_norm": 0.5963871526060771, "learning_rate": 3.776053277631496e-05, "loss": 0.2784, "loss_nan_ranks": 0, "loss_rank_avg": 0.27574625611305237, "step": 1580, "valid_targets_mean": 2941.4, "valid_targets_min": 812 }, { "epoch": 1.6649159663865545, "grad_norm": 0.6789032459708729, "learning_rate": 3.7736385182111785e-05, "loss": 0.2766, "loss_nan_ranks": 0, "loss_rank_avg": 0.28872212767601013, "step": 1585, "valid_targets_mean": 2428.8, "valid_targets_min": 1240 }, { "epoch": 1.6701680672268906, "grad_norm": 0.8766320854428324, "learning_rate": 3.771211590305614e-05, "loss": 0.2937, "loss_nan_ranks": 0, "loss_rank_avg": 0.27332085371017456, "step": 1590, "valid_targets_mean": 2621.5, "valid_targets_min": 1095 }, { "epoch": 1.675420168067227, "grad_norm": 0.6841578200409935, "learning_rate": 3.768772510565342e-05, "loss": 0.2698, "loss_nan_ranks": 0, "loss_rank_avg": 0.2623317241668701, "step": 1595, "valid_targets_mean": 2145.7, "valid_targets_min": 788 }, { "epoch": 1.680672268907563, "grad_norm": 0.7486173630607642, "learning_rate": 3.76632129572427e-05, "loss": 0.2732, "loss_nan_ranks": 0, "loss_rank_avg": 0.306223064661026, "step": 1600, "valid_targets_mean": 2413.9, "valid_targets_min": 822 }, { "epoch": 1.6859243697478992, "grad_norm": 0.6168280825117122, "learning_rate": 3.763857962599565e-05, "loss": 0.2747, "loss_nan_ranks": 0, "loss_rank_avg": 0.26991304755210876, "step": 1605, "valid_targets_mean": 2552.2, "valid_targets_min": 1097 }, { "epoch": 1.6911764705882353, "grad_norm": 0.6766304351456689, "learning_rate": 3.761382528091531e-05, "loss": 0.2759, "loss_nan_ranks": 0, "loss_rank_avg": 0.28340253233909607, "step": 1610, "valid_targets_mean": 2665.7, "valid_targets_min": 1184 }, { "epoch": 1.6964285714285714, "grad_norm": 0.7062299801799153, "learning_rate": 3.7588950091834986e-05, "loss": 0.2863, "loss_nan_ranks": 0, "loss_rank_avg": 0.27810871601104736, "step": 1615, "valid_targets_mean": 2484.9, "valid_targets_min": 720 }, { "epoch": 1.7016806722689075, "grad_norm": 0.6152392266872755, "learning_rate": 3.756395422941706e-05, "loss": 0.2823, "loss_nan_ranks": 0, "loss_rank_avg": 0.3008061647415161, "step": 1620, "valid_targets_mean": 3126.2, "valid_targets_min": 892 }, { "epoch": 1.7069327731092439, "grad_norm": 0.5905779852643404, "learning_rate": 3.753883786515181e-05, "loss": 0.2714, "loss_nan_ranks": 0, "loss_rank_avg": 0.26379841566085815, "step": 1625, "valid_targets_mean": 3115.7, "valid_targets_min": 916 }, { "epoch": 1.71218487394958, "grad_norm": 0.7318199425494478, "learning_rate": 3.751360117135628e-05, "loss": 0.2544, "loss_nan_ranks": 0, "loss_rank_avg": 0.2550744414329529, "step": 1630, "valid_targets_mean": 2223.6, "valid_targets_min": 679 }, { "epoch": 1.717436974789916, "grad_norm": 0.663349889323202, "learning_rate": 3.7488244321173025e-05, "loss": 0.2836, "loss_nan_ranks": 0, "loss_rank_avg": 0.2922671437263489, "step": 1635, "valid_targets_mean": 2466.1, "valid_targets_min": 694 }, { "epoch": 1.7226890756302522, "grad_norm": 0.7439072694880867, "learning_rate": 3.746276748856898e-05, "loss": 0.2728, "loss_nan_ranks": 0, "loss_rank_avg": 0.2746467590332031, "step": 1640, "valid_targets_mean": 2209.7, "valid_targets_min": 968 }, { "epoch": 1.7279411764705883, "grad_norm": 0.7242128901414696, "learning_rate": 3.743717084833425e-05, "loss": 0.2713, "loss_nan_ranks": 0, "loss_rank_avg": 0.2738949656486511, "step": 1645, "valid_targets_mean": 2048.8, "valid_targets_min": 703 }, { "epoch": 1.7331932773109244, "grad_norm": 0.5975483868192742, "learning_rate": 3.741145457608093e-05, "loss": 0.2834, "loss_nan_ranks": 0, "loss_rank_avg": 0.2882964611053467, "step": 1650, "valid_targets_mean": 3101.3, "valid_targets_min": 768 }, { "epoch": 1.7384453781512605, "grad_norm": 0.7199800936223271, "learning_rate": 3.738561884824183e-05, "loss": 0.2895, "loss_nan_ranks": 0, "loss_rank_avg": 0.31954213976860046, "step": 1655, "valid_targets_mean": 2576.0, "valid_targets_min": 1213 }, { "epoch": 1.7436974789915967, "grad_norm": 0.643400369166649, "learning_rate": 3.735966384206936e-05, "loss": 0.2691, "loss_nan_ranks": 0, "loss_rank_avg": 0.2960051894187927, "step": 1660, "valid_targets_mean": 3030.7, "valid_targets_min": 824 }, { "epoch": 1.7489495798319328, "grad_norm": 0.5952106042261482, "learning_rate": 3.733358973563425e-05, "loss": 0.2851, "loss_nan_ranks": 0, "loss_rank_avg": 0.29441675543785095, "step": 1665, "valid_targets_mean": 3160.8, "valid_targets_min": 1137 }, { "epoch": 1.754201680672269, "grad_norm": 0.6786980642043301, "learning_rate": 3.730739670782435e-05, "loss": 0.2809, "loss_nan_ranks": 0, "loss_rank_avg": 0.2848990559577942, "step": 1670, "valid_targets_mean": 2464.0, "valid_targets_min": 900 }, { "epoch": 1.759453781512605, "grad_norm": 0.6509095658222819, "learning_rate": 3.72810849383434e-05, "loss": 0.2678, "loss_nan_ranks": 0, "loss_rank_avg": 0.26271501183509827, "step": 1675, "valid_targets_mean": 2341.4, "valid_targets_min": 537 }, { "epoch": 1.7647058823529411, "grad_norm": 0.7898671503621937, "learning_rate": 3.725465460770978e-05, "loss": 0.3089, "loss_nan_ranks": 0, "loss_rank_avg": 0.3113194704055786, "step": 1680, "valid_targets_mean": 2466.2, "valid_targets_min": 846 }, { "epoch": 1.7699579831932772, "grad_norm": 0.6739070075903468, "learning_rate": 3.7228105897255324e-05, "loss": 0.2811, "loss_nan_ranks": 0, "loss_rank_avg": 0.2531262934207916, "step": 1685, "valid_targets_mean": 2049.8, "valid_targets_min": 732 }, { "epoch": 1.7752100840336134, "grad_norm": 0.6710697879150522, "learning_rate": 3.7201438989124e-05, "loss": 0.2761, "loss_nan_ranks": 0, "loss_rank_avg": 0.28480058908462524, "step": 1690, "valid_targets_mean": 2619.4, "valid_targets_min": 1076 }, { "epoch": 1.7804621848739495, "grad_norm": 0.662695525206772, "learning_rate": 3.717465406627074e-05, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.2571936547756195, "step": 1695, "valid_targets_mean": 2399.6, "valid_targets_min": 924 }, { "epoch": 1.7857142857142856, "grad_norm": 0.6320359884584241, "learning_rate": 3.714775131246011e-05, "loss": 0.2818, "loss_nan_ranks": 0, "loss_rank_avg": 0.2644287347793579, "step": 1700, "valid_targets_mean": 2833.1, "valid_targets_min": 1022 }, { "epoch": 1.7909663865546217, "grad_norm": 0.5608837993978538, "learning_rate": 3.71207309122651e-05, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.25060662627220154, "step": 1705, "valid_targets_mean": 3011.6, "valid_targets_min": 830 }, { "epoch": 1.7962184873949578, "grad_norm": 0.7749333627981896, "learning_rate": 3.709359305106585e-05, "loss": 0.2835, "loss_nan_ranks": 0, "loss_rank_avg": 0.3079194128513336, "step": 1710, "valid_targets_mean": 2177.3, "valid_targets_min": 622 }, { "epoch": 1.8014705882352942, "grad_norm": 0.6704960756054471, "learning_rate": 3.7066337915048354e-05, "loss": 0.2633, "loss_nan_ranks": 0, "loss_rank_avg": 0.24317601323127747, "step": 1715, "valid_targets_mean": 2278.3, "valid_targets_min": 777 }, { "epoch": 1.8067226890756303, "grad_norm": 0.726852310035077, "learning_rate": 3.7038965691203205e-05, "loss": 0.2867, "loss_nan_ranks": 0, "loss_rank_avg": 0.2838640809059143, "step": 1720, "valid_targets_mean": 2385.5, "valid_targets_min": 750 }, { "epoch": 1.8119747899159664, "grad_norm": 0.7307615924485396, "learning_rate": 3.701147656732431e-05, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.2594029903411865, "step": 1725, "valid_targets_mean": 2254.4, "valid_targets_min": 823 }, { "epoch": 1.8172268907563025, "grad_norm": 0.6804119390418033, "learning_rate": 3.6983870732007596e-05, "loss": 0.2897, "loss_nan_ranks": 0, "loss_rank_avg": 0.30185481905937195, "step": 1730, "valid_targets_mean": 2529.1, "valid_targets_min": 861 }, { "epoch": 1.8224789915966386, "grad_norm": 0.5971578197210542, "learning_rate": 3.695614837464972e-05, "loss": 0.2799, "loss_nan_ranks": 0, "loss_rank_avg": 0.2714010179042816, "step": 1735, "valid_targets_mean": 2919.9, "valid_targets_min": 934 }, { "epoch": 1.8277310924369747, "grad_norm": 0.7432330036153248, "learning_rate": 3.692830968544675e-05, "loss": 0.2905, "loss_nan_ranks": 0, "loss_rank_avg": 0.2643352150917053, "step": 1740, "valid_targets_mean": 2157.0, "valid_targets_min": 913 }, { "epoch": 1.832983193277311, "grad_norm": 0.9451021623758795, "learning_rate": 3.690035485539291e-05, "loss": 0.2848, "loss_nan_ranks": 0, "loss_rank_avg": 0.2754422128200531, "step": 1745, "valid_targets_mean": 2272.9, "valid_targets_min": 748 }, { "epoch": 1.8382352941176472, "grad_norm": 0.6448983937098554, "learning_rate": 3.6872284076279205e-05, "loss": 0.2735, "loss_nan_ranks": 0, "loss_rank_avg": 0.27130642533302307, "step": 1750, "valid_targets_mean": 2665.2, "valid_targets_min": 713 }, { "epoch": 1.8434873949579833, "grad_norm": 0.6568847222392369, "learning_rate": 3.684409754069215e-05, "loss": 0.2887, "loss_nan_ranks": 0, "loss_rank_avg": 0.28479936718940735, "step": 1755, "valid_targets_mean": 2863.5, "valid_targets_min": 687 }, { "epoch": 1.8487394957983194, "grad_norm": 0.9463446748898482, "learning_rate": 3.681579544201244e-05, "loss": 0.265, "loss_nan_ranks": 0, "loss_rank_avg": 0.267799973487854, "step": 1760, "valid_targets_mean": 2591.4, "valid_targets_min": 891 }, { "epoch": 1.8539915966386555, "grad_norm": 0.6626299146737941, "learning_rate": 3.6787377974413614e-05, "loss": 0.275, "loss_nan_ranks": 0, "loss_rank_avg": 0.26858189702033997, "step": 1765, "valid_targets_mean": 2298.1, "valid_targets_min": 783 }, { "epoch": 1.8592436974789917, "grad_norm": 0.5511447233080423, "learning_rate": 3.6758845332860734e-05, "loss": 0.2641, "loss_nan_ranks": 0, "loss_rank_avg": 0.25503212213516235, "step": 1770, "valid_targets_mean": 3300.6, "valid_targets_min": 812 }, { "epoch": 1.8644957983193278, "grad_norm": 0.6864216219048197, "learning_rate": 3.673019771310903e-05, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.29600006341934204, "step": 1775, "valid_targets_mean": 2480.2, "valid_targets_min": 607 }, { "epoch": 1.8697478991596639, "grad_norm": 0.6727603790480745, "learning_rate": 3.670143531170258e-05, "loss": 0.2847, "loss_nan_ranks": 0, "loss_rank_avg": 0.2595556974411011, "step": 1780, "valid_targets_mean": 2553.4, "valid_targets_min": 733 }, { "epoch": 1.875, "grad_norm": 0.6449743095704825, "learning_rate": 3.667255832597294e-05, "loss": 0.2719, "loss_nan_ranks": 0, "loss_rank_avg": 0.287334680557251, "step": 1785, "valid_targets_mean": 2550.0, "valid_targets_min": 674 }, { "epoch": 1.8802521008403361, "grad_norm": 0.7356297744717748, "learning_rate": 3.664356695403781e-05, "loss": 0.2709, "loss_nan_ranks": 0, "loss_rank_avg": 0.2541128993034363, "step": 1790, "valid_targets_mean": 1760.9, "valid_targets_min": 800 }, { "epoch": 1.8855042016806722, "grad_norm": 0.6441525341607449, "learning_rate": 3.661446139479965e-05, "loss": 0.2722, "loss_nan_ranks": 0, "loss_rank_avg": 0.2607778310775757, "step": 1795, "valid_targets_mean": 2639.6, "valid_targets_min": 748 }, { "epoch": 1.8907563025210083, "grad_norm": 0.6764765078850176, "learning_rate": 3.658524184794436e-05, "loss": 0.2808, "loss_nan_ranks": 0, "loss_rank_avg": 0.2690533399581909, "step": 1800, "valid_targets_mean": 2191.6, "valid_targets_min": 797 }, { "epoch": 1.8960084033613445, "grad_norm": 0.6223425261146642, "learning_rate": 3.655590851393984e-05, "loss": 0.266, "loss_nan_ranks": 0, "loss_rank_avg": 0.2553020417690277, "step": 1805, "valid_targets_mean": 2840.2, "valid_targets_min": 718 }, { "epoch": 1.9012605042016806, "grad_norm": 0.571683682772899, "learning_rate": 3.652646159403468e-05, "loss": 0.2724, "loss_nan_ranks": 0, "loss_rank_avg": 0.2515188455581665, "step": 1810, "valid_targets_mean": 3140.4, "valid_targets_min": 919 }, { "epoch": 1.9065126050420167, "grad_norm": 0.6705352110164979, "learning_rate": 3.649690129025675e-05, "loss": 0.285, "loss_nan_ranks": 0, "loss_rank_avg": 0.28106388449668884, "step": 1815, "valid_targets_mean": 2872.1, "valid_targets_min": 713 }, { "epoch": 1.9117647058823528, "grad_norm": 0.6674867092826292, "learning_rate": 3.6467227805411824e-05, "loss": 0.2805, "loss_nan_ranks": 0, "loss_rank_avg": 0.2530893385410309, "step": 1820, "valid_targets_mean": 2187.0, "valid_targets_min": 1228 }, { "epoch": 1.917016806722689, "grad_norm": 0.7791624483418543, "learning_rate": 3.6437441343082174e-05, "loss": 0.2576, "loss_nan_ranks": 0, "loss_rank_avg": 0.25658732652664185, "step": 1825, "valid_targets_mean": 1671.2, "valid_targets_min": 830 }, { "epoch": 1.9222689075630253, "grad_norm": 0.7296738608202369, "learning_rate": 3.6407542107625167e-05, "loss": 0.2785, "loss_nan_ranks": 0, "loss_rank_avg": 0.25650477409362793, "step": 1830, "valid_targets_mean": 2080.8, "valid_targets_min": 596 }, { "epoch": 1.9275210084033614, "grad_norm": 0.6401628879972454, "learning_rate": 3.637753030417192e-05, "loss": 0.2882, "loss_nan_ranks": 0, "loss_rank_avg": 0.271770179271698, "step": 1835, "valid_targets_mean": 2537.3, "valid_targets_min": 1114 }, { "epoch": 1.9327731092436975, "grad_norm": 0.6126369558801827, "learning_rate": 3.6347406138625805e-05, "loss": 0.2925, "loss_nan_ranks": 0, "loss_rank_avg": 0.2938627600669861, "step": 1840, "valid_targets_mean": 2981.4, "valid_targets_min": 800 }, { "epoch": 1.9380252100840336, "grad_norm": 0.7218262814733415, "learning_rate": 3.631716981766111e-05, "loss": 0.2786, "loss_nan_ranks": 0, "loss_rank_avg": 0.30355095863342285, "step": 1845, "valid_targets_mean": 2301.2, "valid_targets_min": 641 }, { "epoch": 1.9432773109243697, "grad_norm": 0.668031618282193, "learning_rate": 3.6286821548721594e-05, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.27426058053970337, "step": 1850, "valid_targets_mean": 2243.2, "valid_targets_min": 570 }, { "epoch": 1.9485294117647058, "grad_norm": 0.752574443244231, "learning_rate": 3.625636154001904e-05, "loss": 0.2859, "loss_nan_ranks": 0, "loss_rank_avg": 0.3078942894935608, "step": 1855, "valid_targets_mean": 2398.1, "valid_targets_min": 760 }, { "epoch": 1.9537815126050422, "grad_norm": 0.7317868910075894, "learning_rate": 3.622579000053186e-05, "loss": 0.2737, "loss_nan_ranks": 0, "loss_rank_avg": 0.28089436888694763, "step": 1860, "valid_targets_mean": 2312.2, "valid_targets_min": 824 }, { "epoch": 1.9590336134453783, "grad_norm": 0.5809494600449272, "learning_rate": 3.619510714000368e-05, "loss": 0.2872, "loss_nan_ranks": 0, "loss_rank_avg": 0.28781622648239136, "step": 1865, "valid_targets_mean": 3431.6, "valid_targets_min": 729 }, { "epoch": 1.9642857142857144, "grad_norm": 0.6561581539587649, "learning_rate": 3.616431316894181e-05, "loss": 0.2752, "loss_nan_ranks": 0, "loss_rank_avg": 0.2707546651363373, "step": 1870, "valid_targets_mean": 2314.8, "valid_targets_min": 634 }, { "epoch": 1.9695378151260505, "grad_norm": 0.6586257109850335, "learning_rate": 3.613340829861592e-05, "loss": 0.2674, "loss_nan_ranks": 0, "loss_rank_avg": 0.28310245275497437, "step": 1875, "valid_targets_mean": 2942.6, "valid_targets_min": 936 }, { "epoch": 1.9747899159663866, "grad_norm": 0.6401802852139319, "learning_rate": 3.61023927410565e-05, "loss": 0.2666, "loss_nan_ranks": 0, "loss_rank_avg": 0.290630578994751, "step": 1880, "valid_targets_mean": 2797.1, "valid_targets_min": 655 }, { "epoch": 1.9800420168067228, "grad_norm": 0.6218936013613373, "learning_rate": 3.607126670905346e-05, "loss": 0.2807, "loss_nan_ranks": 0, "loss_rank_avg": 0.27291837334632874, "step": 1885, "valid_targets_mean": 2842.4, "valid_targets_min": 484 }, { "epoch": 1.9852941176470589, "grad_norm": 0.6591905106890031, "learning_rate": 3.60400304161546e-05, "loss": 0.2745, "loss_nan_ranks": 0, "loss_rank_avg": 0.24094945192337036, "step": 1890, "valid_targets_mean": 2038.6, "valid_targets_min": 657 }, { "epoch": 1.990546218487395, "grad_norm": 0.6093929527492841, "learning_rate": 3.600868407666426e-05, "loss": 0.2653, "loss_nan_ranks": 0, "loss_rank_avg": 0.251456618309021, "step": 1895, "valid_targets_mean": 2710.1, "valid_targets_min": 740 }, { "epoch": 1.995798319327731, "grad_norm": 0.7825350266466161, "learning_rate": 3.597722790564172e-05, "loss": 0.2824, "loss_nan_ranks": 0, "loss_rank_avg": 0.288199245929718, "step": 1900, "valid_targets_mean": 1974.7, "valid_targets_min": 722 }, { "epoch": 2.0010504201680672, "grad_norm": 0.5933761068921561, "learning_rate": 3.5945662118899824e-05, "loss": 0.2795, "loss_nan_ranks": 0, "loss_rank_avg": 0.2670100927352905, "step": 1905, "valid_targets_mean": 3187.6, "valid_targets_min": 725 }, { "epoch": 2.0063025210084033, "grad_norm": 0.681788431886679, "learning_rate": 3.5913986933003455e-05, "loss": 0.2537, "loss_nan_ranks": 0, "loss_rank_avg": 0.23222820460796356, "step": 1910, "valid_targets_mean": 2392.1, "valid_targets_min": 856 }, { "epoch": 2.0115546218487395, "grad_norm": 0.6959432299927795, "learning_rate": 3.5882202565268046e-05, "loss": 0.2578, "loss_nan_ranks": 0, "loss_rank_avg": 0.25007233023643494, "step": 1915, "valid_targets_mean": 2417.9, "valid_targets_min": 775 }, { "epoch": 2.0168067226890756, "grad_norm": 0.7488088088666018, "learning_rate": 3.58503092337581e-05, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.26307564973831177, "step": 1920, "valid_targets_mean": 2433.2, "valid_targets_min": 923 }, { "epoch": 2.0220588235294117, "grad_norm": 0.8762656352125061, "learning_rate": 3.5818307157285705e-05, "loss": 0.2404, "loss_nan_ranks": 0, "loss_rank_avg": 0.2252756655216217, "step": 1925, "valid_targets_mean": 2069.1, "valid_targets_min": 848 }, { "epoch": 2.027310924369748, "grad_norm": 0.7108878947236019, "learning_rate": 3.5786196555409006e-05, "loss": 0.2483, "loss_nan_ranks": 0, "loss_rank_avg": 0.2223615050315857, "step": 1930, "valid_targets_mean": 2248.2, "valid_targets_min": 1239 }, { "epoch": 2.032563025210084, "grad_norm": 0.6819496202558551, "learning_rate": 3.575397764843073e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.2185153365135193, "step": 1935, "valid_targets_mean": 2224.1, "valid_targets_min": 757 }, { "epoch": 2.03781512605042, "grad_norm": 0.6372992890667374, "learning_rate": 3.572165065739664e-05, "loss": 0.2442, "loss_nan_ranks": 0, "loss_rank_avg": 0.2360488474369049, "step": 1940, "valid_targets_mean": 2788.4, "valid_targets_min": 889 }, { "epoch": 2.043067226890756, "grad_norm": 0.6386451317642459, "learning_rate": 3.5689215804094053e-05, "loss": 0.2322, "loss_nan_ranks": 0, "loss_rank_avg": 0.22324788570404053, "step": 1945, "valid_targets_mean": 2618.2, "valid_targets_min": 994 }, { "epoch": 2.0483193277310923, "grad_norm": 0.7004427658132236, "learning_rate": 3.5656673311050285e-05, "loss": 0.2515, "loss_nan_ranks": 0, "loss_rank_avg": 0.27351114153862, "step": 1950, "valid_targets_mean": 2478.5, "valid_targets_min": 933 }, { "epoch": 2.0535714285714284, "grad_norm": 0.7101917295820503, "learning_rate": 3.562402340153115e-05, "loss": 0.2297, "loss_nan_ranks": 0, "loss_rank_avg": 0.2520638406276703, "step": 1955, "valid_targets_mean": 2472.2, "valid_targets_min": 1105 }, { "epoch": 2.0588235294117645, "grad_norm": 0.6511098248209234, "learning_rate": 3.559126629953942e-05, "loss": 0.2551, "loss_nan_ranks": 0, "loss_rank_avg": 0.2435356080532074, "step": 1960, "valid_targets_mean": 3219.1, "valid_targets_min": 1104 }, { "epoch": 2.064075630252101, "grad_norm": 0.6358952603701429, "learning_rate": 3.5558402229813287e-05, "loss": 0.2449, "loss_nan_ranks": 0, "loss_rank_avg": 0.2297707498073578, "step": 1965, "valid_targets_mean": 2425.1, "valid_targets_min": 881 }, { "epoch": 2.069327731092437, "grad_norm": 0.6868889163392828, "learning_rate": 3.552543141782483e-05, "loss": 0.2333, "loss_nan_ranks": 0, "loss_rank_avg": 0.24342474341392517, "step": 1970, "valid_targets_mean": 2674.5, "valid_targets_min": 522 }, { "epoch": 2.0745798319327733, "grad_norm": 0.6503662588808112, "learning_rate": 3.549235408977843e-05, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.23457615077495575, "step": 1975, "valid_targets_mean": 2697.2, "valid_targets_min": 874 }, { "epoch": 2.0798319327731094, "grad_norm": 0.822377652612648, "learning_rate": 3.545917047260928e-05, "loss": 0.2556, "loss_nan_ranks": 0, "loss_rank_avg": 0.26807093620300293, "step": 1980, "valid_targets_mean": 1928.6, "valid_targets_min": 930 }, { "epoch": 2.0850840336134455, "grad_norm": 0.7145196067189729, "learning_rate": 3.542588079398179e-05, "loss": 0.2426, "loss_nan_ranks": 0, "loss_rank_avg": 0.26111432909965515, "step": 1985, "valid_targets_mean": 2330.2, "valid_targets_min": 727 }, { "epoch": 2.0903361344537816, "grad_norm": 0.7523096751763567, "learning_rate": 3.539248528228801e-05, "loss": 0.2426, "loss_nan_ranks": 0, "loss_rank_avg": 0.24235697090625763, "step": 1990, "valid_targets_mean": 2053.5, "valid_targets_min": 790 }, { "epoch": 2.0955882352941178, "grad_norm": 0.7632438420213485, "learning_rate": 3.535898416664611e-05, "loss": 0.2326, "loss_nan_ranks": 0, "loss_rank_avg": 0.22527560591697693, "step": 1995, "valid_targets_mean": 2201.0, "valid_targets_min": 765 }, { "epoch": 2.100840336134454, "grad_norm": 0.7057387201013904, "learning_rate": 3.5325377676898766e-05, "loss": 0.233, "loss_nan_ranks": 0, "loss_rank_avg": 0.25476691126823425, "step": 2000, "valid_targets_mean": 2419.0, "valid_targets_min": 944 }, { "epoch": 2.10609243697479, "grad_norm": 0.6906581075458723, "learning_rate": 3.529166604361161e-05, "loss": 0.2323, "loss_nan_ranks": 0, "loss_rank_avg": 0.19508974254131317, "step": 2005, "valid_targets_mean": 1831.8, "valid_targets_min": 959 }, { "epoch": 2.111344537815126, "grad_norm": 0.7527030761728207, "learning_rate": 3.525784949807162e-05, "loss": 0.2359, "loss_nan_ranks": 0, "loss_rank_avg": 0.23376065492630005, "step": 2010, "valid_targets_mean": 2055.6, "valid_targets_min": 522 }, { "epoch": 2.116596638655462, "grad_norm": 0.6868567018841076, "learning_rate": 3.522392827228557e-05, "loss": 0.2511, "loss_nan_ranks": 0, "loss_rank_avg": 0.2521514296531677, "step": 2015, "valid_targets_mean": 3081.2, "valid_targets_min": 1079 }, { "epoch": 2.1218487394957983, "grad_norm": 0.6159147126631715, "learning_rate": 3.518990259897841e-05, "loss": 0.2301, "loss_nan_ranks": 0, "loss_rank_avg": 0.24102434515953064, "step": 2020, "valid_targets_mean": 3128.9, "valid_targets_min": 856 }, { "epoch": 2.1271008403361344, "grad_norm": 0.6607408752549182, "learning_rate": 3.515577271159167e-05, "loss": 0.2451, "loss_nan_ranks": 0, "loss_rank_avg": 0.24916204810142517, "step": 2025, "valid_targets_mean": 2437.9, "valid_targets_min": 895 }, { "epoch": 2.1323529411764706, "grad_norm": 0.6823759669457126, "learning_rate": 3.512153884428188e-05, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.24420082569122314, "step": 2030, "valid_targets_mean": 2662.5, "valid_targets_min": 1212 }, { "epoch": 2.1376050420168067, "grad_norm": 0.8063415806620354, "learning_rate": 3.5087201231918944e-05, "loss": 0.2482, "loss_nan_ranks": 0, "loss_rank_avg": 0.255155086517334, "step": 2035, "valid_targets_mean": 2731.2, "valid_targets_min": 669 }, { "epoch": 2.142857142857143, "grad_norm": 0.7415414698356663, "learning_rate": 3.505276011008454e-05, "loss": 0.2435, "loss_nan_ranks": 0, "loss_rank_avg": 0.23635327816009521, "step": 2040, "valid_targets_mean": 2135.6, "valid_targets_min": 713 }, { "epoch": 2.148109243697479, "grad_norm": 0.6907057684258697, "learning_rate": 3.501821571507048e-05, "loss": 0.2379, "loss_nan_ranks": 0, "loss_rank_avg": 0.24406486749649048, "step": 2045, "valid_targets_mean": 2447.7, "valid_targets_min": 625 }, { "epoch": 2.153361344537815, "grad_norm": 0.6782470155275483, "learning_rate": 3.498356828387714e-05, "loss": 0.2463, "loss_nan_ranks": 0, "loss_rank_avg": 0.23916223645210266, "step": 2050, "valid_targets_mean": 2313.4, "valid_targets_min": 761 }, { "epoch": 2.158613445378151, "grad_norm": 0.5671322606625604, "learning_rate": 3.494881805421176e-05, "loss": 0.2438, "loss_nan_ranks": 0, "loss_rank_avg": 0.19718879461288452, "step": 2055, "valid_targets_mean": 2824.4, "valid_targets_min": 677 }, { "epoch": 2.1638655462184873, "grad_norm": 0.9382283657965643, "learning_rate": 3.4913965264486894e-05, "loss": 0.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.25609293580055237, "step": 2060, "valid_targets_mean": 1910.2, "valid_targets_min": 732 }, { "epoch": 2.1691176470588234, "grad_norm": 0.6346830510041134, "learning_rate": 3.48790101538187e-05, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.2414173036813736, "step": 2065, "valid_targets_mean": 2811.0, "valid_targets_min": 1046 }, { "epoch": 2.1743697478991595, "grad_norm": 0.7269704066923304, "learning_rate": 3.484395296202537e-05, "loss": 0.2459, "loss_nan_ranks": 0, "loss_rank_avg": 0.24697639048099518, "step": 2070, "valid_targets_mean": 2118.1, "valid_targets_min": 1008 }, { "epoch": 2.1796218487394956, "grad_norm": 0.6343101249317197, "learning_rate": 3.480879392962541e-05, "loss": 0.2452, "loss_nan_ranks": 0, "loss_rank_avg": 0.23526614904403687, "step": 2075, "valid_targets_mean": 2820.8, "valid_targets_min": 635 }, { "epoch": 2.184873949579832, "grad_norm": 0.7287435124218465, "learning_rate": 3.477353329783606e-05, "loss": 0.2366, "loss_nan_ranks": 0, "loss_rank_avg": 0.24225783348083496, "step": 2080, "valid_targets_mean": 2625.6, "valid_targets_min": 1045 }, { "epoch": 2.190126050420168, "grad_norm": 0.713355174077326, "learning_rate": 3.4738171308571595e-05, "loss": 0.2524, "loss_nan_ranks": 0, "loss_rank_avg": 0.254425972700119, "step": 2085, "valid_targets_mean": 2268.8, "valid_targets_min": 802 }, { "epoch": 2.1953781512605044, "grad_norm": 0.6705604877150245, "learning_rate": 3.470270820444168e-05, "loss": 0.2453, "loss_nan_ranks": 0, "loss_rank_avg": 0.2541666328907013, "step": 2090, "valid_targets_mean": 2757.6, "valid_targets_min": 952 }, { "epoch": 2.2006302521008405, "grad_norm": 0.7233467972990565, "learning_rate": 3.4667144228749697e-05, "loss": 0.2656, "loss_nan_ranks": 0, "loss_rank_avg": 0.25709813833236694, "step": 2095, "valid_targets_mean": 2277.6, "valid_targets_min": 661 }, { "epoch": 2.2058823529411766, "grad_norm": 0.7024704278871472, "learning_rate": 3.463147962549109e-05, "loss": 0.2302, "loss_nan_ranks": 0, "loss_rank_avg": 0.238604336977005, "step": 2100, "valid_targets_mean": 2394.7, "valid_targets_min": 830 }, { "epoch": 2.2111344537815127, "grad_norm": 0.7334542386999148, "learning_rate": 3.459571463935168e-05, "loss": 0.2423, "loss_nan_ranks": 0, "loss_rank_avg": 0.25194650888442993, "step": 2105, "valid_targets_mean": 2613.2, "valid_targets_min": 1580 }, { "epoch": 2.216386554621849, "grad_norm": 0.645760996168686, "learning_rate": 3.455984951570598e-05, "loss": 0.2452, "loss_nan_ranks": 0, "loss_rank_avg": 0.22080859541893005, "step": 2110, "valid_targets_mean": 2687.3, "valid_targets_min": 738 }, { "epoch": 2.221638655462185, "grad_norm": 0.6519130528193421, "learning_rate": 3.452388450061556e-05, "loss": 0.2498, "loss_nan_ranks": 0, "loss_rank_avg": 0.2937582731246948, "step": 2115, "valid_targets_mean": 3205.2, "valid_targets_min": 1111 }, { "epoch": 2.226890756302521, "grad_norm": 0.6624235701635455, "learning_rate": 3.448781984082727e-05, "loss": 0.2343, "loss_nan_ranks": 0, "loss_rank_avg": 0.21843945980072021, "step": 2120, "valid_targets_mean": 2508.0, "valid_targets_min": 1057 }, { "epoch": 2.232142857142857, "grad_norm": 0.7029645390202783, "learning_rate": 3.4451655783771625e-05, "loss": 0.2541, "loss_nan_ranks": 0, "loss_rank_avg": 0.2414093017578125, "step": 2125, "valid_targets_mean": 2228.1, "valid_targets_min": 684 }, { "epoch": 2.2373949579831933, "grad_norm": 0.7968386644644923, "learning_rate": 3.4415392577561064e-05, "loss": 0.2339, "loss_nan_ranks": 0, "loss_rank_avg": 0.24058222770690918, "step": 2130, "valid_targets_mean": 1892.4, "valid_targets_min": 705 }, { "epoch": 2.2426470588235294, "grad_norm": 0.7056496069912468, "learning_rate": 3.4379030470988285e-05, "loss": 0.2477, "loss_nan_ranks": 0, "loss_rank_avg": 0.24626708030700684, "step": 2135, "valid_targets_mean": 2260.1, "valid_targets_min": 928 }, { "epoch": 2.2478991596638656, "grad_norm": 0.6124790183288958, "learning_rate": 3.4342569713524496e-05, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.22665052115917206, "step": 2140, "valid_targets_mean": 3020.3, "valid_targets_min": 1178 }, { "epoch": 2.2531512605042017, "grad_norm": 0.7290143698690328, "learning_rate": 3.4306010555317735e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.26667648553848267, "step": 2145, "valid_targets_mean": 2242.3, "valid_targets_min": 822 }, { "epoch": 2.258403361344538, "grad_norm": 0.6119475782036818, "learning_rate": 3.4269353247191135e-05, "loss": 0.2374, "loss_nan_ranks": 0, "loss_rank_avg": 0.2166629135608673, "step": 2150, "valid_targets_mean": 2546.4, "valid_targets_min": 997 }, { "epoch": 2.263655462184874, "grad_norm": 0.6765056487027129, "learning_rate": 3.423259804064122e-05, "loss": 0.2492, "loss_nan_ranks": 0, "loss_rank_avg": 0.24621796607971191, "step": 2155, "valid_targets_mean": 2518.2, "valid_targets_min": 1296 }, { "epoch": 2.26890756302521, "grad_norm": 0.711905698459275, "learning_rate": 3.419574518783616e-05, "loss": 0.2287, "loss_nan_ranks": 0, "loss_rank_avg": 0.24736756086349487, "step": 2160, "valid_targets_mean": 3044.6, "valid_targets_min": 607 }, { "epoch": 2.274159663865546, "grad_norm": 0.6672052083995789, "learning_rate": 3.4158794941614055e-05, "loss": 0.2546, "loss_nan_ranks": 0, "loss_rank_avg": 0.24737080931663513, "step": 2165, "valid_targets_mean": 3020.8, "valid_targets_min": 740 }, { "epoch": 2.2794117647058822, "grad_norm": 0.7567079909016078, "learning_rate": 3.4121747555481216e-05, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.2148715853691101, "step": 2170, "valid_targets_mean": 1714.9, "valid_targets_min": 646 }, { "epoch": 2.2846638655462184, "grad_norm": 0.7056947251086683, "learning_rate": 3.4084603283610365e-05, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.27144932746887207, "step": 2175, "valid_targets_mean": 2400.7, "valid_targets_min": 873 }, { "epoch": 2.2899159663865545, "grad_norm": 0.7646246632019781, "learning_rate": 3.404736238083897e-05, "loss": 0.2429, "loss_nan_ranks": 0, "loss_rank_avg": 0.23836296796798706, "step": 2180, "valid_targets_mean": 2148.2, "valid_targets_min": 709 }, { "epoch": 2.2951680672268906, "grad_norm": 0.6677517363916046, "learning_rate": 3.401002510266744e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.24747160077095032, "step": 2185, "valid_targets_mean": 2523.8, "valid_targets_min": 677 }, { "epoch": 2.3004201680672267, "grad_norm": 0.7787607353169186, "learning_rate": 3.397259170525739e-05, "loss": 0.2398, "loss_nan_ranks": 0, "loss_rank_avg": 0.24741989374160767, "step": 2190, "valid_targets_mean": 2161.8, "valid_targets_min": 1218 }, { "epoch": 2.3056722689075633, "grad_norm": 0.6898906104395905, "learning_rate": 3.393506244542991e-05, "loss": 0.2345, "loss_nan_ranks": 0, "loss_rank_avg": 0.21572214365005493, "step": 2195, "valid_targets_mean": 2425.9, "valid_targets_min": 754 }, { "epoch": 2.310924369747899, "grad_norm": 0.7076822593529297, "learning_rate": 3.389743758066374e-05, "loss": 0.2481, "loss_nan_ranks": 0, "loss_rank_avg": 0.2650451064109802, "step": 2200, "valid_targets_mean": 2744.9, "valid_targets_min": 807 }, { "epoch": 2.3161764705882355, "grad_norm": 0.7536553955769041, "learning_rate": 3.385971736909357e-05, "loss": 0.257, "loss_nan_ranks": 0, "loss_rank_avg": 0.2877483367919922, "step": 2205, "valid_targets_mean": 2068.6, "valid_targets_min": 657 }, { "epoch": 2.3214285714285716, "grad_norm": 0.7234207845549456, "learning_rate": 3.382190206950822e-05, "loss": 0.2504, "loss_nan_ranks": 0, "loss_rank_avg": 0.243576318025589, "step": 2210, "valid_targets_mean": 2941.5, "valid_targets_min": 967 }, { "epoch": 2.3266806722689077, "grad_norm": 0.7515713668566515, "learning_rate": 3.3783991941348916e-05, "loss": 0.2464, "loss_nan_ranks": 0, "loss_rank_avg": 0.264710009098053, "step": 2215, "valid_targets_mean": 2004.6, "valid_targets_min": 732 }, { "epoch": 2.331932773109244, "grad_norm": 0.6251497478316201, "learning_rate": 3.374598724470745e-05, "loss": 0.2429, "loss_nan_ranks": 0, "loss_rank_avg": 0.24632088840007782, "step": 2220, "valid_targets_mean": 2663.2, "valid_targets_min": 786 }, { "epoch": 2.33718487394958, "grad_norm": 0.6823271730426904, "learning_rate": 3.370788824032441e-05, "loss": 0.2411, "loss_nan_ranks": 0, "loss_rank_avg": 0.24375592172145844, "step": 2225, "valid_targets_mean": 2528.2, "valid_targets_min": 1099 }, { "epoch": 2.342436974789916, "grad_norm": 0.650663602449571, "learning_rate": 3.366969518958746e-05, "loss": 0.2552, "loss_nan_ranks": 0, "loss_rank_avg": 0.2503768801689148, "step": 2230, "valid_targets_mean": 2865.1, "valid_targets_min": 679 }, { "epoch": 2.347689075630252, "grad_norm": 0.6601800895017542, "learning_rate": 3.363140835452945e-05, "loss": 0.2565, "loss_nan_ranks": 0, "loss_rank_avg": 0.2578763961791992, "step": 2235, "valid_targets_mean": 2738.4, "valid_targets_min": 1007 }, { "epoch": 2.3529411764705883, "grad_norm": 0.692317322973956, "learning_rate": 3.3593027997826654e-05, "loss": 0.2478, "loss_nan_ranks": 0, "loss_rank_avg": 0.2523569166660309, "step": 2240, "valid_targets_mean": 2517.1, "valid_targets_min": 714 }, { "epoch": 2.3581932773109244, "grad_norm": 0.7286731675117749, "learning_rate": 3.355455438279702e-05, "loss": 0.228, "loss_nan_ranks": 0, "loss_rank_avg": 0.20360924303531647, "step": 2245, "valid_targets_mean": 1795.9, "valid_targets_min": 521 }, { "epoch": 2.3634453781512605, "grad_norm": 0.7006474168718877, "learning_rate": 3.351598777339827e-05, "loss": 0.2312, "loss_nan_ranks": 0, "loss_rank_avg": 0.2347767949104309, "step": 2250, "valid_targets_mean": 2666.3, "valid_targets_min": 1020 }, { "epoch": 2.3686974789915967, "grad_norm": 0.5939844727687064, "learning_rate": 3.3477328434226164e-05, "loss": 0.2413, "loss_nan_ranks": 0, "loss_rank_avg": 0.23968379199504852, "step": 2255, "valid_targets_mean": 3521.1, "valid_targets_min": 1437 }, { "epoch": 2.3739495798319328, "grad_norm": 0.7625687687660169, "learning_rate": 3.343857663051264e-05, "loss": 0.2371, "loss_nan_ranks": 0, "loss_rank_avg": 0.20183886587619781, "step": 2260, "valid_targets_mean": 1734.0, "valid_targets_min": 727 }, { "epoch": 2.379201680672269, "grad_norm": 0.7219603926351075, "learning_rate": 3.339973262812403e-05, "loss": 0.2486, "loss_nan_ranks": 0, "loss_rank_avg": 0.22381290793418884, "step": 2265, "valid_targets_mean": 2065.6, "valid_targets_min": 753 }, { "epoch": 2.384453781512605, "grad_norm": 0.6274958459143466, "learning_rate": 3.336079669355921e-05, "loss": 0.2592, "loss_nan_ranks": 0, "loss_rank_avg": 0.26679128408432007, "step": 2270, "valid_targets_mean": 3185.1, "valid_targets_min": 886 }, { "epoch": 2.389705882352941, "grad_norm": 0.6780169305716136, "learning_rate": 3.332176909394777e-05, "loss": 0.2304, "loss_nan_ranks": 0, "loss_rank_avg": 0.2543075978755951, "step": 2275, "valid_targets_mean": 2658.4, "valid_targets_min": 790 }, { "epoch": 2.3949579831932772, "grad_norm": 0.5895782853276299, "learning_rate": 3.3282650097048206e-05, "loss": 0.2562, "loss_nan_ranks": 0, "loss_rank_avg": 0.23634852468967438, "step": 2280, "valid_targets_mean": 3037.2, "valid_targets_min": 938 }, { "epoch": 2.4002100840336134, "grad_norm": 0.7590461713759683, "learning_rate": 3.324343997124606e-05, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.23115390539169312, "step": 2285, "valid_targets_mean": 2907.3, "valid_targets_min": 1192 }, { "epoch": 2.4054621848739495, "grad_norm": 0.7830457306094891, "learning_rate": 3.3204138985552094e-05, "loss": 0.2334, "loss_nan_ranks": 0, "loss_rank_avg": 0.27056723833084106, "step": 2290, "valid_targets_mean": 1997.1, "valid_targets_min": 627 }, { "epoch": 2.4107142857142856, "grad_norm": 0.6194407127598283, "learning_rate": 3.316474740960041e-05, "loss": 0.2445, "loss_nan_ranks": 0, "loss_rank_avg": 0.19772791862487793, "step": 2295, "valid_targets_mean": 2389.4, "valid_targets_min": 783 }, { "epoch": 2.4159663865546217, "grad_norm": 0.6520643182398843, "learning_rate": 3.312526551364667e-05, "loss": 0.2378, "loss_nan_ranks": 0, "loss_rank_avg": 0.22252126038074493, "step": 2300, "valid_targets_mean": 2424.2, "valid_targets_min": 658 }, { "epoch": 2.421218487394958, "grad_norm": 0.6888170634914532, "learning_rate": 3.308569356856616e-05, "loss": 0.2456, "loss_nan_ranks": 0, "loss_rank_avg": 0.24550795555114746, "step": 2305, "valid_targets_mean": 2487.7, "valid_targets_min": 701 }, { "epoch": 2.426470588235294, "grad_norm": 0.5982413076324926, "learning_rate": 3.3046031845851993e-05, "loss": 0.2497, "loss_nan_ranks": 0, "loss_rank_avg": 0.25226032733917236, "step": 2310, "valid_targets_mean": 3157.9, "valid_targets_min": 760 }, { "epoch": 2.43172268907563, "grad_norm": 0.6571326373833773, "learning_rate": 3.3006280617613214e-05, "loss": 0.227, "loss_nan_ranks": 0, "loss_rank_avg": 0.22074852883815765, "step": 2315, "valid_targets_mean": 2177.3, "valid_targets_min": 651 }, { "epoch": 2.4369747899159666, "grad_norm": 0.6894533182551907, "learning_rate": 3.296644015657295e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.21584966778755188, "step": 2320, "valid_targets_mean": 2304.4, "valid_targets_min": 864 }, { "epoch": 2.4422268907563023, "grad_norm": 0.6972919721870979, "learning_rate": 3.292651073606652e-05, "loss": 0.2328, "loss_nan_ranks": 0, "loss_rank_avg": 0.23415690660476685, "step": 2325, "valid_targets_mean": 2303.6, "valid_targets_min": 642 }, { "epoch": 2.447478991596639, "grad_norm": 0.6334274393400314, "learning_rate": 3.288649263003958e-05, "loss": 0.239, "loss_nan_ranks": 0, "loss_rank_avg": 0.23000667989253998, "step": 2330, "valid_targets_mean": 2705.6, "valid_targets_min": 752 }, { "epoch": 2.452731092436975, "grad_norm": 0.618380033342548, "learning_rate": 3.284638611304623e-05, "loss": 0.237, "loss_nan_ranks": 0, "loss_rank_avg": 0.2020508050918579, "step": 2335, "valid_targets_mean": 2487.5, "valid_targets_min": 1089 }, { "epoch": 2.457983193277311, "grad_norm": 0.6426580413501916, "learning_rate": 3.280619146024714e-05, "loss": 0.242, "loss_nan_ranks": 0, "loss_rank_avg": 0.23832888901233673, "step": 2340, "valid_targets_mean": 2668.8, "valid_targets_min": 627 }, { "epoch": 2.463235294117647, "grad_norm": 0.6496710491874221, "learning_rate": 3.2765908947407665e-05, "loss": 0.2465, "loss_nan_ranks": 0, "loss_rank_avg": 0.24643950164318085, "step": 2345, "valid_targets_mean": 3095.7, "valid_targets_min": 1618 }, { "epoch": 2.4684873949579833, "grad_norm": 0.6671046199265696, "learning_rate": 3.2725538850895933e-05, "loss": 0.2419, "loss_nan_ranks": 0, "loss_rank_avg": 0.24697118997573853, "step": 2350, "valid_targets_mean": 3175.2, "valid_targets_min": 662 }, { "epoch": 2.4737394957983194, "grad_norm": 0.608779379161093, "learning_rate": 3.268508144768096e-05, "loss": 0.2383, "loss_nan_ranks": 0, "loss_rank_avg": 0.2293773591518402, "step": 2355, "valid_targets_mean": 2969.8, "valid_targets_min": 814 }, { "epoch": 2.4789915966386555, "grad_norm": 0.7152715550331328, "learning_rate": 3.264453701533075e-05, "loss": 0.2418, "loss_nan_ranks": 0, "loss_rank_avg": 0.24297022819519043, "step": 2360, "valid_targets_mean": 2333.1, "valid_targets_min": 717 }, { "epoch": 2.4842436974789917, "grad_norm": 0.6884766551131825, "learning_rate": 3.260390583201041e-05, "loss": 0.2468, "loss_nan_ranks": 0, "loss_rank_avg": 0.2274142950773239, "step": 2365, "valid_targets_mean": 2203.9, "valid_targets_min": 886 }, { "epoch": 2.4894957983193278, "grad_norm": 0.6696446459706793, "learning_rate": 3.2563188176480217e-05, "loss": 0.2394, "loss_nan_ranks": 0, "loss_rank_avg": 0.2381383329629898, "step": 2370, "valid_targets_mean": 2626.6, "valid_targets_min": 841 }, { "epoch": 2.494747899159664, "grad_norm": 0.6401047773492371, "learning_rate": 3.252238432809368e-05, "loss": 0.2466, "loss_nan_ranks": 0, "loss_rank_avg": 0.2555871307849884, "step": 2375, "valid_targets_mean": 2559.3, "valid_targets_min": 244 }, { "epoch": 2.5, "grad_norm": 0.7122232018012691, "learning_rate": 3.2481494566795716e-05, "loss": 0.2501, "loss_nan_ranks": 0, "loss_rank_avg": 0.2375078648328781, "step": 2380, "valid_targets_mean": 2202.1, "valid_targets_min": 756 }, { "epoch": 2.505252100840336, "grad_norm": 0.6808348421830116, "learning_rate": 3.244051917312061e-05, "loss": 0.2424, "loss_nan_ranks": 0, "loss_rank_avg": 0.23621997237205505, "step": 2385, "valid_targets_mean": 2670.9, "valid_targets_min": 769 }, { "epoch": 2.5105042016806722, "grad_norm": 0.6243398513672342, "learning_rate": 3.239945842819018e-05, "loss": 0.2523, "loss_nan_ranks": 0, "loss_rank_avg": 0.23079396784305573, "step": 2390, "valid_targets_mean": 2769.6, "valid_targets_min": 1140 }, { "epoch": 2.5157563025210083, "grad_norm": 0.6608060434787372, "learning_rate": 3.2358312613711804e-05, "loss": 0.2547, "loss_nan_ranks": 0, "loss_rank_avg": 0.253095418214798, "step": 2395, "valid_targets_mean": 2660.6, "valid_targets_min": 612 }, { "epoch": 2.5210084033613445, "grad_norm": 0.7121224716293856, "learning_rate": 3.231708201197653e-05, "loss": 0.2408, "loss_nan_ranks": 0, "loss_rank_avg": 0.21336033940315247, "step": 2400, "valid_targets_mean": 2111.9, "valid_targets_min": 718 }, { "epoch": 2.5262605042016806, "grad_norm": 0.6338382678155583, "learning_rate": 3.227576690585706e-05, "loss": 0.2496, "loss_nan_ranks": 0, "loss_rank_avg": 0.2580583095550537, "step": 2405, "valid_targets_mean": 3034.8, "valid_targets_min": 770 }, { "epoch": 2.5315126050420167, "grad_norm": 0.7538479941411893, "learning_rate": 3.223436757880591e-05, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.22333016991615295, "step": 2410, "valid_targets_mean": 1899.9, "valid_targets_min": 793 }, { "epoch": 2.536764705882353, "grad_norm": 0.6566761719653834, "learning_rate": 3.219288431485337e-05, "loss": 0.2396, "loss_nan_ranks": 0, "loss_rank_avg": 0.24630621075630188, "step": 2415, "valid_targets_mean": 2439.4, "valid_targets_min": 803 }, { "epoch": 2.542016806722689, "grad_norm": 0.6042493534650838, "learning_rate": 3.2151317398605646e-05, "loss": 0.2392, "loss_nan_ranks": 0, "loss_rank_avg": 0.25575879216194153, "step": 2420, "valid_targets_mean": 3347.0, "valid_targets_min": 1460 }, { "epoch": 2.5472689075630255, "grad_norm": 0.6284939551656498, "learning_rate": 3.2109667115242815e-05, "loss": 0.2523, "loss_nan_ranks": 0, "loss_rank_avg": 0.24401450157165527, "step": 2425, "valid_targets_mean": 2538.7, "valid_targets_min": 721 }, { "epoch": 2.552521008403361, "grad_norm": 0.6528228615180638, "learning_rate": 3.206793375051694e-05, "loss": 0.2495, "loss_nan_ranks": 0, "loss_rank_avg": 0.25775042176246643, "step": 2430, "valid_targets_mean": 2766.4, "valid_targets_min": 844 }, { "epoch": 2.5577731092436977, "grad_norm": 0.6809614766621044, "learning_rate": 3.2026117590750086e-05, "loss": 0.2415, "loss_nan_ranks": 0, "loss_rank_avg": 0.25471678376197815, "step": 2435, "valid_targets_mean": 2465.3, "valid_targets_min": 800 }, { "epoch": 2.5630252100840334, "grad_norm": 0.7551843328572223, "learning_rate": 3.198421892283235e-05, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.2478971630334854, "step": 2440, "valid_targets_mean": 2033.8, "valid_targets_min": 788 }, { "epoch": 2.56827731092437, "grad_norm": 0.732748269558122, "learning_rate": 3.1942238034219885e-05, "loss": 0.2358, "loss_nan_ranks": 0, "loss_rank_avg": 0.25034216046333313, "step": 2445, "valid_targets_mean": 2231.6, "valid_targets_min": 700 }, { "epoch": 2.5735294117647056, "grad_norm": 0.6778858165535954, "learning_rate": 3.190017521293296e-05, "loss": 0.2494, "loss_nan_ranks": 0, "loss_rank_avg": 0.23393598198890686, "step": 2450, "valid_targets_mean": 2473.6, "valid_targets_min": 706 }, { "epoch": 2.578781512605042, "grad_norm": 0.6028467351028476, "learning_rate": 3.185803074755395e-05, "loss": 0.2458, "loss_nan_ranks": 0, "loss_rank_avg": 0.2509484887123108, "step": 2455, "valid_targets_mean": 2993.6, "valid_targets_min": 1079 }, { "epoch": 2.5840336134453783, "grad_norm": 0.7291609586754345, "learning_rate": 3.1815804927225363e-05, "loss": 0.2342, "loss_nan_ranks": 0, "loss_rank_avg": 0.2330750823020935, "step": 2460, "valid_targets_mean": 2394.2, "valid_targets_min": 744 }, { "epoch": 2.5892857142857144, "grad_norm": 0.7117035098015625, "learning_rate": 3.1773498041647876e-05, "loss": 0.2477, "loss_nan_ranks": 0, "loss_rank_avg": 0.2390121966600418, "step": 2465, "valid_targets_mean": 2322.9, "valid_targets_min": 972 }, { "epoch": 2.5945378151260505, "grad_norm": 0.7267971531615649, "learning_rate": 3.173111038107834e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.24882632493972778, "step": 2470, "valid_targets_mean": 2219.9, "valid_targets_min": 887 }, { "epoch": 2.5997899159663866, "grad_norm": 0.6553214599651517, "learning_rate": 3.168864223632776e-05, "loss": 0.2386, "loss_nan_ranks": 0, "loss_rank_avg": 0.23804202675819397, "step": 2475, "valid_targets_mean": 2536.0, "valid_targets_min": 791 }, { "epoch": 2.6050420168067228, "grad_norm": 0.6758403503740037, "learning_rate": 3.1646093898759334e-05, "loss": 0.235, "loss_nan_ranks": 0, "loss_rank_avg": 0.23084652423858643, "step": 2480, "valid_targets_mean": 2361.0, "valid_targets_min": 713 }, { "epoch": 2.610294117647059, "grad_norm": 0.7731853525222528, "learning_rate": 3.160346566028645e-05, "loss": 0.2566, "loss_nan_ranks": 0, "loss_rank_avg": 0.27315887808799744, "step": 2485, "valid_targets_mean": 1826.8, "valid_targets_min": 611 }, { "epoch": 2.615546218487395, "grad_norm": 0.7568845150659382, "learning_rate": 3.156075781337068e-05, "loss": 0.2446, "loss_nan_ranks": 0, "loss_rank_avg": 0.26611223816871643, "step": 2490, "valid_targets_mean": 2255.1, "valid_targets_min": 750 }, { "epoch": 2.620798319327731, "grad_norm": 0.7862703099000441, "learning_rate": 3.1517970651019735e-05, "loss": 0.2466, "loss_nan_ranks": 0, "loss_rank_avg": 0.26096102595329285, "step": 2495, "valid_targets_mean": 2134.9, "valid_targets_min": 625 }, { "epoch": 2.6260504201680672, "grad_norm": 0.67585915869592, "learning_rate": 3.1475104466785536e-05, "loss": 0.2462, "loss_nan_ranks": 0, "loss_rank_avg": 0.26358675956726074, "step": 2500, "valid_targets_mean": 2735.0, "valid_targets_min": 668 }, { "epoch": 2.6313025210084033, "grad_norm": 0.6329275844175969, "learning_rate": 3.143215955476211e-05, "loss": 0.2491, "loss_nan_ranks": 0, "loss_rank_avg": 0.24213485419750214, "step": 2505, "valid_targets_mean": 2604.1, "valid_targets_min": 832 }, { "epoch": 2.6365546218487395, "grad_norm": 0.6225761182265704, "learning_rate": 3.138913620958365e-05, "loss": 0.2581, "loss_nan_ranks": 0, "loss_rank_avg": 0.2655182480812073, "step": 2510, "valid_targets_mean": 3134.6, "valid_targets_min": 1472 }, { "epoch": 2.6418067226890756, "grad_norm": 0.6693316147755365, "learning_rate": 3.134603472642244e-05, "loss": 0.2612, "loss_nan_ranks": 0, "loss_rank_avg": 0.2521858513355255, "step": 2515, "valid_targets_mean": 2876.2, "valid_targets_min": 772 }, { "epoch": 2.6470588235294117, "grad_norm": 0.7037886165836804, "learning_rate": 3.1302855400986866e-05, "loss": 0.2518, "loss_nan_ranks": 0, "loss_rank_avg": 0.26977285742759705, "step": 2520, "valid_targets_mean": 2489.3, "valid_targets_min": 730 }, { "epoch": 2.652310924369748, "grad_norm": 0.7880145756624581, "learning_rate": 3.1259598529519336e-05, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.24999578297138214, "step": 2525, "valid_targets_mean": 2124.8, "valid_targets_min": 592 }, { "epoch": 2.657563025210084, "grad_norm": 0.6308106007836234, "learning_rate": 3.121626440879432e-05, "loss": 0.2391, "loss_nan_ranks": 0, "loss_rank_avg": 0.2530635595321655, "step": 2530, "valid_targets_mean": 2594.6, "valid_targets_min": 645 }, { "epoch": 2.66281512605042, "grad_norm": 0.7372282318557066, "learning_rate": 3.117285333611625e-05, "loss": 0.2264, "loss_nan_ranks": 0, "loss_rank_avg": 0.2395913451910019, "step": 2535, "valid_targets_mean": 1904.2, "valid_targets_min": 965 }, { "epoch": 2.668067226890756, "grad_norm": 0.667012830669792, "learning_rate": 3.112936560931752e-05, "loss": 0.2315, "loss_nan_ranks": 0, "loss_rank_avg": 0.22841016948223114, "step": 2540, "valid_targets_mean": 2184.2, "valid_targets_min": 942 }, { "epoch": 2.6733193277310923, "grad_norm": 0.6644445077742529, "learning_rate": 3.108580152675642e-05, "loss": 0.2501, "loss_nan_ranks": 0, "loss_rank_avg": 0.23634028434753418, "step": 2545, "valid_targets_mean": 2397.2, "valid_targets_min": 720 }, { "epoch": 2.678571428571429, "grad_norm": 0.7787179904265334, "learning_rate": 3.104216138731511e-05, "loss": 0.2383, "loss_nan_ranks": 0, "loss_rank_avg": 0.2434334009885788, "step": 2550, "valid_targets_mean": 2057.8, "valid_targets_min": 591 }, { "epoch": 2.6838235294117645, "grad_norm": 0.6846974855879137, "learning_rate": 3.0998445490397546e-05, "loss": 0.2379, "loss_nan_ranks": 0, "loss_rank_avg": 0.24789969623088837, "step": 2555, "valid_targets_mean": 2343.2, "valid_targets_min": 518 }, { "epoch": 2.689075630252101, "grad_norm": 0.7370020291648643, "learning_rate": 3.095465413592743e-05, "loss": 0.2442, "loss_nan_ranks": 0, "loss_rank_avg": 0.25336140394210815, "step": 2560, "valid_targets_mean": 2095.1, "valid_targets_min": 530 }, { "epoch": 2.6943277310924367, "grad_norm": 0.6326410487326921, "learning_rate": 3.091078762434616e-05, "loss": 0.241, "loss_nan_ranks": 0, "loss_rank_avg": 0.2503868043422699, "step": 2565, "valid_targets_mean": 2962.9, "valid_targets_min": 782 }, { "epoch": 2.6995798319327733, "grad_norm": 0.6774135014050404, "learning_rate": 3.086684625661081e-05, "loss": 0.2402, "loss_nan_ranks": 0, "loss_rank_avg": 0.2455071359872818, "step": 2570, "valid_targets_mean": 2381.1, "valid_targets_min": 744 }, { "epoch": 2.7048319327731094, "grad_norm": 0.6927859104567512, "learning_rate": 3.082283033419197e-05, "loss": 0.2543, "loss_nan_ranks": 0, "loss_rank_avg": 0.29159125685691833, "step": 2575, "valid_targets_mean": 2816.8, "valid_targets_min": 1047 }, { "epoch": 2.7100840336134455, "grad_norm": 0.6723232233408306, "learning_rate": 3.077874015907174e-05, "loss": 0.2481, "loss_nan_ranks": 0, "loss_rank_avg": 0.2541651725769043, "step": 2580, "valid_targets_mean": 2508.1, "valid_targets_min": 615 }, { "epoch": 2.7153361344537816, "grad_norm": 0.6173987363991384, "learning_rate": 3.073457603374167e-05, "loss": 0.2295, "loss_nan_ranks": 0, "loss_rank_avg": 0.2286214530467987, "step": 2585, "valid_targets_mean": 3016.7, "valid_targets_min": 687 }, { "epoch": 2.7205882352941178, "grad_norm": 0.7180860813557801, "learning_rate": 3.069033826120066e-05, "loss": 0.2476, "loss_nan_ranks": 0, "loss_rank_avg": 0.23617371916770935, "step": 2590, "valid_targets_mean": 2155.6, "valid_targets_min": 805 }, { "epoch": 2.725840336134454, "grad_norm": 0.6332083889121407, "learning_rate": 3.064602714495286e-05, "loss": 0.2303, "loss_nan_ranks": 0, "loss_rank_avg": 0.2275339514017105, "step": 2595, "valid_targets_mean": 2649.5, "valid_targets_min": 812 }, { "epoch": 2.73109243697479, "grad_norm": 0.5824671695502105, "learning_rate": 3.060164298900565e-05, "loss": 0.2474, "loss_nan_ranks": 0, "loss_rank_avg": 0.21272224187850952, "step": 2600, "valid_targets_mean": 2831.7, "valid_targets_min": 1280 }, { "epoch": 2.736344537815126, "grad_norm": 0.7999352632938964, "learning_rate": 3.055718609786749e-05, "loss": 0.2357, "loss_nan_ranks": 0, "loss_rank_avg": 0.23128217458724976, "step": 2605, "valid_targets_mean": 1753.5, "valid_targets_min": 704 }, { "epoch": 2.741596638655462, "grad_norm": 0.6862220018448458, "learning_rate": 3.051265677654585e-05, "loss": 0.2388, "loss_nan_ranks": 0, "loss_rank_avg": 0.24940389394760132, "step": 2610, "valid_targets_mean": 2828.1, "valid_targets_min": 1251 }, { "epoch": 2.7468487394957983, "grad_norm": 0.7409612251295014, "learning_rate": 3.0468055330545162e-05, "loss": 0.2466, "loss_nan_ranks": 0, "loss_rank_avg": 0.226776584982872, "step": 2615, "valid_targets_mean": 2611.8, "valid_targets_min": 698 }, { "epoch": 2.7521008403361344, "grad_norm": 0.7045597400364605, "learning_rate": 3.0423382065864653e-05, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.22663600742816925, "step": 2620, "valid_targets_mean": 1957.2, "valid_targets_min": 713 }, { "epoch": 2.7573529411764706, "grad_norm": 0.7198164206409869, "learning_rate": 3.0378637288996304e-05, "loss": 0.2404, "loss_nan_ranks": 0, "loss_rank_avg": 0.23351144790649414, "step": 2625, "valid_targets_mean": 2081.1, "valid_targets_min": 694 }, { "epoch": 2.7626050420168067, "grad_norm": 0.5873814818670327, "learning_rate": 3.033382130692269e-05, "loss": 0.243, "loss_nan_ranks": 0, "loss_rank_avg": 0.21516209840774536, "step": 2630, "valid_targets_mean": 2769.6, "valid_targets_min": 657 }, { "epoch": 2.767857142857143, "grad_norm": 0.6335582852038116, "learning_rate": 3.0288934427114955e-05, "loss": 0.2364, "loss_nan_ranks": 0, "loss_rank_avg": 0.2048596739768982, "step": 2635, "valid_targets_mean": 2169.6, "valid_targets_min": 697 }, { "epoch": 2.773109243697479, "grad_norm": 0.67104459281815, "learning_rate": 3.0243976957530602e-05, "loss": 0.2512, "loss_nan_ranks": 0, "loss_rank_avg": 0.2463095635175705, "step": 2640, "valid_targets_mean": 2423.3, "valid_targets_min": 702 }, { "epoch": 2.778361344537815, "grad_norm": 0.6291113433855628, "learning_rate": 3.0198949206611475e-05, "loss": 0.2302, "loss_nan_ranks": 0, "loss_rank_avg": 0.247708261013031, "step": 2645, "valid_targets_mean": 2842.7, "valid_targets_min": 680 }, { "epoch": 2.783613445378151, "grad_norm": 0.7183619458186878, "learning_rate": 3.0153851483281582e-05, "loss": 0.2478, "loss_nan_ranks": 0, "loss_rank_avg": 0.25846749544143677, "step": 2650, "valid_targets_mean": 2008.1, "valid_targets_min": 881 }, { "epoch": 2.7888655462184873, "grad_norm": 0.6296111197357144, "learning_rate": 3.010868409694499e-05, "loss": 0.2311, "loss_nan_ranks": 0, "loss_rank_avg": 0.2236376702785492, "step": 2655, "valid_targets_mean": 2598.8, "valid_targets_min": 1260 }, { "epoch": 2.7941176470588234, "grad_norm": 0.6152933998116437, "learning_rate": 3.0063447357483712e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.22628861665725708, "step": 2660, "valid_targets_mean": 2571.6, "valid_targets_min": 759 }, { "epoch": 2.79936974789916, "grad_norm": 0.6612164055765357, "learning_rate": 3.0018141575255587e-05, "loss": 0.2464, "loss_nan_ranks": 0, "loss_rank_avg": 0.22041192650794983, "step": 2665, "valid_targets_mean": 2249.2, "valid_targets_min": 865 }, { "epoch": 2.8046218487394956, "grad_norm": 0.7274917143243959, "learning_rate": 2.9972767061092107e-05, "loss": 0.2358, "loss_nan_ranks": 0, "loss_rank_avg": 0.2216116338968277, "step": 2670, "valid_targets_mean": 1970.0, "valid_targets_min": 648 }, { "epoch": 2.809873949579832, "grad_norm": 0.6906029702041456, "learning_rate": 2.9927324126296352e-05, "loss": 0.2523, "loss_nan_ranks": 0, "loss_rank_avg": 0.23099112510681152, "step": 2675, "valid_targets_mean": 2226.4, "valid_targets_min": 786 }, { "epoch": 2.815126050420168, "grad_norm": 0.6602585381068012, "learning_rate": 2.98818130826408e-05, "loss": 0.2395, "loss_nan_ranks": 0, "loss_rank_avg": 0.23484909534454346, "step": 2680, "valid_targets_mean": 2583.8, "valid_targets_min": 584 }, { "epoch": 2.8203781512605044, "grad_norm": 0.700101600296082, "learning_rate": 2.9836234242365204e-05, "loss": 0.2446, "loss_nan_ranks": 0, "loss_rank_avg": 0.26351702213287354, "step": 2685, "valid_targets_mean": 2604.2, "valid_targets_min": 1181 }, { "epoch": 2.82563025210084, "grad_norm": 1.1113414468630831, "learning_rate": 2.979058791817447e-05, "loss": 0.2361, "loss_nan_ranks": 0, "loss_rank_avg": 0.2611852288246155, "step": 2690, "valid_targets_mean": 2256.4, "valid_targets_min": 820 }, { "epoch": 2.8308823529411766, "grad_norm": 0.6092742628805521, "learning_rate": 2.974487442323647e-05, "loss": 0.2433, "loss_nan_ranks": 0, "loss_rank_avg": 0.22087091207504272, "step": 2695, "valid_targets_mean": 2595.6, "valid_targets_min": 869 }, { "epoch": 2.8361344537815127, "grad_norm": 0.6990782326556737, "learning_rate": 2.9699094071179938e-05, "loss": 0.2424, "loss_nan_ranks": 0, "loss_rank_avg": 0.24499669671058655, "step": 2700, "valid_targets_mean": 2403.4, "valid_targets_min": 737 }, { "epoch": 2.841386554621849, "grad_norm": 0.6311106363395269, "learning_rate": 2.9653247176092286e-05, "loss": 0.2526, "loss_nan_ranks": 0, "loss_rank_avg": 0.23955629765987396, "step": 2705, "valid_targets_mean": 3173.2, "valid_targets_min": 1337 }, { "epoch": 2.846638655462185, "grad_norm": 0.6466020830134367, "learning_rate": 2.9607334052517466e-05, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.25517964363098145, "step": 2710, "valid_targets_mean": 2581.2, "valid_targets_min": 869 }, { "epoch": 2.851890756302521, "grad_norm": 0.6364448114027271, "learning_rate": 2.9561355015453803e-05, "loss": 0.2428, "loss_nan_ranks": 0, "loss_rank_avg": 0.23851974308490753, "step": 2715, "valid_targets_mean": 2660.0, "valid_targets_min": 514 }, { "epoch": 2.857142857142857, "grad_norm": 0.6924312748250914, "learning_rate": 2.9515310380351847e-05, "loss": 0.2427, "loss_nan_ranks": 0, "loss_rank_avg": 0.25390565395355225, "step": 2720, "valid_targets_mean": 2458.5, "valid_targets_min": 740 }, { "epoch": 2.8623949579831933, "grad_norm": 0.6680820681499023, "learning_rate": 2.9469200463112186e-05, "loss": 0.2322, "loss_nan_ranks": 0, "loss_rank_avg": 0.22375771403312683, "step": 2725, "valid_targets_mean": 2688.9, "valid_targets_min": 648 }, { "epoch": 2.8676470588235294, "grad_norm": 0.6088973094421416, "learning_rate": 2.9423025580083298e-05, "loss": 0.2306, "loss_nan_ranks": 0, "loss_rank_avg": 0.20682302117347717, "step": 2730, "valid_targets_mean": 2755.1, "valid_targets_min": 810 }, { "epoch": 2.8728991596638656, "grad_norm": 0.6859266823062403, "learning_rate": 2.937678604805938e-05, "loss": 0.2342, "loss_nan_ranks": 0, "loss_rank_avg": 0.21406525373458862, "step": 2735, "valid_targets_mean": 2067.5, "valid_targets_min": 1166 }, { "epoch": 2.8781512605042017, "grad_norm": 0.6634535239376516, "learning_rate": 2.9330482184278168e-05, "loss": 0.2381, "loss_nan_ranks": 0, "loss_rank_avg": 0.24567797780036926, "step": 2740, "valid_targets_mean": 2457.8, "valid_targets_min": 694 }, { "epoch": 2.883403361344538, "grad_norm": 0.6340089258781645, "learning_rate": 2.9284114306418758e-05, "loss": 0.2389, "loss_nan_ranks": 0, "loss_rank_avg": 0.2264363169670105, "step": 2745, "valid_targets_mean": 2580.6, "valid_targets_min": 725 }, { "epoch": 2.888655462184874, "grad_norm": 0.6682756597647231, "learning_rate": 2.923768273259942e-05, "loss": 0.2342, "loss_nan_ranks": 0, "loss_rank_avg": 0.2170996367931366, "step": 2750, "valid_targets_mean": 2042.1, "valid_targets_min": 719 }, { "epoch": 2.89390756302521, "grad_norm": 0.6425815374610044, "learning_rate": 2.919118778137546e-05, "loss": 0.2371, "loss_nan_ranks": 0, "loss_rank_avg": 0.20629505813121796, "step": 2755, "valid_targets_mean": 2251.1, "valid_targets_min": 779 }, { "epoch": 2.899159663865546, "grad_norm": 0.6998165427866984, "learning_rate": 2.9144629771736954e-05, "loss": 0.2626, "loss_nan_ranks": 0, "loss_rank_avg": 0.27105337381362915, "step": 2760, "valid_targets_mean": 2532.9, "valid_targets_min": 859 }, { "epoch": 2.9044117647058822, "grad_norm": 0.6850527077895415, "learning_rate": 2.9098009023106645e-05, "loss": 0.2419, "loss_nan_ranks": 0, "loss_rank_avg": 0.2457822561264038, "step": 2765, "valid_targets_mean": 2170.1, "valid_targets_min": 803 }, { "epoch": 2.9096638655462184, "grad_norm": 0.5591265461314032, "learning_rate": 2.9051325855337684e-05, "loss": 0.2417, "loss_nan_ranks": 0, "loss_rank_avg": 0.23795005679130554, "step": 2770, "valid_targets_mean": 3337.8, "valid_targets_min": 739 }, { "epoch": 2.9149159663865545, "grad_norm": 0.7253204297962602, "learning_rate": 2.90045805887115e-05, "loss": 0.2298, "loss_nan_ranks": 0, "loss_rank_avg": 0.26152512431144714, "step": 2775, "valid_targets_mean": 2250.4, "valid_targets_min": 810 }, { "epoch": 2.9201680672268906, "grad_norm": 0.6320606127718346, "learning_rate": 2.8957773543935518e-05, "loss": 0.231, "loss_nan_ranks": 0, "loss_rank_avg": 0.22176562249660492, "step": 2780, "valid_targets_mean": 2631.1, "valid_targets_min": 943 }, { "epoch": 2.9254201680672267, "grad_norm": 0.6808320182720331, "learning_rate": 2.8910905042141046e-05, "loss": 0.2378, "loss_nan_ranks": 0, "loss_rank_avg": 0.2327442467212677, "step": 2785, "valid_targets_mean": 2285.2, "valid_targets_min": 836 }, { "epoch": 2.9306722689075633, "grad_norm": 0.7718275961115919, "learning_rate": 2.8863975404881022e-05, "loss": 0.2489, "loss_nan_ranks": 0, "loss_rank_avg": 0.23095104098320007, "step": 2790, "valid_targets_mean": 1883.9, "valid_targets_min": 836 }, { "epoch": 2.935924369747899, "grad_norm": 0.6901725161531642, "learning_rate": 2.881698495412781e-05, "loss": 0.2383, "loss_nan_ranks": 0, "loss_rank_avg": 0.23618492484092712, "step": 2795, "valid_targets_mean": 2379.7, "valid_targets_min": 771 }, { "epoch": 2.9411764705882355, "grad_norm": 0.6510522678878954, "learning_rate": 2.8769934012271004e-05, "loss": 0.2418, "loss_nan_ranks": 0, "loss_rank_avg": 0.26842981576919556, "step": 2800, "valid_targets_mean": 2957.8, "valid_targets_min": 632 }, { "epoch": 2.946428571428571, "grad_norm": 0.690393878481563, "learning_rate": 2.8722822902115228e-05, "loss": 0.2301, "loss_nan_ranks": 0, "loss_rank_avg": 0.2306583821773529, "step": 2805, "valid_targets_mean": 2844.0, "valid_targets_min": 777 }, { "epoch": 2.9516806722689077, "grad_norm": 0.6881209587839068, "learning_rate": 2.8675651946877884e-05, "loss": 0.2508, "loss_nan_ranks": 0, "loss_rank_avg": 0.26074153184890747, "step": 2810, "valid_targets_mean": 2694.2, "valid_targets_min": 744 }, { "epoch": 2.956932773109244, "grad_norm": 0.5892580385058059, "learning_rate": 2.862842147018696e-05, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.2656477689743042, "step": 2815, "valid_targets_mean": 3714.4, "valid_targets_min": 1073 }, { "epoch": 2.96218487394958, "grad_norm": 0.6824881929007802, "learning_rate": 2.858113179607881e-05, "loss": 0.2421, "loss_nan_ranks": 0, "loss_rank_avg": 0.23978950083255768, "step": 2820, "valid_targets_mean": 2137.4, "valid_targets_min": 873 }, { "epoch": 2.967436974789916, "grad_norm": 0.6773521974686484, "learning_rate": 2.8533783248995938e-05, "loss": 0.2435, "loss_nan_ranks": 0, "loss_rank_avg": 0.2452758550643921, "step": 2825, "valid_targets_mean": 2297.1, "valid_targets_min": 578 }, { "epoch": 2.972689075630252, "grad_norm": 0.7308770430795042, "learning_rate": 2.848637615378475e-05, "loss": 0.2534, "loss_nan_ranks": 0, "loss_rank_avg": 0.24922780692577362, "step": 2830, "valid_targets_mean": 2439.7, "valid_targets_min": 1055 }, { "epoch": 2.9779411764705883, "grad_norm": 0.6031497666783858, "learning_rate": 2.8438910835693314e-05, "loss": 0.2387, "loss_nan_ranks": 0, "loss_rank_avg": 0.2477431297302246, "step": 2835, "valid_targets_mean": 2889.0, "valid_targets_min": 720 }, { "epoch": 2.9831932773109244, "grad_norm": 0.7153376315518947, "learning_rate": 2.8391387620369192e-05, "loss": 0.2448, "loss_nan_ranks": 0, "loss_rank_avg": 0.25468868017196655, "step": 2840, "valid_targets_mean": 2295.2, "valid_targets_min": 721 }, { "epoch": 2.9884453781512605, "grad_norm": 0.6969521384499777, "learning_rate": 2.834380683385714e-05, "loss": 0.2429, "loss_nan_ranks": 0, "loss_rank_avg": 0.220721036195755, "step": 2845, "valid_targets_mean": 2244.9, "valid_targets_min": 1073 }, { "epoch": 2.9936974789915967, "grad_norm": 0.7414684846578835, "learning_rate": 2.8296168802596892e-05, "loss": 0.2391, "loss_nan_ranks": 0, "loss_rank_avg": 0.23130197823047638, "step": 2850, "valid_targets_mean": 1981.4, "valid_targets_min": 750 }, { "epoch": 2.9989495798319328, "grad_norm": 0.7478026755802675, "learning_rate": 2.8248473853420933e-05, "loss": 0.2411, "loss_nan_ranks": 0, "loss_rank_avg": 0.2313975691795349, "step": 2855, "valid_targets_mean": 1840.1, "valid_targets_min": 734 }, { "epoch": 3.004201680672269, "grad_norm": 0.6438849416484059, "learning_rate": 2.8200722313552247e-05, "loss": 0.2094, "loss_nan_ranks": 0, "loss_rank_avg": 0.20280009508132935, "step": 2860, "valid_targets_mean": 2363.8, "valid_targets_min": 720 }, { "epoch": 3.009453781512605, "grad_norm": 0.6700105099862343, "learning_rate": 2.8152914510602073e-05, "loss": 0.2048, "loss_nan_ranks": 0, "loss_rank_avg": 0.21491551399230957, "step": 2865, "valid_targets_mean": 2595.0, "valid_targets_min": 557 }, { "epoch": 3.014705882352941, "grad_norm": 0.6973369056653054, "learning_rate": 2.810505077256765e-05, "loss": 0.2078, "loss_nan_ranks": 0, "loss_rank_avg": 0.19096165895462036, "step": 2870, "valid_targets_mean": 2309.4, "valid_targets_min": 666 }, { "epoch": 3.0199579831932772, "grad_norm": 0.7391770624716282, "learning_rate": 2.8057131427829983e-05, "loss": 0.2055, "loss_nan_ranks": 0, "loss_rank_avg": 0.22697217762470245, "step": 2875, "valid_targets_mean": 2748.4, "valid_targets_min": 692 }, { "epoch": 3.0252100840336134, "grad_norm": 0.7323248663686152, "learning_rate": 2.800915680515157e-05, "loss": 0.2135, "loss_nan_ranks": 0, "loss_rank_avg": 0.21774935722351074, "step": 2880, "valid_targets_mean": 2176.5, "valid_targets_min": 567 }, { "epoch": 3.0304621848739495, "grad_norm": 0.7293920324073403, "learning_rate": 2.7961127233674167e-05, "loss": 0.2025, "loss_nan_ranks": 0, "loss_rank_avg": 0.19380387663841248, "step": 2885, "valid_targets_mean": 2121.6, "valid_targets_min": 760 }, { "epoch": 3.0357142857142856, "grad_norm": 0.7214083612213081, "learning_rate": 2.7913043042916513e-05, "loss": 0.2057, "loss_nan_ranks": 0, "loss_rank_avg": 0.2048916071653366, "step": 2890, "valid_targets_mean": 2635.6, "valid_targets_min": 916 }, { "epoch": 3.0409663865546217, "grad_norm": 0.6608114815054316, "learning_rate": 2.786490456277208e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.21670818328857422, "step": 2895, "valid_targets_mean": 2556.7, "valid_targets_min": 762 }, { "epoch": 3.046218487394958, "grad_norm": 0.66860146042256, "learning_rate": 2.7816712123506796e-05, "loss": 0.1965, "loss_nan_ranks": 0, "loss_rank_avg": 0.20460188388824463, "step": 2900, "valid_targets_mean": 2566.9, "valid_targets_min": 420 }, { "epoch": 3.051470588235294, "grad_norm": 0.7008326884337155, "learning_rate": 2.776846605575681e-05, "loss": 0.2132, "loss_nan_ranks": 0, "loss_rank_avg": 0.201397106051445, "step": 2905, "valid_targets_mean": 2224.4, "valid_targets_min": 663 }, { "epoch": 3.05672268907563, "grad_norm": 0.7720626933651689, "learning_rate": 2.772016669052618e-05, "loss": 0.2133, "loss_nan_ranks": 0, "loss_rank_avg": 0.2363039255142212, "step": 2910, "valid_targets_mean": 2557.2, "valid_targets_min": 1106 }, { "epoch": 3.0619747899159666, "grad_norm": 0.7021404124625371, "learning_rate": 2.767181435918464e-05, "loss": 0.1966, "loss_nan_ranks": 0, "loss_rank_avg": 0.20766621828079224, "step": 2915, "valid_targets_mean": 2482.2, "valid_targets_min": 855 }, { "epoch": 3.0672268907563027, "grad_norm": 0.6343762530485658, "learning_rate": 2.7623409393465298e-05, "loss": 0.2071, "loss_nan_ranks": 0, "loss_rank_avg": 0.19036218523979187, "step": 2920, "valid_targets_mean": 3076.4, "valid_targets_min": 741 }, { "epoch": 3.072478991596639, "grad_norm": 0.7035625376410721, "learning_rate": 2.7574952125462386e-05, "loss": 0.1964, "loss_nan_ranks": 0, "loss_rank_avg": 0.18567273020744324, "step": 2925, "valid_targets_mean": 2296.6, "valid_targets_min": 467 }, { "epoch": 3.077731092436975, "grad_norm": 0.6382148687024268, "learning_rate": 2.7526442887628962e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.19346240162849426, "step": 2930, "valid_targets_mean": 2762.5, "valid_targets_min": 937 }, { "epoch": 3.082983193277311, "grad_norm": 0.7008906642109496, "learning_rate": 2.7477882012774633e-05, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.21867555379867554, "step": 2935, "valid_targets_mean": 2581.9, "valid_targets_min": 1101 }, { "epoch": 3.088235294117647, "grad_norm": 0.708331450124728, "learning_rate": 2.742926983406328e-05, "loss": 0.2003, "loss_nan_ranks": 0, "loss_rank_avg": 0.22323349118232727, "step": 2940, "valid_targets_mean": 2543.1, "valid_targets_min": 680 }, { "epoch": 3.0934873949579833, "grad_norm": 0.7455067327316252, "learning_rate": 2.7380606685010767e-05, "loss": 0.2035, "loss_nan_ranks": 0, "loss_rank_avg": 0.21157895028591156, "step": 2945, "valid_targets_mean": 2247.4, "valid_targets_min": 701 }, { "epoch": 3.0987394957983194, "grad_norm": 0.6753873272175467, "learning_rate": 2.7331892899482654e-05, "loss": 0.2167, "loss_nan_ranks": 0, "loss_rank_avg": 0.2144676148891449, "step": 2950, "valid_targets_mean": 2689.9, "valid_targets_min": 767 }, { "epoch": 3.1039915966386555, "grad_norm": 0.6865230940428809, "learning_rate": 2.7283128811691893e-05, "loss": 0.2062, "loss_nan_ranks": 0, "loss_rank_avg": 0.2236787974834442, "step": 2955, "valid_targets_mean": 2606.0, "valid_targets_min": 869 }, { "epoch": 3.1092436974789917, "grad_norm": 0.6404580815887296, "learning_rate": 2.7234314756196564e-05, "loss": 0.1962, "loss_nan_ranks": 0, "loss_rank_avg": 0.197324737906456, "step": 2960, "valid_targets_mean": 2785.6, "valid_targets_min": 642 }, { "epoch": 3.1144957983193278, "grad_norm": 0.7140771160670712, "learning_rate": 2.718545106789755e-05, "loss": 0.2037, "loss_nan_ranks": 0, "loss_rank_avg": 0.19954288005828857, "step": 2965, "valid_targets_mean": 2234.5, "valid_targets_min": 872 }, { "epoch": 3.119747899159664, "grad_norm": 0.6975932021440397, "learning_rate": 2.713653808203626e-05, "loss": 0.1975, "loss_nan_ranks": 0, "loss_rank_avg": 0.2170845866203308, "step": 2970, "valid_targets_mean": 2639.3, "valid_targets_min": 680 }, { "epoch": 3.125, "grad_norm": 0.7113689274916534, "learning_rate": 2.7087576134192305e-05, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.21494010090827942, "step": 2975, "valid_targets_mean": 2403.4, "valid_targets_min": 1159 }, { "epoch": 3.130252100840336, "grad_norm": 0.6838797403752815, "learning_rate": 2.7038565560281252e-05, "loss": 0.2072, "loss_nan_ranks": 0, "loss_rank_avg": 0.22361846268177032, "step": 2980, "valid_targets_mean": 2727.6, "valid_targets_min": 1111 }, { "epoch": 3.1355042016806722, "grad_norm": 0.7301967352422043, "learning_rate": 2.6989506696552224e-05, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.24528783559799194, "step": 2985, "valid_targets_mean": 2384.6, "valid_targets_min": 675 }, { "epoch": 3.1407563025210083, "grad_norm": 0.7300962730703254, "learning_rate": 2.6940399879585685e-05, "loss": 0.2226, "loss_nan_ranks": 0, "loss_rank_avg": 0.24462322890758514, "step": 2990, "valid_targets_mean": 2379.9, "valid_targets_min": 747 }, { "epoch": 3.1460084033613445, "grad_norm": 0.6314374147339737, "learning_rate": 2.6891245446291093e-05, "loss": 0.1947, "loss_nan_ranks": 0, "loss_rank_avg": 0.20750781893730164, "step": 2995, "valid_targets_mean": 3385.5, "valid_targets_min": 734 }, { "epoch": 3.1512605042016806, "grad_norm": 0.6709712599868535, "learning_rate": 2.6842043733904578e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.19627419114112854, "step": 3000, "valid_targets_mean": 2626.9, "valid_targets_min": 1022 }, { "epoch": 3.1565126050420167, "grad_norm": 0.7079636790584424, "learning_rate": 2.6792795079986634e-05, "loss": 0.2089, "loss_nan_ranks": 0, "loss_rank_avg": 0.21414107084274292, "step": 3005, "valid_targets_mean": 2522.1, "valid_targets_min": 625 }, { "epoch": 3.161764705882353, "grad_norm": 0.8013316017451616, "learning_rate": 2.6743499822419833e-05, "loss": 0.2065, "loss_nan_ranks": 0, "loss_rank_avg": 0.21229714155197144, "step": 3010, "valid_targets_mean": 1945.2, "valid_targets_min": 1078 }, { "epoch": 3.167016806722689, "grad_norm": 0.7573033558532629, "learning_rate": 2.669415829940646e-05, "loss": 0.2004, "loss_nan_ranks": 0, "loss_rank_avg": 0.22666743397712708, "step": 3015, "valid_targets_mean": 2352.1, "valid_targets_min": 802 }, { "epoch": 3.172268907563025, "grad_norm": 0.6967416593034284, "learning_rate": 2.6644770849466226e-05, "loss": 0.2107, "loss_nan_ranks": 0, "loss_rank_avg": 0.19799959659576416, "step": 3020, "valid_targets_mean": 2473.9, "valid_targets_min": 926 }, { "epoch": 3.177521008403361, "grad_norm": 0.6958940312721166, "learning_rate": 2.6595337811433925e-05, "loss": 0.2213, "loss_nan_ranks": 0, "loss_rank_avg": 0.21963286399841309, "step": 3025, "valid_targets_mean": 2855.2, "valid_targets_min": 797 }, { "epoch": 3.1827731092436973, "grad_norm": 0.6644738321935247, "learning_rate": 2.654585952445714e-05, "loss": 0.2058, "loss_nan_ranks": 0, "loss_rank_avg": 0.19399645924568176, "step": 3030, "valid_targets_mean": 2638.8, "valid_targets_min": 640 }, { "epoch": 3.1880252100840334, "grad_norm": 0.7306469351103843, "learning_rate": 2.6496336327993882e-05, "loss": 0.2144, "loss_nan_ranks": 0, "loss_rank_avg": 0.20161199569702148, "step": 3035, "valid_targets_mean": 2136.2, "valid_targets_min": 711 }, { "epoch": 3.19327731092437, "grad_norm": 0.7466263828328548, "learning_rate": 2.6446768561810264e-05, "loss": 0.209, "loss_nan_ranks": 0, "loss_rank_avg": 0.20817327499389648, "step": 3040, "valid_targets_mean": 2153.1, "valid_targets_min": 798 }, { "epoch": 3.198529411764706, "grad_norm": 0.6197811979812847, "learning_rate": 2.6397156565978198e-05, "loss": 0.2048, "loss_nan_ranks": 0, "loss_rank_avg": 0.18749669194221497, "step": 3045, "valid_targets_mean": 2755.1, "valid_targets_min": 823 }, { "epoch": 3.203781512605042, "grad_norm": 0.6980373354580599, "learning_rate": 2.6347500680873043e-05, "loss": 0.2155, "loss_nan_ranks": 0, "loss_rank_avg": 0.20377440750598907, "step": 3050, "valid_targets_mean": 2491.8, "valid_targets_min": 725 }, { "epoch": 3.2090336134453783, "grad_norm": 0.7085865520639477, "learning_rate": 2.6297801247171258e-05, "loss": 0.2129, "loss_nan_ranks": 0, "loss_rank_avg": 0.2216644287109375, "step": 3055, "valid_targets_mean": 2806.9, "valid_targets_min": 1071 }, { "epoch": 3.2142857142857144, "grad_norm": 0.7205089790035474, "learning_rate": 2.6248058605848097e-05, "loss": 0.2212, "loss_nan_ranks": 0, "loss_rank_avg": 0.22407683730125427, "step": 3060, "valid_targets_mean": 2472.9, "valid_targets_min": 769 }, { "epoch": 3.2195378151260505, "grad_norm": 0.737404594127863, "learning_rate": 2.6198273098175234e-05, "loss": 0.2204, "loss_nan_ranks": 0, "loss_rank_avg": 0.20326296985149384, "step": 3065, "valid_targets_mean": 2019.1, "valid_targets_min": 888 }, { "epoch": 3.2247899159663866, "grad_norm": 0.6073130718222292, "learning_rate": 2.614844506571844e-05, "loss": 0.2108, "loss_nan_ranks": 0, "loss_rank_avg": 0.20230062305927277, "step": 3070, "valid_targets_mean": 3304.4, "valid_targets_min": 746 }, { "epoch": 3.2300420168067228, "grad_norm": 0.7085944292327786, "learning_rate": 2.609857485033525e-05, "loss": 0.215, "loss_nan_ranks": 0, "loss_rank_avg": 0.20458903908729553, "step": 3075, "valid_targets_mean": 2500.9, "valid_targets_min": 902 }, { "epoch": 3.235294117647059, "grad_norm": 0.7171287135570944, "learning_rate": 2.6048662794172595e-05, "loss": 0.2095, "loss_nan_ranks": 0, "loss_rank_avg": 0.20819462835788727, "step": 3080, "valid_targets_mean": 2273.6, "valid_targets_min": 787 }, { "epoch": 3.240546218487395, "grad_norm": 0.7241451356443119, "learning_rate": 2.599870923966447e-05, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.2197907567024231, "step": 3085, "valid_targets_mean": 2637.4, "valid_targets_min": 625 }, { "epoch": 3.245798319327731, "grad_norm": 0.6305118521703866, "learning_rate": 2.5948714529529565e-05, "loss": 0.191, "loss_nan_ranks": 0, "loss_rank_avg": 0.18660598993301392, "step": 3090, "valid_targets_mean": 3157.4, "valid_targets_min": 1567 }, { "epoch": 3.2510504201680672, "grad_norm": 0.6893413514689206, "learning_rate": 2.5898679006768958e-05, "loss": 0.2081, "loss_nan_ranks": 0, "loss_rank_avg": 0.19289371371269226, "step": 3095, "valid_targets_mean": 2322.9, "valid_targets_min": 681 }, { "epoch": 3.2563025210084033, "grad_norm": 0.7101789326050002, "learning_rate": 2.5848603014663702e-05, "loss": 0.2077, "loss_nan_ranks": 0, "loss_rank_avg": 0.2187972515821457, "step": 3100, "valid_targets_mean": 2543.6, "valid_targets_min": 1024 }, { "epoch": 3.2615546218487395, "grad_norm": 0.9990787057867775, "learning_rate": 2.579848689677252e-05, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.21138152480125427, "step": 3105, "valid_targets_mean": 2269.6, "valid_targets_min": 982 }, { "epoch": 3.2668067226890756, "grad_norm": 0.8018203500723405, "learning_rate": 2.5748330996929414e-05, "loss": 0.2023, "loss_nan_ranks": 0, "loss_rank_avg": 0.20356349647045135, "step": 3110, "valid_targets_mean": 1958.8, "valid_targets_min": 692 }, { "epoch": 3.2720588235294117, "grad_norm": 0.6603494412466163, "learning_rate": 2.5698135659241334e-05, "loss": 0.2031, "loss_nan_ranks": 0, "loss_rank_avg": 0.18327882885932922, "step": 3115, "valid_targets_mean": 2493.4, "valid_targets_min": 626 }, { "epoch": 3.277310924369748, "grad_norm": 0.762235597580697, "learning_rate": 2.564790122808579e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.20926137268543243, "step": 3120, "valid_targets_mean": 2595.1, "valid_targets_min": 720 }, { "epoch": 3.282563025210084, "grad_norm": 0.6535295283093114, "learning_rate": 2.5597628048108504e-05, "loss": 0.2168, "loss_nan_ranks": 0, "loss_rank_avg": 0.19361212849617004, "step": 3125, "valid_targets_mean": 2594.5, "valid_targets_min": 814 }, { "epoch": 3.28781512605042, "grad_norm": 0.7359578809709093, "learning_rate": 2.5547316464221058e-05, "loss": 0.2171, "loss_nan_ranks": 0, "loss_rank_avg": 0.24306191504001617, "step": 3130, "valid_targets_mean": 2595.2, "valid_targets_min": 762 }, { "epoch": 3.293067226890756, "grad_norm": 0.7555698425148304, "learning_rate": 2.5496966821598493e-05, "loss": 0.2028, "loss_nan_ranks": 0, "loss_rank_avg": 0.18649283051490784, "step": 3135, "valid_targets_mean": 2025.6, "valid_targets_min": 1099 }, { "epoch": 3.2983193277310923, "grad_norm": 0.6867271312637763, "learning_rate": 2.5446579465676977e-05, "loss": 0.1993, "loss_nan_ranks": 0, "loss_rank_avg": 0.2280460000038147, "step": 3140, "valid_targets_mean": 2837.4, "valid_targets_min": 940 }, { "epoch": 3.3035714285714284, "grad_norm": 0.7890879070663028, "learning_rate": 2.5396154742151407e-05, "loss": 0.2058, "loss_nan_ranks": 0, "loss_rank_avg": 0.24599486589431763, "step": 3145, "valid_targets_mean": 2421.9, "valid_targets_min": 617 }, { "epoch": 3.3088235294117645, "grad_norm": 0.7043690415607949, "learning_rate": 2.5345692996973075e-05, "loss": 0.2029, "loss_nan_ranks": 0, "loss_rank_avg": 0.20645210146903992, "step": 3150, "valid_targets_mean": 2250.8, "valid_targets_min": 654 }, { "epoch": 3.314075630252101, "grad_norm": 0.6920998160391696, "learning_rate": 2.5295194576347233e-05, "loss": 0.2121, "loss_nan_ranks": 0, "loss_rank_avg": 0.22358179092407227, "step": 3155, "valid_targets_mean": 2739.9, "valid_targets_min": 790 }, { "epoch": 3.3193277310924367, "grad_norm": 0.8209408504141388, "learning_rate": 2.5244659826730774e-05, "loss": 0.2082, "loss_nan_ranks": 0, "loss_rank_avg": 0.22088845074176788, "step": 3160, "valid_targets_mean": 2667.9, "valid_targets_min": 696 }, { "epoch": 3.3245798319327733, "grad_norm": 0.73587278467102, "learning_rate": 2.519408909482984e-05, "loss": 0.2101, "loss_nan_ranks": 0, "loss_rank_avg": 0.20288720726966858, "step": 3165, "valid_targets_mean": 2124.1, "valid_targets_min": 917 }, { "epoch": 3.3298319327731094, "grad_norm": 0.6501152833208236, "learning_rate": 2.5143482727597427e-05, "loss": 0.2008, "loss_nan_ranks": 0, "loss_rank_avg": 0.20123985409736633, "step": 3170, "valid_targets_mean": 3260.6, "valid_targets_min": 1042 }, { "epoch": 3.3350840336134455, "grad_norm": 0.6791329217706075, "learning_rate": 2.509284107223102e-05, "loss": 0.1986, "loss_nan_ranks": 0, "loss_rank_avg": 0.21437102556228638, "step": 3175, "valid_targets_mean": 2677.3, "valid_targets_min": 1019 }, { "epoch": 3.3403361344537816, "grad_norm": 0.8312153231004512, "learning_rate": 2.50421644761702e-05, "loss": 0.2154, "loss_nan_ranks": 0, "loss_rank_avg": 0.2082928568124771, "step": 3180, "valid_targets_mean": 1766.3, "valid_targets_min": 947 }, { "epoch": 3.3455882352941178, "grad_norm": 0.6346713038488362, "learning_rate": 2.499145328709429e-05, "loss": 0.2047, "loss_nan_ranks": 0, "loss_rank_avg": 0.2058856189250946, "step": 3185, "valid_targets_mean": 2967.8, "valid_targets_min": 818 }, { "epoch": 3.350840336134454, "grad_norm": 0.7841149043918871, "learning_rate": 2.4940707852919924e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.21573182940483093, "step": 3190, "valid_targets_mean": 1853.8, "valid_targets_min": 1039 }, { "epoch": 3.35609243697479, "grad_norm": 0.7289604889723915, "learning_rate": 2.488992852179868e-05, "loss": 0.2001, "loss_nan_ranks": 0, "loss_rank_avg": 0.21095168590545654, "step": 3195, "valid_targets_mean": 2192.4, "valid_targets_min": 1030 }, { "epoch": 3.361344537815126, "grad_norm": 0.7426897994171837, "learning_rate": 2.483911564211472e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.2094847857952118, "step": 3200, "valid_targets_mean": 2182.3, "valid_targets_min": 1090 }, { "epoch": 3.366596638655462, "grad_norm": 0.6905790936704768, "learning_rate": 2.4788269562482355e-05, "loss": 0.2038, "loss_nan_ranks": 0, "loss_rank_avg": 0.18250685930252075, "step": 3205, "valid_targets_mean": 2181.2, "valid_targets_min": 797 }, { "epoch": 3.3718487394957983, "grad_norm": 0.6711044771695471, "learning_rate": 2.4737390631743675e-05, "loss": 0.217, "loss_nan_ranks": 0, "loss_rank_avg": 0.21213862299919128, "step": 3210, "valid_targets_mean": 2841.9, "valid_targets_min": 715 }, { "epoch": 3.3771008403361344, "grad_norm": 0.7172706019446755, "learning_rate": 2.4686479198966146e-05, "loss": 0.2113, "loss_nan_ranks": 0, "loss_rank_avg": 0.21013203263282776, "step": 3215, "valid_targets_mean": 2435.9, "valid_targets_min": 848 }, { "epoch": 3.3823529411764706, "grad_norm": 0.746681881677102, "learning_rate": 2.463553561344024e-05, "loss": 0.2193, "loss_nan_ranks": 0, "loss_rank_avg": 0.2209860384464264, "step": 3220, "valid_targets_mean": 2233.9, "valid_targets_min": 929 }, { "epoch": 3.3876050420168067, "grad_norm": 0.7545727322641577, "learning_rate": 2.4584560224677013e-05, "loss": 0.2176, "loss_nan_ranks": 0, "loss_rank_avg": 0.2379944920539856, "step": 3225, "valid_targets_mean": 2649.4, "valid_targets_min": 738 }, { "epoch": 3.392857142857143, "grad_norm": 0.6782835854882808, "learning_rate": 2.4533553382405702e-05, "loss": 0.211, "loss_nan_ranks": 0, "loss_rank_avg": 0.20617589354515076, "step": 3230, "valid_targets_mean": 2802.6, "valid_targets_min": 882 }, { "epoch": 3.398109243697479, "grad_norm": 0.7578767328316001, "learning_rate": 2.4482515436571365e-05, "loss": 0.2172, "loss_nan_ranks": 0, "loss_rank_avg": 0.22788771986961365, "step": 3235, "valid_targets_mean": 2326.2, "valid_targets_min": 776 }, { "epoch": 3.403361344537815, "grad_norm": 0.6541735808021184, "learning_rate": 2.4431446737332437e-05, "loss": 0.2121, "loss_nan_ranks": 0, "loss_rank_avg": 0.20903077721595764, "step": 3240, "valid_targets_mean": 3203.4, "valid_targets_min": 1003 }, { "epoch": 3.408613445378151, "grad_norm": 0.7811038952636883, "learning_rate": 2.438034763505833e-05, "loss": 0.2166, "loss_nan_ranks": 0, "loss_rank_avg": 0.21477511525154114, "step": 3245, "valid_targets_mean": 1979.8, "valid_targets_min": 757 }, { "epoch": 3.4138655462184873, "grad_norm": 0.6625538840028757, "learning_rate": 2.432921848032707e-05, "loss": 0.2044, "loss_nan_ranks": 0, "loss_rank_avg": 0.2320900559425354, "step": 3250, "valid_targets_mean": 2910.2, "valid_targets_min": 1315 }, { "epoch": 3.4191176470588234, "grad_norm": 0.7485969796152663, "learning_rate": 2.427805962392286e-05, "loss": 0.2025, "loss_nan_ranks": 0, "loss_rank_avg": 0.20698726177215576, "step": 3255, "valid_targets_mean": 1875.1, "valid_targets_min": 863 }, { "epoch": 3.4243697478991595, "grad_norm": 0.7348995050217967, "learning_rate": 2.4226871416833683e-05, "loss": 0.1988, "loss_nan_ranks": 0, "loss_rank_avg": 0.20574046671390533, "step": 3260, "valid_targets_mean": 2167.6, "valid_targets_min": 1058 }, { "epoch": 3.4296218487394956, "grad_norm": 0.6743471501486973, "learning_rate": 2.4175654210248848e-05, "loss": 0.2121, "loss_nan_ranks": 0, "loss_rank_avg": 0.19565929472446442, "step": 3265, "valid_targets_mean": 2611.9, "valid_targets_min": 806 }, { "epoch": 3.434873949579832, "grad_norm": 0.6301404143473273, "learning_rate": 2.4124408355556677e-05, "loss": 0.2177, "loss_nan_ranks": 0, "loss_rank_avg": 0.22094877064228058, "step": 3270, "valid_targets_mean": 3081.8, "valid_targets_min": 686 }, { "epoch": 3.440126050420168, "grad_norm": 0.6526940719618316, "learning_rate": 2.4073134204342014e-05, "loss": 0.2089, "loss_nan_ranks": 0, "loss_rank_avg": 0.20152367651462555, "step": 3275, "valid_targets_mean": 2381.3, "valid_targets_min": 793 }, { "epoch": 3.4453781512605044, "grad_norm": 0.6659235538473005, "learning_rate": 2.4021832108383837e-05, "loss": 0.2207, "loss_nan_ranks": 0, "loss_rank_avg": 0.20738565921783447, "step": 3280, "valid_targets_mean": 2625.6, "valid_targets_min": 635 }, { "epoch": 3.4506302521008405, "grad_norm": 0.7166624142705825, "learning_rate": 2.3970502419652854e-05, "loss": 0.2073, "loss_nan_ranks": 0, "loss_rank_avg": 0.19094321131706238, "step": 3285, "valid_targets_mean": 2041.8, "valid_targets_min": 776 }, { "epoch": 3.4558823529411766, "grad_norm": 0.7984671258808161, "learning_rate": 2.3919145490309076e-05, "loss": 0.2116, "loss_nan_ranks": 0, "loss_rank_avg": 0.21888110041618347, "step": 3290, "valid_targets_mean": 1798.3, "valid_targets_min": 611 }, { "epoch": 3.4611344537815127, "grad_norm": 0.6963556467492686, "learning_rate": 2.38677616726994e-05, "loss": 0.1958, "loss_nan_ranks": 0, "loss_rank_avg": 0.17585915327072144, "step": 3295, "valid_targets_mean": 2040.5, "valid_targets_min": 914 }, { "epoch": 3.466386554621849, "grad_norm": 0.5743174603598479, "learning_rate": 2.381635131935521e-05, "loss": 0.205, "loss_nan_ranks": 0, "loss_rank_avg": 0.1667209416627884, "step": 3300, "valid_targets_mean": 3134.2, "valid_targets_min": 522 }, { "epoch": 3.471638655462185, "grad_norm": 0.7243626640826193, "learning_rate": 2.3764914782989926e-05, "loss": 0.2135, "loss_nan_ranks": 0, "loss_rank_avg": 0.22822029888629913, "step": 3305, "valid_targets_mean": 2619.9, "valid_targets_min": 740 }, { "epoch": 3.476890756302521, "grad_norm": 0.669561945697959, "learning_rate": 2.3713452416496625e-05, "loss": 0.2097, "loss_nan_ranks": 0, "loss_rank_avg": 0.20612934231758118, "step": 3310, "valid_targets_mean": 2525.0, "valid_targets_min": 717 }, { "epoch": 3.482142857142857, "grad_norm": 0.7414140882682606, "learning_rate": 2.366196457294558e-05, "loss": 0.2137, "loss_nan_ranks": 0, "loss_rank_avg": 0.21093863248825073, "step": 3315, "valid_targets_mean": 2090.9, "valid_targets_min": 739 }, { "epoch": 3.4873949579831933, "grad_norm": 0.6133977770277803, "learning_rate": 2.3610451605581858e-05, "loss": 0.2061, "loss_nan_ranks": 0, "loss_rank_avg": 0.1882474273443222, "step": 3320, "valid_targets_mean": 3069.8, "valid_targets_min": 891 }, { "epoch": 3.4926470588235294, "grad_norm": 0.6648952110036311, "learning_rate": 2.3558913867822905e-05, "loss": 0.2057, "loss_nan_ranks": 0, "loss_rank_avg": 0.20279830694198608, "step": 3325, "valid_targets_mean": 2729.6, "valid_targets_min": 484 }, { "epoch": 3.4978991596638656, "grad_norm": 0.7839692483507994, "learning_rate": 2.3507351713256105e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.21825388073921204, "step": 3330, "valid_targets_mean": 1961.4, "valid_targets_min": 837 }, { "epoch": 3.5031512605042017, "grad_norm": 0.6420384291551596, "learning_rate": 2.3455765495636353e-05, "loss": 0.2015, "loss_nan_ranks": 0, "loss_rank_avg": 0.20120246708393097, "step": 3335, "valid_targets_mean": 2840.8, "valid_targets_min": 815 }, { "epoch": 3.508403361344538, "grad_norm": 0.7332433509193245, "learning_rate": 2.3404155568883643e-05, "loss": 0.214, "loss_nan_ranks": 0, "loss_rank_avg": 0.23752212524414062, "step": 3340, "valid_targets_mean": 2502.9, "valid_targets_min": 1052 }, { "epoch": 3.513655462184874, "grad_norm": 0.7036254623505526, "learning_rate": 2.3352522287080625e-05, "loss": 0.2107, "loss_nan_ranks": 0, "loss_rank_avg": 0.22437232732772827, "step": 3345, "valid_targets_mean": 2470.9, "valid_targets_min": 750 }, { "epoch": 3.51890756302521, "grad_norm": 0.674241478442284, "learning_rate": 2.3300866004470182e-05, "loss": 0.2121, "loss_nan_ranks": 0, "loss_rank_avg": 0.23106199502944946, "step": 3350, "valid_targets_mean": 2678.7, "valid_targets_min": 1190 }, { "epoch": 3.524159663865546, "grad_norm": 0.6913901681322876, "learning_rate": 2.324918707545302e-05, "loss": 0.2085, "loss_nan_ranks": 0, "loss_rank_avg": 0.20624200999736786, "step": 3355, "valid_targets_mean": 2525.9, "valid_targets_min": 886 }, { "epoch": 3.5294117647058822, "grad_norm": 0.7215505447514452, "learning_rate": 2.3197485854585183e-05, "loss": 0.2074, "loss_nan_ranks": 0, "loss_rank_avg": 0.18115992844104767, "step": 3360, "valid_targets_mean": 1991.8, "valid_targets_min": 697 }, { "epoch": 3.5346638655462184, "grad_norm": 0.6339782709302462, "learning_rate": 2.3145762696575675e-05, "loss": 0.2014, "loss_nan_ranks": 0, "loss_rank_avg": 0.20273572206497192, "step": 3365, "valid_targets_mean": 3340.9, "valid_targets_min": 754 }, { "epoch": 3.5399159663865545, "grad_norm": 0.6976739706673805, "learning_rate": 2.3094017956283995e-05, "loss": 0.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.2007465362548828, "step": 3370, "valid_targets_mean": 2454.3, "valid_targets_min": 943 }, { "epoch": 3.5451680672268906, "grad_norm": 0.6726999837744964, "learning_rate": 2.3042251988717728e-05, "loss": 0.2006, "loss_nan_ranks": 0, "loss_rank_avg": 0.16553646326065063, "step": 3375, "valid_targets_mean": 2192.6, "valid_targets_min": 643 }, { "epoch": 3.5504201680672267, "grad_norm": 0.7301827373994265, "learning_rate": 2.2990465149030077e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.19199733436107635, "step": 3380, "valid_targets_mean": 2214.3, "valid_targets_min": 897 }, { "epoch": 3.5556722689075633, "grad_norm": 0.6670894246533184, "learning_rate": 2.2938657792517446e-05, "loss": 0.221, "loss_nan_ranks": 0, "loss_rank_avg": 0.2090798318386078, "step": 3385, "valid_targets_mean": 2772.3, "valid_targets_min": 660 }, { "epoch": 3.560924369747899, "grad_norm": 0.7737810251679192, "learning_rate": 2.2886830274617017e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.24221691489219666, "step": 3390, "valid_targets_mean": 2221.1, "valid_targets_min": 861 }, { "epoch": 3.5661764705882355, "grad_norm": 0.6681259679390096, "learning_rate": 2.2834982950904267e-05, "loss": 0.2107, "loss_nan_ranks": 0, "loss_rank_avg": 0.19659334421157837, "step": 3395, "valid_targets_mean": 2447.6, "valid_targets_min": 663 }, { "epoch": 3.571428571428571, "grad_norm": 0.8318412772228536, "learning_rate": 2.2783116177090573e-05, "loss": 0.2149, "loss_nan_ranks": 0, "loss_rank_avg": 0.22690819203853607, "step": 3400, "valid_targets_mean": 2100.6, "valid_targets_min": 650 }, { "epoch": 3.5766806722689077, "grad_norm": 0.6541716254669749, "learning_rate": 2.2731230309020762e-05, "loss": 0.2164, "loss_nan_ranks": 0, "loss_rank_avg": 0.19614872336387634, "step": 3405, "valid_targets_mean": 2690.9, "valid_targets_min": 896 }, { "epoch": 3.581932773109244, "grad_norm": 0.735048933666179, "learning_rate": 2.2679325702670642e-05, "loss": 0.2098, "loss_nan_ranks": 0, "loss_rank_avg": 0.22025522589683533, "step": 3410, "valid_targets_mean": 2054.1, "valid_targets_min": 814 }, { "epoch": 3.58718487394958, "grad_norm": 0.7432848251883631, "learning_rate": 2.2627402714144586e-05, "loss": 0.2058, "loss_nan_ranks": 0, "loss_rank_avg": 0.21356913447380066, "step": 3415, "valid_targets_mean": 2400.3, "valid_targets_min": 940 }, { "epoch": 3.592436974789916, "grad_norm": 0.6273611826621119, "learning_rate": 2.2575461699673085e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.21526393294334412, "step": 3420, "valid_targets_mean": 3208.0, "valid_targets_min": 1402 }, { "epoch": 3.597689075630252, "grad_norm": 0.6901843944101652, "learning_rate": 2.2523503015610303e-05, "loss": 0.2088, "loss_nan_ranks": 0, "loss_rank_avg": 0.21407434344291687, "step": 3425, "valid_targets_mean": 2472.9, "valid_targets_min": 703 }, { "epoch": 3.6029411764705883, "grad_norm": 0.6750339364655951, "learning_rate": 2.2471527018431637e-05, "loss": 0.2146, "loss_nan_ranks": 0, "loss_rank_avg": 0.2302270233631134, "step": 3430, "valid_targets_mean": 3292.7, "valid_targets_min": 943 }, { "epoch": 3.6081932773109244, "grad_norm": 0.6870012851485073, "learning_rate": 2.2419534064731238e-05, "loss": 0.2054, "loss_nan_ranks": 0, "loss_rank_avg": 0.2101989984512329, "step": 3435, "valid_targets_mean": 2430.9, "valid_targets_min": 578 }, { "epoch": 3.6134453781512605, "grad_norm": 0.7652411173135991, "learning_rate": 2.236752451121963e-05, "loss": 0.2181, "loss_nan_ranks": 0, "loss_rank_avg": 0.20987604558467865, "step": 3440, "valid_targets_mean": 2773.8, "valid_targets_min": 756 }, { "epoch": 3.6186974789915967, "grad_norm": 0.96702355486614, "learning_rate": 2.2315498714721198e-05, "loss": 0.2094, "loss_nan_ranks": 0, "loss_rank_avg": 0.2208380401134491, "step": 3445, "valid_targets_mean": 2227.6, "valid_targets_min": 589 }, { "epoch": 3.6239495798319328, "grad_norm": 0.7568581037232849, "learning_rate": 2.2263457032171762e-05, "loss": 0.2144, "loss_nan_ranks": 0, "loss_rank_avg": 0.20502294600009918, "step": 3450, "valid_targets_mean": 1974.8, "valid_targets_min": 650 }, { "epoch": 3.629201680672269, "grad_norm": 0.6324142287116146, "learning_rate": 2.2211399820616154e-05, "loss": 0.2017, "loss_nan_ranks": 0, "loss_rank_avg": 0.1848364919424057, "step": 3455, "valid_targets_mean": 2530.7, "valid_targets_min": 1356 }, { "epoch": 3.634453781512605, "grad_norm": 0.6787789057247168, "learning_rate": 2.2159327437205733e-05, "loss": 0.2202, "loss_nan_ranks": 0, "loss_rank_avg": 0.20259186625480652, "step": 3460, "valid_targets_mean": 2469.3, "valid_targets_min": 843 }, { "epoch": 3.639705882352941, "grad_norm": 0.6108458629326181, "learning_rate": 2.210724023919595e-05, "loss": 0.21, "loss_nan_ranks": 0, "loss_rank_avg": 0.21205033361911774, "step": 3465, "valid_targets_mean": 3304.5, "valid_targets_min": 683 }, { "epoch": 3.6449579831932772, "grad_norm": 0.7630702002273175, "learning_rate": 2.205513858394389e-05, "loss": 0.2093, "loss_nan_ranks": 0, "loss_rank_avg": 0.22506915032863617, "step": 3470, "valid_targets_mean": 2128.4, "valid_targets_min": 982 }, { "epoch": 3.6502100840336134, "grad_norm": 0.6853988147626505, "learning_rate": 2.2003022828905832e-05, "loss": 0.2047, "loss_nan_ranks": 0, "loss_rank_avg": 0.2102399468421936, "step": 3475, "valid_targets_mean": 2369.8, "valid_targets_min": 942 }, { "epoch": 3.6554621848739495, "grad_norm": 0.8205924816380262, "learning_rate": 2.19508933316348e-05, "loss": 0.2094, "loss_nan_ranks": 0, "loss_rank_avg": 0.2225526124238968, "step": 3480, "valid_targets_mean": 2051.9, "valid_targets_min": 627 }, { "epoch": 3.6607142857142856, "grad_norm": 0.7855685679107322, "learning_rate": 2.189875044977808e-05, "loss": 0.2142, "loss_nan_ranks": 0, "loss_rank_avg": 0.21352198719978333, "step": 3485, "valid_targets_mean": 2024.9, "valid_targets_min": 868 }, { "epoch": 3.6659663865546217, "grad_norm": 0.6891565684644114, "learning_rate": 2.1846594541074796e-05, "loss": 0.2067, "loss_nan_ranks": 0, "loss_rank_avg": 0.19370394945144653, "step": 3490, "valid_targets_mean": 2303.7, "valid_targets_min": 732 }, { "epoch": 3.671218487394958, "grad_norm": 0.66281123426459, "learning_rate": 2.179442596335345e-05, "loss": 0.2158, "loss_nan_ranks": 0, "loss_rank_avg": 0.21961744129657745, "step": 3495, "valid_targets_mean": 2835.9, "valid_targets_min": 771 }, { "epoch": 3.6764705882352944, "grad_norm": 0.6917997631532197, "learning_rate": 2.174224507452945e-05, "loss": 0.2227, "loss_nan_ranks": 0, "loss_rank_avg": 0.20729771256446838, "step": 3500, "valid_targets_mean": 2409.9, "valid_targets_min": 742 }, { "epoch": 3.68172268907563, "grad_norm": 0.7215177976056998, "learning_rate": 2.1690052232602677e-05, "loss": 0.2213, "loss_nan_ranks": 0, "loss_rank_avg": 0.24402323365211487, "step": 3505, "valid_targets_mean": 2753.1, "valid_targets_min": 670 }, { "epoch": 3.6869747899159666, "grad_norm": 0.6763541211099533, "learning_rate": 2.1637847795655022e-05, "loss": 0.2118, "loss_nan_ranks": 0, "loss_rank_avg": 0.21992330253124237, "step": 3510, "valid_targets_mean": 2720.9, "valid_targets_min": 700 }, { "epoch": 3.6922268907563023, "grad_norm": 0.6816841950766274, "learning_rate": 2.1585632121847925e-05, "loss": 0.2169, "loss_nan_ranks": 0, "loss_rank_avg": 0.19951927661895752, "step": 3515, "valid_targets_mean": 2837.1, "valid_targets_min": 743 }, { "epoch": 3.697478991596639, "grad_norm": 0.695061597525997, "learning_rate": 2.153340556941991e-05, "loss": 0.2147, "loss_nan_ranks": 0, "loss_rank_avg": 0.23091833293437958, "step": 3520, "valid_targets_mean": 2830.2, "valid_targets_min": 642 }, { "epoch": 3.7027310924369745, "grad_norm": 0.7145487481152861, "learning_rate": 2.1481168496684145e-05, "loss": 0.2152, "loss_nan_ranks": 0, "loss_rank_avg": 0.22669626772403717, "step": 3525, "valid_targets_mean": 2385.2, "valid_targets_min": 676 }, { "epoch": 3.707983193277311, "grad_norm": 0.773517958966538, "learning_rate": 2.142892126202597e-05, "loss": 0.2083, "loss_nan_ranks": 0, "loss_rank_avg": 0.20061250030994415, "step": 3530, "valid_targets_mean": 1901.8, "valid_targets_min": 620 }, { "epoch": 3.713235294117647, "grad_norm": 0.6514006030844219, "learning_rate": 2.137666422390045e-05, "loss": 0.2088, "loss_nan_ranks": 0, "loss_rank_avg": 0.21307383477687836, "step": 3535, "valid_targets_mean": 2973.2, "valid_targets_min": 819 }, { "epoch": 3.7184873949579833, "grad_norm": 0.6294462036244911, "learning_rate": 2.132439774082991e-05, "loss": 0.2197, "loss_nan_ranks": 0, "loss_rank_avg": 0.2212301641702652, "step": 3540, "valid_targets_mean": 3056.4, "valid_targets_min": 1194 }, { "epoch": 3.7237394957983194, "grad_norm": 0.654887046400427, "learning_rate": 2.1272122171401467e-05, "loss": 0.1945, "loss_nan_ranks": 0, "loss_rank_avg": 0.18347257375717163, "step": 3545, "valid_targets_mean": 2574.4, "valid_targets_min": 683 }, { "epoch": 3.7289915966386555, "grad_norm": 0.6809633747210387, "learning_rate": 2.1219837874264573e-05, "loss": 0.2024, "loss_nan_ranks": 0, "loss_rank_avg": 0.18207016587257385, "step": 3550, "valid_targets_mean": 2467.8, "valid_targets_min": 773 }, { "epoch": 3.7342436974789917, "grad_norm": 0.8490088878626119, "learning_rate": 2.116754520812857e-05, "loss": 0.2161, "loss_nan_ranks": 0, "loss_rank_avg": 0.21279117465019226, "step": 3555, "valid_targets_mean": 1938.0, "valid_targets_min": 917 }, { "epoch": 3.7394957983193278, "grad_norm": 0.7362797471450374, "learning_rate": 2.111524453176022e-05, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.2274627536535263, "step": 3560, "valid_targets_mean": 2261.9, "valid_targets_min": 655 }, { "epoch": 3.744747899159664, "grad_norm": 0.7547351585834484, "learning_rate": 2.1062936203981227e-05, "loss": 0.2208, "loss_nan_ranks": 0, "loss_rank_avg": 0.21145398914813995, "step": 3565, "valid_targets_mean": 2079.0, "valid_targets_min": 765 }, { "epoch": 3.75, "grad_norm": 0.6040282948873019, "learning_rate": 2.10106205836658e-05, "loss": 0.2067, "loss_nan_ranks": 0, "loss_rank_avg": 0.17291516065597534, "step": 3570, "valid_targets_mean": 2807.0, "valid_targets_min": 768 }, { "epoch": 3.755252100840336, "grad_norm": 0.7692191031763723, "learning_rate": 2.095829802973817e-05, "loss": 0.2149, "loss_nan_ranks": 0, "loss_rank_avg": 0.21016576886177063, "step": 3575, "valid_targets_mean": 2692.1, "valid_targets_min": 818 }, { "epoch": 3.7605042016806722, "grad_norm": 0.6937553318754113, "learning_rate": 2.090596890117016e-05, "loss": 0.211, "loss_nan_ranks": 0, "loss_rank_avg": 0.20397567749023438, "step": 3580, "valid_targets_mean": 2325.8, "valid_targets_min": 915 }, { "epoch": 3.7657563025210083, "grad_norm": 0.7298575781771081, "learning_rate": 2.0853633556978674e-05, "loss": 0.2089, "loss_nan_ranks": 0, "loss_rank_avg": 0.2305256426334381, "step": 3585, "valid_targets_mean": 2357.3, "valid_targets_min": 789 }, { "epoch": 3.7710084033613445, "grad_norm": 0.8229634474031364, "learning_rate": 2.0801292356223265e-05, "loss": 0.2235, "loss_nan_ranks": 0, "loss_rank_avg": 0.23045924305915833, "step": 3590, "valid_targets_mean": 1879.1, "valid_targets_min": 807 }, { "epoch": 3.7762605042016806, "grad_norm": 0.6135522966100759, "learning_rate": 2.0748945658003695e-05, "loss": 0.2116, "loss_nan_ranks": 0, "loss_rank_avg": 0.20716413855552673, "step": 3595, "valid_targets_mean": 3463.8, "valid_targets_min": 244 }, { "epoch": 3.7815126050420167, "grad_norm": 0.8109456213693356, "learning_rate": 2.0696593821457392e-05, "loss": 0.2199, "loss_nan_ranks": 0, "loss_rank_avg": 0.21201831102371216, "step": 3600, "valid_targets_mean": 2110.6, "valid_targets_min": 714 }, { "epoch": 3.786764705882353, "grad_norm": 0.7309833863162327, "learning_rate": 2.064423720575709e-05, "loss": 0.2172, "loss_nan_ranks": 0, "loss_rank_avg": 0.22593368589878082, "step": 3605, "valid_targets_mean": 2323.6, "valid_targets_min": 658 }, { "epoch": 3.792016806722689, "grad_norm": 0.6453442893544274, "learning_rate": 2.0591876170108257e-05, "loss": 0.2124, "loss_nan_ranks": 0, "loss_rank_avg": 0.22857289016246796, "step": 3610, "valid_targets_mean": 2964.2, "valid_targets_min": 739 }, { "epoch": 3.7972689075630255, "grad_norm": 1.045593114030177, "learning_rate": 2.0539511073746743e-05, "loss": 0.1914, "loss_nan_ranks": 0, "loss_rank_avg": 0.2170926183462143, "step": 3615, "valid_targets_mean": 2493.9, "valid_targets_min": 662 }, { "epoch": 3.802521008403361, "grad_norm": 0.685780352452399, "learning_rate": 2.0487142275936213e-05, "loss": 0.2002, "loss_nan_ranks": 0, "loss_rank_avg": 0.1872934252023697, "step": 3620, "valid_targets_mean": 2356.4, "valid_targets_min": 591 }, { "epoch": 3.8077731092436977, "grad_norm": 0.7579039345943492, "learning_rate": 2.0434770135965743e-05, "loss": 0.2121, "loss_nan_ranks": 0, "loss_rank_avg": 0.200333833694458, "step": 3625, "valid_targets_mean": 2157.2, "valid_targets_min": 620 }, { "epoch": 3.8130252100840334, "grad_norm": 0.6470297697973766, "learning_rate": 2.0382395013147347e-05, "loss": 0.2022, "loss_nan_ranks": 0, "loss_rank_avg": 0.19545529782772064, "step": 3630, "valid_targets_mean": 2711.9, "valid_targets_min": 1144 }, { "epoch": 3.81827731092437, "grad_norm": 0.653362214398331, "learning_rate": 2.033001726681349e-05, "loss": 0.2199, "loss_nan_ranks": 0, "loss_rank_avg": 0.21826599538326263, "step": 3635, "valid_targets_mean": 2853.1, "valid_targets_min": 1078 }, { "epoch": 3.8235294117647056, "grad_norm": 0.6867053178122183, "learning_rate": 2.027763725631463e-05, "loss": 0.2023, "loss_nan_ranks": 0, "loss_rank_avg": 0.19404883682727814, "step": 3640, "valid_targets_mean": 2482.8, "valid_targets_min": 1067 }, { "epoch": 3.828781512605042, "grad_norm": 0.7218696655921097, "learning_rate": 2.0225255341016794e-05, "loss": 0.2105, "loss_nan_ranks": 0, "loss_rank_avg": 0.1934603750705719, "step": 3645, "valid_targets_mean": 2152.1, "valid_targets_min": 824 }, { "epoch": 3.8340336134453783, "grad_norm": 0.7091556745123918, "learning_rate": 2.017287188029904e-05, "loss": 0.2038, "loss_nan_ranks": 0, "loss_rank_avg": 0.21000255644321442, "step": 3650, "valid_targets_mean": 2308.8, "valid_targets_min": 610 }, { "epoch": 3.8392857142857144, "grad_norm": 0.6815200778696167, "learning_rate": 2.0120487233551035e-05, "loss": 0.2187, "loss_nan_ranks": 0, "loss_rank_avg": 0.23103326559066772, "step": 3655, "valid_targets_mean": 2734.1, "valid_targets_min": 610 }, { "epoch": 3.8445378151260505, "grad_norm": 0.6280352447022034, "learning_rate": 2.006810176017059e-05, "loss": 0.2085, "loss_nan_ranks": 0, "loss_rank_avg": 0.21302129328250885, "step": 3660, "valid_targets_mean": 3324.1, "valid_targets_min": 1012 }, { "epoch": 3.8497899159663866, "grad_norm": 0.7066023629427282, "learning_rate": 2.0015715819561205e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.21427252888679504, "step": 3665, "valid_targets_mean": 2452.4, "valid_targets_min": 873 }, { "epoch": 3.8550420168067228, "grad_norm": 0.647316148786966, "learning_rate": 1.9963329771129558e-05, "loss": 0.1952, "loss_nan_ranks": 0, "loss_rank_avg": 0.1968604177236557, "step": 3670, "valid_targets_mean": 2530.9, "valid_targets_min": 1254 }, { "epoch": 3.860294117647059, "grad_norm": 0.6784605187933433, "learning_rate": 1.9910943974283066e-05, "loss": 0.2143, "loss_nan_ranks": 0, "loss_rank_avg": 0.2061229795217514, "step": 3675, "valid_targets_mean": 2622.5, "valid_targets_min": 841 }, { "epoch": 3.865546218487395, "grad_norm": 0.6920269949000379, "learning_rate": 1.9858558788427447e-05, "loss": 0.1973, "loss_nan_ranks": 0, "loss_rank_avg": 0.18967095017433167, "step": 3680, "valid_targets_mean": 2135.2, "valid_targets_min": 513 }, { "epoch": 3.870798319327731, "grad_norm": 0.7052959882420897, "learning_rate": 1.9806174572964205e-05, "loss": 0.2198, "loss_nan_ranks": 0, "loss_rank_avg": 0.20895016193389893, "step": 3685, "valid_targets_mean": 2395.5, "valid_targets_min": 859 }, { "epoch": 3.8760504201680672, "grad_norm": 0.6385724766539387, "learning_rate": 1.975379168728819e-05, "loss": 0.2136, "loss_nan_ranks": 0, "loss_rank_avg": 0.2081984281539917, "step": 3690, "valid_targets_mean": 2853.7, "valid_targets_min": 936 }, { "epoch": 3.8813025210084033, "grad_norm": 0.72510115733088, "learning_rate": 1.9701410490785128e-05, "loss": 0.2249, "loss_nan_ranks": 0, "loss_rank_avg": 0.22268277406692505, "step": 3695, "valid_targets_mean": 2524.2, "valid_targets_min": 694 }, { "epoch": 3.8865546218487395, "grad_norm": 0.7123147276422185, "learning_rate": 1.9649031342829178e-05, "loss": 0.2055, "loss_nan_ranks": 0, "loss_rank_avg": 0.22262287139892578, "step": 3700, "valid_targets_mean": 2540.8, "valid_targets_min": 746 }, { "epoch": 3.8918067226890756, "grad_norm": 0.6390925839310951, "learning_rate": 1.9596654602780398e-05, "loss": 0.2161, "loss_nan_ranks": 0, "loss_rank_avg": 0.19909490644931793, "step": 3705, "valid_targets_mean": 2773.2, "valid_targets_min": 853 }, { "epoch": 3.8970588235294117, "grad_norm": 0.6412477203773937, "learning_rate": 1.9544280629982364e-05, "loss": 0.2038, "loss_nan_ranks": 0, "loss_rank_avg": 0.1946112960577011, "step": 3710, "valid_targets_mean": 2642.8, "valid_targets_min": 849 }, { "epoch": 3.902310924369748, "grad_norm": 0.716484891233997, "learning_rate": 1.949190978375966e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.23176735639572144, "step": 3715, "valid_targets_mean": 2558.9, "valid_targets_min": 1150 }, { "epoch": 3.907563025210084, "grad_norm": 0.6768189969402229, "learning_rate": 1.9439542423415413e-05, "loss": 0.2018, "loss_nan_ranks": 0, "loss_rank_avg": 0.19778092205524445, "step": 3720, "valid_targets_mean": 2772.1, "valid_targets_min": 1107 }, { "epoch": 3.91281512605042, "grad_norm": 0.6207653385694745, "learning_rate": 1.9387178908228838e-05, "loss": 0.2181, "loss_nan_ranks": 0, "loss_rank_avg": 0.20920640230178833, "step": 3725, "valid_targets_mean": 3297.2, "valid_targets_min": 724 }, { "epoch": 3.918067226890756, "grad_norm": 0.7356716818302198, "learning_rate": 1.933481959745276e-05, "loss": 0.2218, "loss_nan_ranks": 0, "loss_rank_avg": 0.24886155128479004, "step": 3730, "valid_targets_mean": 2577.4, "valid_targets_min": 704 }, { "epoch": 3.9233193277310923, "grad_norm": 0.6771424238422388, "learning_rate": 1.9282464850311184e-05, "loss": 0.2115, "loss_nan_ranks": 0, "loss_rank_avg": 0.22557204961776733, "step": 3735, "valid_targets_mean": 2883.5, "valid_targets_min": 474 }, { "epoch": 3.928571428571429, "grad_norm": 0.7641048688976471, "learning_rate": 1.9230115025996764e-05, "loss": 0.208, "loss_nan_ranks": 0, "loss_rank_avg": 0.2032201588153839, "step": 3740, "valid_targets_mean": 1858.1, "valid_targets_min": 1143 }, { "epoch": 3.9338235294117645, "grad_norm": 0.5906821588122515, "learning_rate": 1.9177770483668416e-05, "loss": 0.2203, "loss_nan_ranks": 0, "loss_rank_avg": 0.1867651641368866, "step": 3745, "valid_targets_mean": 2936.9, "valid_targets_min": 646 }, { "epoch": 3.939075630252101, "grad_norm": 0.6203552861446046, "learning_rate": 1.912543158244881e-05, "loss": 0.2128, "loss_nan_ranks": 0, "loss_rank_avg": 0.19798970222473145, "step": 3750, "valid_targets_mean": 3003.4, "valid_targets_min": 617 }, { "epoch": 3.9443277310924367, "grad_norm": 0.7646340475457648, "learning_rate": 1.9073098681421895e-05, "loss": 0.2129, "loss_nan_ranks": 0, "loss_rank_avg": 0.19918084144592285, "step": 3755, "valid_targets_mean": 1886.4, "valid_targets_min": 545 }, { "epoch": 3.9495798319327733, "grad_norm": 0.6926521998600635, "learning_rate": 1.902077213963048e-05, "loss": 0.1995, "loss_nan_ranks": 0, "loss_rank_avg": 0.2141200602054596, "step": 3760, "valid_targets_mean": 2899.2, "valid_targets_min": 896 }, { "epoch": 3.9548319327731094, "grad_norm": 0.7157783415052118, "learning_rate": 1.896845231607372e-05, "loss": 0.1966, "loss_nan_ranks": 0, "loss_rank_avg": 0.19222521781921387, "step": 3765, "valid_targets_mean": 2013.7, "valid_targets_min": 780 }, { "epoch": 3.9600840336134455, "grad_norm": 0.8266386898112025, "learning_rate": 1.8916139569704704e-05, "loss": 0.2116, "loss_nan_ranks": 0, "loss_rank_avg": 0.22533836960792542, "step": 3770, "valid_targets_mean": 2034.5, "valid_targets_min": 656 }, { "epoch": 3.9653361344537816, "grad_norm": 0.8096944452658449, "learning_rate": 1.886383425942795e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.18177619576454163, "step": 3775, "valid_targets_mean": 1980.1, "valid_targets_min": 782 }, { "epoch": 3.9705882352941178, "grad_norm": 0.6708795853596977, "learning_rate": 1.8811536744096956e-05, "loss": 0.2115, "loss_nan_ranks": 0, "loss_rank_avg": 0.2508021593093872, "step": 3780, "valid_targets_mean": 2865.2, "valid_targets_min": 712 }, { "epoch": 3.975840336134454, "grad_norm": 0.6124622098856916, "learning_rate": 1.8759247382511748e-05, "loss": 0.2019, "loss_nan_ranks": 0, "loss_rank_avg": 0.21529731154441833, "step": 3785, "valid_targets_mean": 3260.9, "valid_targets_min": 772 }, { "epoch": 3.98109243697479, "grad_norm": 0.7245013981014534, "learning_rate": 1.8706966533416413e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.2099657505750656, "step": 3790, "valid_targets_mean": 2156.7, "valid_targets_min": 703 }, { "epoch": 3.986344537815126, "grad_norm": 0.7199624429982473, "learning_rate": 1.8654694555496624e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.2163430154323578, "step": 3795, "valid_targets_mean": 2900.4, "valid_targets_min": 1205 }, { "epoch": 3.991596638655462, "grad_norm": 0.7313432594209842, "learning_rate": 1.860243180737721e-05, "loss": 0.2097, "loss_nan_ranks": 0, "loss_rank_avg": 0.24018210172653198, "step": 3800, "valid_targets_mean": 2467.2, "valid_targets_min": 867 }, { "epoch": 3.9968487394957983, "grad_norm": 0.686344735243992, "learning_rate": 1.8550178647619664e-05, "loss": 0.2064, "loss_nan_ranks": 0, "loss_rank_avg": 0.2029697597026825, "step": 3805, "valid_targets_mean": 2462.6, "valid_targets_min": 853 }, { "epoch": 4.0021008403361344, "grad_norm": 0.5964545073234324, "learning_rate": 1.84979354347197e-05, "loss": 0.1972, "loss_nan_ranks": 0, "loss_rank_avg": 0.15941348671913147, "step": 3810, "valid_targets_mean": 2904.0, "valid_targets_min": 753 }, { "epoch": 4.007352941176471, "grad_norm": 0.6310111711662433, "learning_rate": 1.8445702527104782e-05, "loss": 0.1758, "loss_nan_ranks": 0, "loss_rank_avg": 0.17425957322120667, "step": 3815, "valid_targets_mean": 2903.4, "valid_targets_min": 1572 }, { "epoch": 4.012605042016807, "grad_norm": 0.8382816261281872, "learning_rate": 1.8393480283131677e-05, "loss": 0.1876, "loss_nan_ranks": 0, "loss_rank_avg": 0.1987411081790924, "step": 3820, "valid_targets_mean": 2029.4, "valid_targets_min": 824 }, { "epoch": 4.017857142857143, "grad_norm": 0.6828047242423465, "learning_rate": 1.8341269061083996e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.16214141249656677, "step": 3825, "valid_targets_mean": 2665.1, "valid_targets_min": 740 }, { "epoch": 4.023109243697479, "grad_norm": 0.6544969992637274, "learning_rate": 1.8289069219169717e-05, "loss": 0.1698, "loss_nan_ranks": 0, "loss_rank_avg": 0.15575842559337616, "step": 3830, "valid_targets_mean": 2708.9, "valid_targets_min": 741 }, { "epoch": 4.0283613445378155, "grad_norm": 0.665567823015263, "learning_rate": 1.8236881115518766e-05, "loss": 0.1769, "loss_nan_ranks": 0, "loss_rank_avg": 0.1710759848356247, "step": 3835, "valid_targets_mean": 2501.2, "valid_targets_min": 671 }, { "epoch": 4.033613445378151, "grad_norm": 0.8048649946622554, "learning_rate": 1.8184705108180516e-05, "loss": 0.1964, "loss_nan_ranks": 0, "loss_rank_avg": 0.21742048859596252, "step": 3840, "valid_targets_mean": 2245.1, "valid_targets_min": 819 }, { "epoch": 4.038865546218488, "grad_norm": 0.6730348979572065, "learning_rate": 1.8132541555121353e-05, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.17370149493217468, "step": 3845, "valid_targets_mean": 3004.6, "valid_targets_min": 697 }, { "epoch": 4.044117647058823, "grad_norm": 0.6773064122209941, "learning_rate": 1.808039081422223e-05, "loss": 0.1759, "loss_nan_ranks": 0, "loss_rank_avg": 0.177533358335495, "step": 3850, "valid_targets_mean": 2959.3, "valid_targets_min": 923 }, { "epoch": 4.04936974789916, "grad_norm": 0.8972828803367779, "learning_rate": 1.802825324327618e-05, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.19859957695007324, "step": 3855, "valid_targets_mean": 1707.2, "valid_targets_min": 642 }, { "epoch": 4.054621848739496, "grad_norm": 0.6816271881225173, "learning_rate": 1.7976129199985886e-05, "loss": 0.1863, "loss_nan_ranks": 0, "loss_rank_avg": 0.19027729332447052, "step": 3860, "valid_targets_mean": 2623.9, "valid_targets_min": 1048 }, { "epoch": 4.059873949579832, "grad_norm": 0.7082107239302485, "learning_rate": 1.7924019041961228e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.17302575707435608, "step": 3865, "valid_targets_mean": 2540.1, "valid_targets_min": 792 }, { "epoch": 4.065126050420168, "grad_norm": 0.781860364268105, "learning_rate": 1.7871923126716827e-05, "loss": 0.1827, "loss_nan_ranks": 0, "loss_rank_avg": 0.17314311861991882, "step": 3870, "valid_targets_mean": 1902.4, "valid_targets_min": 746 }, { "epoch": 4.070378151260504, "grad_norm": 0.770240331697946, "learning_rate": 1.7819841811669573e-05, "loss": 0.1726, "loss_nan_ranks": 0, "loss_rank_avg": 0.17767006158828735, "step": 3875, "valid_targets_mean": 2162.2, "valid_targets_min": 990 }, { "epoch": 4.07563025210084, "grad_norm": 0.7494050596565602, "learning_rate": 1.7767775454136194e-05, "loss": 0.1684, "loss_nan_ranks": 0, "loss_rank_avg": 0.16591396927833557, "step": 3880, "valid_targets_mean": 2518.5, "valid_targets_min": 870 }, { "epoch": 4.080882352941177, "grad_norm": 0.6697129284162905, "learning_rate": 1.7715724411330806e-05, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.1829383820295334, "step": 3885, "valid_targets_mean": 3106.3, "valid_targets_min": 627 }, { "epoch": 4.086134453781512, "grad_norm": 0.7339734064772027, "learning_rate": 1.7663689040362446e-05, "loss": 0.1872, "loss_nan_ranks": 0, "loss_rank_avg": 0.18020042777061462, "step": 3890, "valid_targets_mean": 2812.9, "valid_targets_min": 722 }, { "epoch": 4.091386554621849, "grad_norm": 0.7376435988375549, "learning_rate": 1.761166969823262e-05, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.15077045559883118, "step": 3895, "valid_targets_mean": 2092.4, "valid_targets_min": 865 }, { "epoch": 4.0966386554621845, "grad_norm": 0.6730357795335743, "learning_rate": 1.7559666741832896e-05, "loss": 0.187, "loss_nan_ranks": 0, "loss_rank_avg": 0.16643144190311432, "step": 3900, "valid_targets_mean": 2449.2, "valid_targets_min": 982 }, { "epoch": 4.101890756302521, "grad_norm": 0.8297442949389751, "learning_rate": 1.750768052794239e-05, "loss": 0.1927, "loss_nan_ranks": 0, "loss_rank_avg": 0.18952782452106476, "step": 3905, "valid_targets_mean": 1901.9, "valid_targets_min": 791 }, { "epoch": 4.107142857142857, "grad_norm": 0.794021570909151, "learning_rate": 1.7455711413225372e-05, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.19502568244934082, "step": 3910, "valid_targets_mean": 2269.1, "valid_targets_min": 930 }, { "epoch": 4.112394957983193, "grad_norm": 0.8070144150239097, "learning_rate": 1.7403759754228794e-05, "loss": 0.1795, "loss_nan_ranks": 0, "loss_rank_avg": 0.17317187786102295, "step": 3915, "valid_targets_mean": 1938.3, "valid_targets_min": 802 }, { "epoch": 4.117647058823529, "grad_norm": 0.6999096413433571, "learning_rate": 1.7351825907379837e-05, "loss": 0.1803, "loss_nan_ranks": 0, "loss_rank_avg": 0.1811293363571167, "step": 3920, "valid_targets_mean": 2730.1, "valid_targets_min": 912 }, { "epoch": 4.1228991596638656, "grad_norm": 0.7320665392327763, "learning_rate": 1.7299910228983513e-05, "loss": 0.1786, "loss_nan_ranks": 0, "loss_rank_avg": 0.1840408742427826, "step": 3925, "valid_targets_mean": 2366.4, "valid_targets_min": 1159 }, { "epoch": 4.128151260504202, "grad_norm": 0.7286921165522647, "learning_rate": 1.7248013075220128e-05, "loss": 0.1764, "loss_nan_ranks": 0, "loss_rank_avg": 0.17183949053287506, "step": 3930, "valid_targets_mean": 2257.6, "valid_targets_min": 886 }, { "epoch": 4.133403361344538, "grad_norm": 0.7113378690439488, "learning_rate": 1.7196134802142945e-05, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.1910371482372284, "step": 3935, "valid_targets_mean": 2610.0, "valid_targets_min": 974 }, { "epoch": 4.138655462184874, "grad_norm": 0.9815704878476788, "learning_rate": 1.7144275765675673e-05, "loss": 0.1737, "loss_nan_ranks": 0, "loss_rank_avg": 0.1488598883152008, "step": 3940, "valid_targets_mean": 2683.5, "valid_targets_min": 824 }, { "epoch": 4.14390756302521, "grad_norm": 0.6552007544862622, "learning_rate": 1.7092436321610042e-05, "loss": 0.1755, "loss_nan_ranks": 0, "loss_rank_avg": 0.17244458198547363, "step": 3945, "valid_targets_mean": 3017.2, "valid_targets_min": 706 }, { "epoch": 4.149159663865547, "grad_norm": 0.7250853653334564, "learning_rate": 1.704061682560336e-05, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.17147307097911835, "step": 3950, "valid_targets_mean": 2484.5, "valid_targets_min": 1216 }, { "epoch": 4.154411764705882, "grad_norm": 0.7570116394721385, "learning_rate": 1.698881763317609e-05, "loss": 0.1856, "loss_nan_ranks": 0, "loss_rank_avg": 0.19652274250984192, "step": 3955, "valid_targets_mean": 2825.2, "valid_targets_min": 1066 }, { "epoch": 4.159663865546219, "grad_norm": 0.7477767810091138, "learning_rate": 1.69370390997094e-05, "loss": 0.1868, "loss_nan_ranks": 0, "loss_rank_avg": 0.1591658890247345, "step": 3960, "valid_targets_mean": 2386.2, "valid_targets_min": 551 }, { "epoch": 4.1649159663865545, "grad_norm": 0.7313664660917486, "learning_rate": 1.6885281580442677e-05, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.18173372745513916, "step": 3965, "valid_targets_mean": 2462.9, "valid_targets_min": 816 }, { "epoch": 4.170168067226891, "grad_norm": 0.6878567291997353, "learning_rate": 1.6833545430471194e-05, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.16087912023067474, "step": 3970, "valid_targets_mean": 2534.8, "valid_targets_min": 920 }, { "epoch": 4.175420168067227, "grad_norm": 0.7273228101827134, "learning_rate": 1.678183100474359e-05, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.1902090162038803, "step": 3975, "valid_targets_mean": 2782.7, "valid_targets_min": 1105 }, { "epoch": 4.180672268907563, "grad_norm": 0.7924963064350935, "learning_rate": 1.6730138658059448e-05, "loss": 0.1784, "loss_nan_ranks": 0, "loss_rank_avg": 0.18615125119686127, "step": 3980, "valid_targets_mean": 2283.1, "valid_targets_min": 936 }, { "epoch": 4.185924369747899, "grad_norm": 0.7668376984218435, "learning_rate": 1.667846874506689e-05, "loss": 0.1724, "loss_nan_ranks": 0, "loss_rank_avg": 0.18692851066589355, "step": 3985, "valid_targets_mean": 2412.2, "valid_targets_min": 679 }, { "epoch": 4.1911764705882355, "grad_norm": 0.6979922592014087, "learning_rate": 1.662682162026012e-05, "loss": 0.183, "loss_nan_ranks": 0, "loss_rank_avg": 0.16892990469932556, "step": 3990, "valid_targets_mean": 2284.2, "valid_targets_min": 753 }, { "epoch": 4.196428571428571, "grad_norm": 0.7050681864554844, "learning_rate": 1.6575197637976995e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.19187793135643005, "step": 3995, "valid_targets_mean": 3008.6, "valid_targets_min": 775 }, { "epoch": 4.201680672268908, "grad_norm": 0.7383233513848826, "learning_rate": 1.652359715239661e-05, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.17365893721580505, "step": 4000, "valid_targets_mean": 2399.9, "valid_targets_min": 974 }, { "epoch": 4.206932773109243, "grad_norm": 0.7797983416724591, "learning_rate": 1.6472020517536828e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.17422497272491455, "step": 4005, "valid_targets_mean": 3114.1, "valid_targets_min": 839 }, { "epoch": 4.21218487394958, "grad_norm": 0.7864125547244055, "learning_rate": 1.6420468087251907e-05, "loss": 0.1807, "loss_nan_ranks": 0, "loss_rank_avg": 0.16865600645542145, "step": 4010, "valid_targets_mean": 1723.1, "valid_targets_min": 734 }, { "epoch": 4.217436974789916, "grad_norm": 0.7327097751903167, "learning_rate": 1.6368940215230026e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.16839268803596497, "step": 4015, "valid_targets_mean": 2459.2, "valid_targets_min": 818 }, { "epoch": 4.222689075630252, "grad_norm": 0.8238296453072825, "learning_rate": 1.6317437254990875e-05, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.1884918212890625, "step": 4020, "valid_targets_mean": 2194.0, "valid_targets_min": 782 }, { "epoch": 4.227941176470588, "grad_norm": 0.6460591633506324, "learning_rate": 1.626595955988325e-05, "loss": 0.1829, "loss_nan_ranks": 0, "loss_rank_avg": 0.20153161883354187, "step": 4025, "valid_targets_mean": 3779.9, "valid_targets_min": 1333 }, { "epoch": 4.233193277310924, "grad_norm": 0.7457345391565217, "learning_rate": 1.6214507483082593e-05, "loss": 0.1892, "loss_nan_ranks": 0, "loss_rank_avg": 0.19580884277820587, "step": 4030, "valid_targets_mean": 2798.9, "valid_targets_min": 740 }, { "epoch": 4.23844537815126, "grad_norm": 0.9377584690672369, "learning_rate": 1.6163081377588588e-05, "loss": 0.1822, "loss_nan_ranks": 0, "loss_rank_avg": 0.19530422985553741, "step": 4035, "valid_targets_mean": 2320.8, "valid_targets_min": 1065 }, { "epoch": 4.243697478991597, "grad_norm": 0.7042255194986914, "learning_rate": 1.6111681596222732e-05, "loss": 0.1858, "loss_nan_ranks": 0, "loss_rank_avg": 0.1799120008945465, "step": 4040, "valid_targets_mean": 2469.2, "valid_targets_min": 1188 }, { "epoch": 4.248949579831933, "grad_norm": 0.8657610459161533, "learning_rate": 1.606030849162593e-05, "loss": 0.1878, "loss_nan_ranks": 0, "loss_rank_avg": 0.17773385345935822, "step": 4045, "valid_targets_mean": 2067.2, "valid_targets_min": 801 }, { "epoch": 4.254201680672269, "grad_norm": 0.7170358815089117, "learning_rate": 1.600896241625605e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.17556703090667725, "step": 4050, "valid_targets_mean": 2699.3, "valid_targets_min": 1230 }, { "epoch": 4.2594537815126055, "grad_norm": 0.6997369617036321, "learning_rate": 1.5957643722385532e-05, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.18936964869499207, "step": 4055, "valid_targets_mean": 2953.2, "valid_targets_min": 1086 }, { "epoch": 4.264705882352941, "grad_norm": 0.6298850135767894, "learning_rate": 1.590635276209896e-05, "loss": 0.1793, "loss_nan_ranks": 0, "loss_rank_avg": 0.15947186946868896, "step": 4060, "valid_targets_mean": 3146.7, "valid_targets_min": 902 }, { "epoch": 4.269957983193278, "grad_norm": 0.7757297711293648, "learning_rate": 1.5855089887290634e-05, "loss": 0.1883, "loss_nan_ranks": 0, "loss_rank_avg": 0.1859544813632965, "step": 4065, "valid_targets_mean": 2376.6, "valid_targets_min": 889 }, { "epoch": 4.275210084033613, "grad_norm": 0.707196240386275, "learning_rate": 1.5803855449662175e-05, "loss": 0.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.17105159163475037, "step": 4070, "valid_targets_mean": 3088.3, "valid_targets_min": 777 }, { "epoch": 4.28046218487395, "grad_norm": 0.6412532070399728, "learning_rate": 1.5752649800720096e-05, "loss": 0.1827, "loss_nan_ranks": 0, "loss_rank_avg": 0.17575950920581818, "step": 4075, "valid_targets_mean": 3077.6, "valid_targets_min": 929 }, { "epoch": 4.285714285714286, "grad_norm": 0.7333503639293483, "learning_rate": 1.5701473291773395e-05, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.16692572832107544, "step": 4080, "valid_targets_mean": 2213.4, "valid_targets_min": 808 }, { "epoch": 4.290966386554622, "grad_norm": 0.7789248084874639, "learning_rate": 1.5650326273931166e-05, "loss": 0.1898, "loss_nan_ranks": 0, "loss_rank_avg": 0.18778863549232483, "step": 4085, "valid_targets_mean": 2436.8, "valid_targets_min": 692 }, { "epoch": 4.296218487394958, "grad_norm": 0.7608523839784216, "learning_rate": 1.559920909810016e-05, "loss": 0.1905, "loss_nan_ranks": 0, "loss_rank_avg": 0.18575254082679749, "step": 4090, "valid_targets_mean": 2774.9, "valid_targets_min": 720 }, { "epoch": 4.301470588235294, "grad_norm": 0.7894327029271562, "learning_rate": 1.5548122114982393e-05, "loss": 0.1838, "loss_nan_ranks": 0, "loss_rank_avg": 0.20460262894630432, "step": 4095, "valid_targets_mean": 2156.1, "valid_targets_min": 628 }, { "epoch": 4.30672268907563, "grad_norm": 0.7108371500394565, "learning_rate": 1.5497065675072728e-05, "loss": 0.174, "loss_nan_ranks": 0, "loss_rank_avg": 0.1754794716835022, "step": 4100, "valid_targets_mean": 2560.9, "valid_targets_min": 849 }, { "epoch": 4.311974789915967, "grad_norm": 0.7197950949390775, "learning_rate": 1.5446040128656485e-05, "loss": 0.182, "loss_nan_ranks": 0, "loss_rank_avg": 0.1896936446428299, "step": 4105, "valid_targets_mean": 2634.4, "valid_targets_min": 1256 }, { "epoch": 4.317226890756302, "grad_norm": 0.815627208196532, "learning_rate": 1.539504582580704e-05, "loss": 0.1888, "loss_nan_ranks": 0, "loss_rank_avg": 0.1940707117319107, "step": 4110, "valid_targets_mean": 2417.6, "valid_targets_min": 733 }, { "epoch": 4.322478991596639, "grad_norm": 0.6715019204570937, "learning_rate": 1.5344083116383395e-05, "loss": 0.1814, "loss_nan_ranks": 0, "loss_rank_avg": 0.16882187128067017, "step": 4115, "valid_targets_mean": 3112.1, "valid_targets_min": 910 }, { "epoch": 4.3277310924369745, "grad_norm": 0.8201097153549575, "learning_rate": 1.529315235002781e-05, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.18270252645015717, "step": 4120, "valid_targets_mean": 2153.9, "valid_targets_min": 973 }, { "epoch": 4.332983193277311, "grad_norm": 0.6915688934573623, "learning_rate": 1.5242253876163399e-05, "loss": 0.1911, "loss_nan_ranks": 0, "loss_rank_avg": 0.18757754564285278, "step": 4125, "valid_targets_mean": 3134.6, "valid_targets_min": 1432 }, { "epoch": 4.338235294117647, "grad_norm": 0.7700752339493685, "learning_rate": 1.5191388043991712e-05, "loss": 0.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.20721203088760376, "step": 4130, "valid_targets_mean": 2372.6, "valid_targets_min": 802 }, { "epoch": 4.343487394957983, "grad_norm": 0.7313076777239362, "learning_rate": 1.5140555202490359e-05, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.16860508918762207, "step": 4135, "valid_targets_mean": 2125.1, "valid_targets_min": 703 }, { "epoch": 4.348739495798319, "grad_norm": 0.7070894615662773, "learning_rate": 1.5089755700410602e-05, "loss": 0.1916, "loss_nan_ranks": 0, "loss_rank_avg": 0.1806333363056183, "step": 4140, "valid_targets_mean": 2950.4, "valid_targets_min": 1042 }, { "epoch": 4.3539915966386555, "grad_norm": 0.7047900654504996, "learning_rate": 1.5038989886274992e-05, "loss": 0.183, "loss_nan_ranks": 0, "loss_rank_avg": 0.17181357741355896, "step": 4145, "valid_targets_mean": 2456.4, "valid_targets_min": 728 }, { "epoch": 4.359243697478991, "grad_norm": 0.7947773694315373, "learning_rate": 1.498825810837492e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.1729154884815216, "step": 4150, "valid_targets_mean": 2260.0, "valid_targets_min": 596 }, { "epoch": 4.364495798319328, "grad_norm": 0.7438599144833491, "learning_rate": 1.4937560714768283e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.17960473895072937, "step": 4155, "valid_targets_mean": 2432.4, "valid_targets_min": 698 }, { "epoch": 4.369747899159664, "grad_norm": 0.771452228573944, "learning_rate": 1.4886898053277086e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.21052835881710052, "step": 4160, "valid_targets_mean": 2578.2, "valid_targets_min": 769 }, { "epoch": 4.375, "grad_norm": 0.6592959235985212, "learning_rate": 1.4836270471485029e-05, "loss": 0.1706, "loss_nan_ranks": 0, "loss_rank_avg": 0.18025822937488556, "step": 4165, "valid_targets_mean": 3174.4, "valid_targets_min": 850 }, { "epoch": 4.380252100840336, "grad_norm": 0.818888534502337, "learning_rate": 1.4785678316735144e-05, "loss": 0.1788, "loss_nan_ranks": 0, "loss_rank_avg": 0.1800573468208313, "step": 4170, "valid_targets_mean": 2206.2, "valid_targets_min": 658 }, { "epoch": 4.385504201680672, "grad_norm": 0.6949510487488129, "learning_rate": 1.4735121936127406e-05, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.15901532769203186, "step": 4175, "valid_targets_mean": 2460.3, "valid_targets_min": 309 }, { "epoch": 4.390756302521009, "grad_norm": 0.7369699549502026, "learning_rate": 1.4684601676516366e-05, "loss": 0.1779, "loss_nan_ranks": 0, "loss_rank_avg": 0.1716357171535492, "step": 4180, "valid_targets_mean": 2640.8, "valid_targets_min": 626 }, { "epoch": 4.3960084033613445, "grad_norm": 0.8430612932856147, "learning_rate": 1.4634117884508738e-05, "loss": 0.1757, "loss_nan_ranks": 0, "loss_rank_avg": 0.17793697118759155, "step": 4185, "valid_targets_mean": 1770.9, "valid_targets_min": 768 }, { "epoch": 4.401260504201681, "grad_norm": 0.7931502126995679, "learning_rate": 1.458367090646105e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.20347827672958374, "step": 4190, "valid_targets_mean": 2522.5, "valid_targets_min": 985 }, { "epoch": 4.406512605042017, "grad_norm": 0.7167848190563175, "learning_rate": 1.4533261088477257e-05, "loss": 0.1841, "loss_nan_ranks": 0, "loss_rank_avg": 0.18484370410442352, "step": 4195, "valid_targets_mean": 2692.8, "valid_targets_min": 747 }, { "epoch": 4.411764705882353, "grad_norm": 0.7138856506553442, "learning_rate": 1.448288877640637e-05, "loss": 0.1824, "loss_nan_ranks": 0, "loss_rank_avg": 0.1668294370174408, "step": 4200, "valid_targets_mean": 2518.8, "valid_targets_min": 654 }, { "epoch": 4.417016806722689, "grad_norm": 0.6504444444519508, "learning_rate": 1.4432554315840082e-05, "loss": 0.1783, "loss_nan_ranks": 0, "loss_rank_avg": 0.18564704060554504, "step": 4205, "valid_targets_mean": 3140.6, "valid_targets_min": 1135 }, { "epoch": 4.4222689075630255, "grad_norm": 0.8499270398136098, "learning_rate": 1.438225805211039e-05, "loss": 0.1818, "loss_nan_ranks": 0, "loss_rank_avg": 0.18404464423656464, "step": 4210, "valid_targets_mean": 1649.0, "valid_targets_min": 644 }, { "epoch": 4.427521008403361, "grad_norm": 0.715092529952324, "learning_rate": 1.4332000330287248e-05, "loss": 0.1821, "loss_nan_ranks": 0, "loss_rank_avg": 0.1709214150905609, "step": 4215, "valid_targets_mean": 2421.9, "valid_targets_min": 750 }, { "epoch": 4.432773109243698, "grad_norm": 0.7288642734691909, "learning_rate": 1.428178149517617e-05, "loss": 0.1939, "loss_nan_ranks": 0, "loss_rank_avg": 0.20450027287006378, "step": 4220, "valid_targets_mean": 2933.5, "valid_targets_min": 1024 }, { "epoch": 4.438025210084033, "grad_norm": 0.795039692170866, "learning_rate": 1.4231601891315876e-05, "loss": 0.192, "loss_nan_ranks": 0, "loss_rank_avg": 0.18002474308013916, "step": 4225, "valid_targets_mean": 2059.5, "valid_targets_min": 1001 }, { "epoch": 4.44327731092437, "grad_norm": 0.988082973084519, "learning_rate": 1.418146186297594e-05, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.18671777844429016, "step": 4230, "valid_targets_mean": 1872.4, "valid_targets_min": 814 }, { "epoch": 4.448529411764706, "grad_norm": 0.7931578128546755, "learning_rate": 1.413136175415441e-05, "loss": 0.1714, "loss_nan_ranks": 0, "loss_rank_avg": 0.19192029535770416, "step": 4235, "valid_targets_mean": 2010.4, "valid_targets_min": 848 }, { "epoch": 4.453781512605042, "grad_norm": 0.8177205538850968, "learning_rate": 1.4081301908575457e-05, "loss": 0.1848, "loss_nan_ranks": 0, "loss_rank_avg": 0.17905864119529724, "step": 4240, "valid_targets_mean": 1845.2, "valid_targets_min": 721 }, { "epoch": 4.459033613445378, "grad_norm": 0.7284329325277255, "learning_rate": 1.4031282669687035e-05, "loss": 0.1836, "loss_nan_ranks": 0, "loss_rank_avg": 0.1842656135559082, "step": 4245, "valid_targets_mean": 2472.1, "valid_targets_min": 1012 }, { "epoch": 4.464285714285714, "grad_norm": 0.7240658652686646, "learning_rate": 1.3981304380658474e-05, "loss": 0.1841, "loss_nan_ranks": 0, "loss_rank_avg": 0.19007527828216553, "step": 4250, "valid_targets_mean": 2486.7, "valid_targets_min": 739 }, { "epoch": 4.46953781512605, "grad_norm": 0.7916628114284047, "learning_rate": 1.3931367384378183e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.2028101086616516, "step": 4255, "valid_targets_mean": 2322.4, "valid_targets_min": 682 }, { "epoch": 4.474789915966387, "grad_norm": 0.7379642382110667, "learning_rate": 1.3881472023451262e-05, "loss": 0.1867, "loss_nan_ranks": 0, "loss_rank_avg": 0.18040382862091064, "step": 4260, "valid_targets_mean": 2429.3, "valid_targets_min": 812 }, { "epoch": 4.480042016806722, "grad_norm": 0.7027762915252015, "learning_rate": 1.3831618640197153e-05, "loss": 0.1781, "loss_nan_ranks": 0, "loss_rank_avg": 0.1830647736787796, "step": 4265, "valid_targets_mean": 2796.7, "valid_targets_min": 887 }, { "epoch": 4.485294117647059, "grad_norm": 0.716947336725011, "learning_rate": 1.3781807576647315e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.1749706119298935, "step": 4270, "valid_targets_mean": 2428.2, "valid_targets_min": 805 }, { "epoch": 4.4905462184873945, "grad_norm": 0.7292281203695309, "learning_rate": 1.373203917454285e-05, "loss": 0.1799, "loss_nan_ranks": 0, "loss_rank_avg": 0.1867130696773529, "step": 4275, "valid_targets_mean": 2838.0, "valid_targets_min": 1197 }, { "epoch": 4.495798319327731, "grad_norm": 0.7290851774469034, "learning_rate": 1.3682313775332186e-05, "loss": 0.1899, "loss_nan_ranks": 0, "loss_rank_avg": 0.16877129673957825, "step": 4280, "valid_targets_mean": 2704.8, "valid_targets_min": 694 }, { "epoch": 4.501050420168067, "grad_norm": 0.9037910643162406, "learning_rate": 1.3632631720168705e-05, "loss": 0.1801, "loss_nan_ranks": 0, "loss_rank_avg": 0.1778022050857544, "step": 4285, "valid_targets_mean": 1608.9, "valid_targets_min": 940 }, { "epoch": 4.506302521008403, "grad_norm": 0.7874366555714657, "learning_rate": 1.358299334990842e-05, "loss": 0.1771, "loss_nan_ranks": 0, "loss_rank_avg": 0.1755077838897705, "step": 4290, "valid_targets_mean": 2098.4, "valid_targets_min": 614 }, { "epoch": 4.51155462184874, "grad_norm": 0.8040088928448513, "learning_rate": 1.3533399005107635e-05, "loss": 0.198, "loss_nan_ranks": 0, "loss_rank_avg": 0.1978076994419098, "step": 4295, "valid_targets_mean": 2012.0, "valid_targets_min": 721 }, { "epoch": 4.516806722689076, "grad_norm": 0.6756346527241319, "learning_rate": 1.3483849026020603e-05, "loss": 0.1768, "loss_nan_ranks": 0, "loss_rank_avg": 0.17955875396728516, "step": 4300, "valid_targets_mean": 2901.0, "valid_targets_min": 857 }, { "epoch": 4.522058823529412, "grad_norm": 0.7127125041012732, "learning_rate": 1.3434343752597199e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.18654534220695496, "step": 4305, "valid_targets_mean": 2637.3, "valid_targets_min": 803 }, { "epoch": 4.527310924369748, "grad_norm": 0.6197339001895822, "learning_rate": 1.3384883524480576e-05, "loss": 0.1813, "loss_nan_ranks": 0, "loss_rank_avg": 0.15983977913856506, "step": 4310, "valid_targets_mean": 3360.6, "valid_targets_min": 991 }, { "epoch": 4.532563025210084, "grad_norm": 0.7186207642971952, "learning_rate": 1.333546868100486e-05, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.18633624911308289, "step": 4315, "valid_targets_mean": 2568.3, "valid_targets_min": 867 }, { "epoch": 4.53781512605042, "grad_norm": 0.6506719666430806, "learning_rate": 1.3286099561192784e-05, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.20066654682159424, "step": 4320, "valid_targets_mean": 3334.8, "valid_targets_min": 1078 }, { "epoch": 4.543067226890757, "grad_norm": 0.7139868060577005, "learning_rate": 1.3236776503753397e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.1832045167684555, "step": 4325, "valid_targets_mean": 2449.9, "valid_targets_min": 889 }, { "epoch": 4.548319327731092, "grad_norm": 0.8346149773596157, "learning_rate": 1.3187499847079713e-05, "loss": 0.1764, "loss_nan_ranks": 0, "loss_rank_avg": 0.17674115300178528, "step": 4330, "valid_targets_mean": 1668.5, "valid_targets_min": 788 }, { "epoch": 4.553571428571429, "grad_norm": 0.8581192326236325, "learning_rate": 1.3138269929246427e-05, "loss": 0.1752, "loss_nan_ranks": 0, "loss_rank_avg": 0.169841468334198, "step": 4335, "valid_targets_mean": 2480.5, "valid_targets_min": 758 }, { "epoch": 4.5588235294117645, "grad_norm": 0.6712603189184432, "learning_rate": 1.308908708800753e-05, "loss": 0.1947, "loss_nan_ranks": 0, "loss_rank_avg": 0.17790794372558594, "step": 4340, "valid_targets_mean": 3218.3, "valid_targets_min": 818 }, { "epoch": 4.564075630252101, "grad_norm": 0.8382631585908171, "learning_rate": 1.3039951660794063e-05, "loss": 0.188, "loss_nan_ranks": 0, "loss_rank_avg": 0.20454202592372894, "step": 4345, "valid_targets_mean": 2153.2, "valid_targets_min": 770 }, { "epoch": 4.569327731092437, "grad_norm": 0.7788139909395001, "learning_rate": 1.2990863984711773e-05, "loss": 0.181, "loss_nan_ranks": 0, "loss_rank_avg": 0.187415212392807, "step": 4350, "valid_targets_mean": 2221.0, "valid_targets_min": 784 }, { "epoch": 4.574579831932773, "grad_norm": 0.8228381865776829, "learning_rate": 1.294182439653878e-05, "loss": 0.1882, "loss_nan_ranks": 0, "loss_rank_avg": 0.2052648365497589, "step": 4355, "valid_targets_mean": 2024.1, "valid_targets_min": 819 }, { "epoch": 4.579831932773109, "grad_norm": 0.7969097110247945, "learning_rate": 1.2892833232723297e-05, "loss": 0.1863, "loss_nan_ranks": 0, "loss_rank_avg": 0.19444799423217773, "step": 4360, "valid_targets_mean": 2430.7, "valid_targets_min": 750 }, { "epoch": 4.5850840336134455, "grad_norm": 0.8950927024396919, "learning_rate": 1.2843890829381303e-05, "loss": 0.1819, "loss_nan_ranks": 0, "loss_rank_avg": 0.1735416203737259, "step": 4365, "valid_targets_mean": 1948.1, "valid_targets_min": 640 }, { "epoch": 4.590336134453781, "grad_norm": 0.7524319791833006, "learning_rate": 1.2794997522294263e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.17769590020179749, "step": 4370, "valid_targets_mean": 2317.9, "valid_targets_min": 917 }, { "epoch": 4.595588235294118, "grad_norm": 0.8185328703075273, "learning_rate": 1.2746153646906766e-05, "loss": 0.1722, "loss_nan_ranks": 0, "loss_rank_avg": 0.17284256219863892, "step": 4375, "valid_targets_mean": 1852.3, "valid_targets_min": 610 }, { "epoch": 4.600840336134453, "grad_norm": 0.8366151911421962, "learning_rate": 1.2697359538324303e-05, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.17999669909477234, "step": 4380, "valid_targets_mean": 2349.4, "valid_targets_min": 689 }, { "epoch": 4.60609243697479, "grad_norm": 0.74572952017287, "learning_rate": 1.2648615531310907e-05, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.18219012022018433, "step": 4385, "valid_targets_mean": 2272.4, "valid_targets_min": 914 }, { "epoch": 4.6113445378151265, "grad_norm": 0.7591238610620517, "learning_rate": 1.259992196028688e-05, "loss": 0.1772, "loss_nan_ranks": 0, "loss_rank_avg": 0.1870465874671936, "step": 4390, "valid_targets_mean": 2377.6, "valid_targets_min": 884 }, { "epoch": 4.616596638655462, "grad_norm": 0.7984813374731973, "learning_rate": 1.2551279159326495e-05, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.1903630644083023, "step": 4395, "valid_targets_mean": 2266.4, "valid_targets_min": 868 }, { "epoch": 4.621848739495798, "grad_norm": 0.7169284378785025, "learning_rate": 1.2502687462155709e-05, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.17516914010047913, "step": 4400, "valid_targets_mean": 2642.4, "valid_targets_min": 1050 }, { "epoch": 4.6271008403361344, "grad_norm": 0.7778626068632182, "learning_rate": 1.2454147202149865e-05, "loss": 0.1873, "loss_nan_ranks": 0, "loss_rank_avg": 0.18522366881370544, "step": 4405, "valid_targets_mean": 2276.4, "valid_targets_min": 621 }, { "epoch": 4.632352941176471, "grad_norm": 0.7163788723425591, "learning_rate": 1.2405658712331409e-05, "loss": 0.1718, "loss_nan_ranks": 0, "loss_rank_avg": 0.17094354331493378, "step": 4410, "valid_targets_mean": 2692.1, "valid_targets_min": 1078 }, { "epoch": 4.637605042016807, "grad_norm": 0.7021250334619412, "learning_rate": 1.2357222325367604e-05, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.2073124796152115, "step": 4415, "valid_targets_mean": 3277.5, "valid_targets_min": 998 }, { "epoch": 4.642857142857143, "grad_norm": 0.7042673790509252, "learning_rate": 1.2308838373568249e-05, "loss": 0.1788, "loss_nan_ranks": 0, "loss_rank_avg": 0.18093574047088623, "step": 4420, "valid_targets_mean": 3193.1, "valid_targets_min": 808 }, { "epoch": 4.648109243697479, "grad_norm": 0.7080962295239951, "learning_rate": 1.2260507188883395e-05, "loss": 0.1802, "loss_nan_ranks": 0, "loss_rank_avg": 0.179480642080307, "step": 4425, "valid_targets_mean": 2543.3, "valid_targets_min": 967 }, { "epoch": 4.6533613445378155, "grad_norm": 0.7498653248193045, "learning_rate": 1.2212229102901077e-05, "loss": 0.1869, "loss_nan_ranks": 0, "loss_rank_avg": 0.1921127885580063, "step": 4430, "valid_targets_mean": 2489.6, "valid_targets_min": 618 }, { "epoch": 4.658613445378151, "grad_norm": 0.7571679788787566, "learning_rate": 1.2164004446845037e-05, "loss": 0.1803, "loss_nan_ranks": 0, "loss_rank_avg": 0.19102567434310913, "step": 4435, "valid_targets_mean": 2422.0, "valid_targets_min": 692 }, { "epoch": 4.663865546218488, "grad_norm": 0.7458838101603535, "learning_rate": 1.2115833551572438e-05, "loss": 0.1937, "loss_nan_ranks": 0, "loss_rank_avg": 0.18319690227508545, "step": 4440, "valid_targets_mean": 2450.1, "valid_targets_min": 605 }, { "epoch": 4.669117647058823, "grad_norm": 0.7046359584542661, "learning_rate": 1.2067716747571616e-05, "loss": 0.1881, "loss_nan_ranks": 0, "loss_rank_avg": 0.1766650229692459, "step": 4445, "valid_targets_mean": 2313.4, "valid_targets_min": 843 }, { "epoch": 4.67436974789916, "grad_norm": 0.8345834489540149, "learning_rate": 1.201965436495978e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.19209042191505432, "step": 4450, "valid_targets_mean": 2150.6, "valid_targets_min": 962 }, { "epoch": 4.679621848739496, "grad_norm": 0.763774531100772, "learning_rate": 1.1971646733480784e-05, "loss": 0.1822, "loss_nan_ranks": 0, "loss_rank_avg": 0.20099681615829468, "step": 4455, "valid_targets_mean": 2721.1, "valid_targets_min": 1033 }, { "epoch": 4.684873949579832, "grad_norm": 0.6918104106739509, "learning_rate": 1.1923694182502848e-05, "loss": 0.1841, "loss_nan_ranks": 0, "loss_rank_avg": 0.17281074821949005, "step": 4460, "valid_targets_mean": 2406.6, "valid_targets_min": 978 }, { "epoch": 4.690126050420168, "grad_norm": 0.7551738929861327, "learning_rate": 1.1875797041016286e-05, "loss": 0.1825, "loss_nan_ranks": 0, "loss_rank_avg": 0.1859922856092453, "step": 4465, "valid_targets_mean": 2412.7, "valid_targets_min": 911 }, { "epoch": 4.695378151260504, "grad_norm": 0.7758417255586617, "learning_rate": 1.1827955637631283e-05, "loss": 0.1811, "loss_nan_ranks": 0, "loss_rank_avg": 0.16596679389476776, "step": 4470, "valid_targets_mean": 2247.4, "valid_targets_min": 833 }, { "epoch": 4.70063025210084, "grad_norm": 0.6806231945697778, "learning_rate": 1.1780170300575602e-05, "loss": 0.1812, "loss_nan_ranks": 0, "loss_rank_avg": 0.1946016550064087, "step": 4475, "valid_targets_mean": 3193.5, "valid_targets_min": 1143 }, { "epoch": 4.705882352941177, "grad_norm": 0.7375240636905129, "learning_rate": 1.1732441357692353e-05, "loss": 0.1871, "loss_nan_ranks": 0, "loss_rank_avg": 0.17887581884860992, "step": 4480, "valid_targets_mean": 2464.6, "valid_targets_min": 697 }, { "epoch": 4.711134453781512, "grad_norm": 0.7620340981837231, "learning_rate": 1.1684769136437742e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.19154343008995056, "step": 4485, "valid_targets_mean": 2281.2, "valid_targets_min": 803 }, { "epoch": 4.716386554621849, "grad_norm": 0.82056252467419, "learning_rate": 1.1637153963878815e-05, "loss": 0.1817, "loss_nan_ranks": 0, "loss_rank_avg": 0.19052766263484955, "step": 4490, "valid_targets_mean": 2145.5, "valid_targets_min": 661 }, { "epoch": 4.7216386554621845, "grad_norm": 0.7301286521046133, "learning_rate": 1.1589596166691231e-05, "loss": 0.1766, "loss_nan_ranks": 0, "loss_rank_avg": 0.1829635053873062, "step": 4495, "valid_targets_mean": 2482.4, "valid_targets_min": 659 }, { "epoch": 4.726890756302521, "grad_norm": 0.7903970658437431, "learning_rate": 1.1542096071157012e-05, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.1784076690673828, "step": 4500, "valid_targets_mean": 2605.2, "valid_targets_min": 950 }, { "epoch": 4.732142857142857, "grad_norm": 0.7637658355202966, "learning_rate": 1.1494654003162285e-05, "loss": 0.1745, "loss_nan_ranks": 0, "loss_rank_avg": 0.18634071946144104, "step": 4505, "valid_targets_mean": 2553.0, "valid_targets_min": 950 }, { "epoch": 4.737394957983193, "grad_norm": 0.7221781006332623, "learning_rate": 1.1447270288195089e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.17665636539459229, "step": 4510, "valid_targets_mean": 2349.6, "valid_targets_min": 847 }, { "epoch": 4.742647058823529, "grad_norm": 0.720008738864535, "learning_rate": 1.1399945251343114e-05, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.183954656124115, "step": 4515, "valid_targets_mean": 2651.1, "valid_targets_min": 963 }, { "epoch": 4.7478991596638656, "grad_norm": 0.7439764441972336, "learning_rate": 1.1352679217291457e-05, "loss": 0.1842, "loss_nan_ranks": 0, "loss_rank_avg": 0.18053632974624634, "step": 4520, "valid_targets_mean": 2257.0, "valid_targets_min": 656 }, { "epoch": 4.753151260504202, "grad_norm": 0.6873632051406735, "learning_rate": 1.1305472510320419e-05, "loss": 0.1783, "loss_nan_ranks": 0, "loss_rank_avg": 0.16327188909053802, "step": 4525, "valid_targets_mean": 2640.4, "valid_targets_min": 682 }, { "epoch": 4.758403361344538, "grad_norm": 0.7442947567531205, "learning_rate": 1.1258325454303286e-05, "loss": 0.195, "loss_nan_ranks": 0, "loss_rank_avg": 0.1675795316696167, "step": 4530, "valid_targets_mean": 2390.1, "valid_targets_min": 826 }, { "epoch": 4.7636554621848735, "grad_norm": 0.7354254137750549, "learning_rate": 1.1211238372704073e-05, "loss": 0.1887, "loss_nan_ranks": 0, "loss_rank_avg": 0.17392656207084656, "step": 4535, "valid_targets_mean": 2248.0, "valid_targets_min": 1064 }, { "epoch": 4.76890756302521, "grad_norm": 0.7224478673738945, "learning_rate": 1.1164211588575339e-05, "loss": 0.1845, "loss_nan_ranks": 0, "loss_rank_avg": 0.16614243388175964, "step": 4540, "valid_targets_mean": 2204.6, "valid_targets_min": 754 }, { "epoch": 4.774159663865547, "grad_norm": 0.6780397730456732, "learning_rate": 1.1117245424555967e-05, "loss": 0.1836, "loss_nan_ranks": 0, "loss_rank_avg": 0.17192646861076355, "step": 4545, "valid_targets_mean": 2732.8, "valid_targets_min": 635 }, { "epoch": 4.779411764705882, "grad_norm": 0.8114966919737321, "learning_rate": 1.1070340202868915e-05, "loss": 0.1715, "loss_nan_ranks": 0, "loss_rank_avg": 0.16627684235572815, "step": 4550, "valid_targets_mean": 2037.4, "valid_targets_min": 832 }, { "epoch": 4.784663865546219, "grad_norm": 0.7089064475714499, "learning_rate": 1.1023496245319056e-05, "loss": 0.1743, "loss_nan_ranks": 0, "loss_rank_avg": 0.20096446573734283, "step": 4555, "valid_targets_mean": 3190.9, "valid_targets_min": 1018 }, { "epoch": 4.7899159663865545, "grad_norm": 0.7629594666078792, "learning_rate": 1.0976713873290925e-05, "loss": 0.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.18434454500675201, "step": 4560, "valid_targets_mean": 2231.0, "valid_targets_min": 731 }, { "epoch": 4.795168067226891, "grad_norm": 0.7206103511159119, "learning_rate": 1.0929993407746543e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.1781184822320938, "step": 4565, "valid_targets_mean": 2413.1, "valid_targets_min": 924 }, { "epoch": 4.800420168067227, "grad_norm": 0.7319103361120156, "learning_rate": 1.0883335169223212e-05, "loss": 0.181, "loss_nan_ranks": 0, "loss_rank_avg": 0.19576598703861237, "step": 4570, "valid_targets_mean": 2644.1, "valid_targets_min": 1339 }, { "epoch": 4.805672268907563, "grad_norm": 0.7224561194750161, "learning_rate": 1.0836739477831297e-05, "loss": 0.1769, "loss_nan_ranks": 0, "loss_rank_avg": 0.16441801190376282, "step": 4575, "valid_targets_mean": 2237.8, "valid_targets_min": 776 }, { "epoch": 4.810924369747899, "grad_norm": 0.8825086906465849, "learning_rate": 1.0790206653252055e-05, "loss": 0.169, "loss_nan_ranks": 0, "loss_rank_avg": 0.18621914088726044, "step": 4580, "valid_targets_mean": 2011.2, "valid_targets_min": 631 }, { "epoch": 4.8161764705882355, "grad_norm": 0.6887944713418872, "learning_rate": 1.0743737014735434e-05, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.18349093198776245, "step": 4585, "valid_targets_mean": 2805.9, "valid_targets_min": 595 }, { "epoch": 4.821428571428571, "grad_norm": 0.8266516711323478, "learning_rate": 1.0697330881097857e-05, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.18345323204994202, "step": 4590, "valid_targets_mean": 2207.9, "valid_targets_min": 692 }, { "epoch": 4.826680672268908, "grad_norm": 0.7454608401910962, "learning_rate": 1.0650988570720077e-05, "loss": 0.1695, "loss_nan_ranks": 0, "loss_rank_avg": 0.16886943578720093, "step": 4595, "valid_targets_mean": 2130.4, "valid_targets_min": 837 }, { "epoch": 4.831932773109243, "grad_norm": 0.7525541827091601, "learning_rate": 1.0604710401544963e-05, "loss": 0.1889, "loss_nan_ranks": 0, "loss_rank_avg": 0.2049073427915573, "step": 4600, "valid_targets_mean": 2671.1, "valid_targets_min": 938 }, { "epoch": 4.83718487394958, "grad_norm": 0.7221773649936342, "learning_rate": 1.0558496691075318e-05, "loss": 0.1874, "loss_nan_ranks": 0, "loss_rank_avg": 0.18932510912418365, "step": 4605, "valid_targets_mean": 2382.8, "valid_targets_min": 533 }, { "epoch": 4.842436974789916, "grad_norm": 0.6282371291333917, "learning_rate": 1.0512347756371726e-05, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.18067455291748047, "step": 4610, "valid_targets_mean": 3488.6, "valid_targets_min": 1483 }, { "epoch": 4.847689075630252, "grad_norm": 0.7736804746763539, "learning_rate": 1.0466263914050362e-05, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.187209352850914, "step": 4615, "valid_targets_mean": 2130.1, "valid_targets_min": 1190 }, { "epoch": 4.852941176470588, "grad_norm": 0.8194923770615844, "learning_rate": 1.0420245480280804e-05, "loss": 0.1711, "loss_nan_ranks": 0, "loss_rank_avg": 0.19902583956718445, "step": 4620, "valid_targets_mean": 2030.2, "valid_targets_min": 870 }, { "epoch": 4.858193277310924, "grad_norm": 0.7237311731603411, "learning_rate": 1.0374292770783891e-05, "loss": 0.1885, "loss_nan_ranks": 0, "loss_rank_avg": 0.18148672580718994, "step": 4625, "valid_targets_mean": 2961.3, "valid_targets_min": 597 }, { "epoch": 4.86344537815126, "grad_norm": 0.6669660493298567, "learning_rate": 1.0328406100829542e-05, "loss": 0.1876, "loss_nan_ranks": 0, "loss_rank_avg": 0.17993488907814026, "step": 4630, "valid_targets_mean": 3014.6, "valid_targets_min": 634 }, { "epoch": 4.868697478991597, "grad_norm": 0.8700432106817276, "learning_rate": 1.0282585785234578e-05, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.18658801913261414, "step": 4635, "valid_targets_mean": 1932.2, "valid_targets_min": 930 }, { "epoch": 4.873949579831933, "grad_norm": 0.6217143473547485, "learning_rate": 1.023683213836061e-05, "loss": 0.1788, "loss_nan_ranks": 0, "loss_rank_avg": 0.1737050712108612, "step": 4640, "valid_targets_mean": 3531.2, "valid_targets_min": 844 }, { "epoch": 4.879201680672269, "grad_norm": 0.9539626771397886, "learning_rate": 1.0191145474111823e-05, "loss": 0.1846, "loss_nan_ranks": 0, "loss_rank_avg": 0.19349545240402222, "step": 4645, "valid_targets_mean": 1414.2, "valid_targets_min": 746 }, { "epoch": 4.884453781512605, "grad_norm": 0.6923182425799058, "learning_rate": 1.0145526105932872e-05, "loss": 0.1712, "loss_nan_ranks": 0, "loss_rank_avg": 0.16115731000900269, "step": 4650, "valid_targets_mean": 2663.4, "valid_targets_min": 814 }, { "epoch": 4.889705882352941, "grad_norm": 0.6914625755370188, "learning_rate": 1.0099974346806714e-05, "loss": 0.1916, "loss_nan_ranks": 0, "loss_rank_avg": 0.1792561411857605, "step": 4655, "valid_targets_mean": 2781.5, "valid_targets_min": 1252 }, { "epoch": 4.894957983193278, "grad_norm": 0.7734782088863728, "learning_rate": 1.0054490509252423e-05, "loss": 0.191, "loss_nan_ranks": 0, "loss_rank_avg": 0.20624291896820068, "step": 4660, "valid_targets_mean": 2440.4, "valid_targets_min": 759 }, { "epoch": 4.900210084033613, "grad_norm": 0.7941952415974891, "learning_rate": 1.0009074905323118e-05, "loss": 0.1686, "loss_nan_ranks": 0, "loss_rank_avg": 0.17345239222049713, "step": 4665, "valid_targets_mean": 2916.6, "valid_targets_min": 1297 }, { "epoch": 4.90546218487395, "grad_norm": 0.8030163177897169, "learning_rate": 9.963727846603784e-06, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.18559759855270386, "step": 4670, "valid_targets_mean": 2144.8, "valid_targets_min": 987 }, { "epoch": 4.910714285714286, "grad_norm": 0.7030553547126519, "learning_rate": 9.918449644209087e-06, "loss": 0.1852, "loss_nan_ranks": 0, "loss_rank_avg": 0.18912020325660706, "step": 4675, "valid_targets_mean": 2720.7, "valid_targets_min": 1084 }, { "epoch": 4.915966386554622, "grad_norm": 0.6845418285443712, "learning_rate": 9.873240608781341e-06, "loss": 0.182, "loss_nan_ranks": 0, "loss_rank_avg": 0.202968031167984, "step": 4680, "valid_targets_mean": 3153.9, "valid_targets_min": 1043 }, { "epoch": 4.921218487394958, "grad_norm": 0.7655672446200298, "learning_rate": 9.828101050488308e-06, "loss": 0.1873, "loss_nan_ranks": 0, "loss_rank_avg": 0.18019559979438782, "step": 4685, "valid_targets_mean": 1993.6, "valid_targets_min": 1195 }, { "epoch": 4.926470588235294, "grad_norm": 0.7622908992963848, "learning_rate": 9.783031279021063e-06, "loss": 0.1795, "loss_nan_ranks": 0, "loss_rank_avg": 0.19854578375816345, "step": 4690, "valid_targets_mean": 2434.5, "valid_targets_min": 1013 }, { "epoch": 4.93172268907563, "grad_norm": 0.7356813022171075, "learning_rate": 9.738031603591926e-06, "loss": 0.1864, "loss_nan_ranks": 0, "loss_rank_avg": 0.1860363483428955, "step": 4695, "valid_targets_mean": 2400.0, "valid_targets_min": 934 }, { "epoch": 4.936974789915967, "grad_norm": 0.720810615748148, "learning_rate": 9.69310233293227e-06, "loss": 0.1853, "loss_nan_ranks": 0, "loss_rank_avg": 0.1856434941291809, "step": 4700, "valid_targets_mean": 2621.8, "valid_targets_min": 1276 }, { "epoch": 4.942226890756302, "grad_norm": 0.7063545010234002, "learning_rate": 9.648243775290476e-06, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.16022886335849762, "step": 4705, "valid_targets_mean": 2576.8, "valid_targets_min": 1221 }, { "epoch": 4.947478991596639, "grad_norm": 0.7386993073314914, "learning_rate": 9.60345623842974e-06, "loss": 0.1793, "loss_nan_ranks": 0, "loss_rank_avg": 0.17438361048698425, "step": 4710, "valid_targets_mean": 2572.9, "valid_targets_min": 715 }, { "epoch": 4.9527310924369745, "grad_norm": 0.7347227314045449, "learning_rate": 9.558740029626046e-06, "loss": 0.1749, "loss_nan_ranks": 0, "loss_rank_avg": 0.1749304234981537, "step": 4715, "valid_targets_mean": 2584.6, "valid_targets_min": 612 }, { "epoch": 4.957983193277311, "grad_norm": 0.728403778635231, "learning_rate": 9.51409545566597e-06, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.18584081530570984, "step": 4720, "valid_targets_mean": 2500.6, "valid_targets_min": 660 }, { "epoch": 4.963235294117647, "grad_norm": 0.7578264772501891, "learning_rate": 9.469522822844663e-06, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.1682163029909134, "step": 4725, "valid_targets_mean": 2061.4, "valid_targets_min": 691 }, { "epoch": 4.968487394957983, "grad_norm": 0.7750388844604879, "learning_rate": 9.425022436963664e-06, "loss": 0.1932, "loss_nan_ranks": 0, "loss_rank_avg": 0.19586464762687683, "step": 4730, "valid_targets_mean": 2407.8, "valid_targets_min": 657 }, { "epoch": 4.973739495798319, "grad_norm": 0.7766444281597565, "learning_rate": 9.380594603328875e-06, "loss": 0.1984, "loss_nan_ranks": 0, "loss_rank_avg": 0.2102508395910263, "step": 4735, "valid_targets_mean": 2843.3, "valid_targets_min": 639 }, { "epoch": 4.9789915966386555, "grad_norm": 0.760942443434771, "learning_rate": 9.336239626748432e-06, "loss": 0.1806, "loss_nan_ranks": 0, "loss_rank_avg": 0.17757880687713623, "step": 4740, "valid_targets_mean": 2666.6, "valid_targets_min": 825 }, { "epoch": 4.984243697478991, "grad_norm": 0.7731058692289628, "learning_rate": 9.291957811530602e-06, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.18547788262367249, "step": 4745, "valid_targets_mean": 2214.3, "valid_targets_min": 760 }, { "epoch": 4.989495798319328, "grad_norm": 0.700031528165842, "learning_rate": 9.247749461481712e-06, "loss": 0.1696, "loss_nan_ranks": 0, "loss_rank_avg": 0.18496280908584595, "step": 4750, "valid_targets_mean": 2794.8, "valid_targets_min": 945 }, { "epoch": 4.994747899159664, "grad_norm": 0.6273143784305558, "learning_rate": 9.203614879904083e-06, "loss": 0.1798, "loss_nan_ranks": 0, "loss_rank_avg": 0.15987840294837952, "step": 4755, "valid_targets_mean": 3185.1, "valid_targets_min": 1250 }, { "epoch": 5.0, "grad_norm": 0.6788365442881951, "learning_rate": 9.159554369593901e-06, "loss": 0.1866, "loss_nan_ranks": 0, "loss_rank_avg": 0.17320957779884338, "step": 4760, "valid_targets_mean": 2633.3, "valid_targets_min": 687 }, { "epoch": 5.005252100840337, "grad_norm": 0.7483605516753753, "learning_rate": 9.115568232839193e-06, "loss": 0.1509, "loss_nan_ranks": 0, "loss_rank_avg": 0.12966476380825043, "step": 4765, "valid_targets_mean": 1753.9, "valid_targets_min": 881 }, { "epoch": 5.010504201680672, "grad_norm": 0.7211521050334696, "learning_rate": 9.071656771417721e-06, "loss": 0.1588, "loss_nan_ranks": 0, "loss_rank_avg": 0.16123877465724945, "step": 4770, "valid_targets_mean": 2470.6, "valid_targets_min": 1058 }, { "epoch": 5.015756302521009, "grad_norm": 0.7296273456769096, "learning_rate": 9.027820286594902e-06, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.14505019783973694, "step": 4775, "valid_targets_mean": 2658.1, "valid_targets_min": 1128 }, { "epoch": 5.0210084033613445, "grad_norm": 0.7817862758275839, "learning_rate": 8.984059079121785e-06, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.15351414680480957, "step": 4780, "valid_targets_mean": 2114.3, "valid_targets_min": 589 }, { "epoch": 5.026260504201681, "grad_norm": 0.7668268893222531, "learning_rate": 8.940373449232935e-06, "loss": 0.1666, "loss_nan_ranks": 0, "loss_rank_avg": 0.16739562153816223, "step": 4785, "valid_targets_mean": 2364.6, "valid_targets_min": 802 }, { "epoch": 5.031512605042017, "grad_norm": 0.820070132627084, "learning_rate": 8.896763696644405e-06, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.15973633527755737, "step": 4790, "valid_targets_mean": 1928.4, "valid_targets_min": 740 }, { "epoch": 5.036764705882353, "grad_norm": 0.7252481874686856, "learning_rate": 8.853230120551693e-06, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.14669166505336761, "step": 4795, "valid_targets_mean": 2317.4, "valid_targets_min": 790 }, { "epoch": 5.042016806722689, "grad_norm": 0.8044647525929012, "learning_rate": 8.809773019627635e-06, "loss": 0.1566, "loss_nan_ranks": 0, "loss_rank_avg": 0.17486470937728882, "step": 4800, "valid_targets_mean": 2453.2, "valid_targets_min": 864 }, { "epoch": 5.0472689075630255, "grad_norm": 0.7168891105498033, "learning_rate": 8.766392692020413e-06, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.16313612461090088, "step": 4805, "valid_targets_mean": 3045.1, "valid_targets_min": 1015 }, { "epoch": 5.052521008403361, "grad_norm": 0.8391271783579383, "learning_rate": 8.723089435351497e-06, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.17179730534553528, "step": 4810, "valid_targets_mean": 2010.1, "valid_targets_min": 836 }, { "epoch": 5.057773109243698, "grad_norm": 0.7301522003326225, "learning_rate": 8.679863546713559e-06, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.17533841729164124, "step": 4815, "valid_targets_mean": 3249.5, "valid_targets_min": 611 }, { "epoch": 5.063025210084033, "grad_norm": 0.886339846842999, "learning_rate": 8.636715322668498e-06, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.16565924882888794, "step": 4820, "valid_targets_mean": 2003.6, "valid_targets_min": 908 }, { "epoch": 5.06827731092437, "grad_norm": 0.7726449898609571, "learning_rate": 8.593645059245365e-06, "loss": 0.1668, "loss_nan_ranks": 0, "loss_rank_avg": 0.15337593853473663, "step": 4825, "valid_targets_mean": 2167.6, "valid_targets_min": 740 }, { "epoch": 5.073529411764706, "grad_norm": 0.7695203697189681, "learning_rate": 8.550653051938333e-06, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.1670958697795868, "step": 4830, "valid_targets_mean": 2386.7, "valid_targets_min": 755 }, { "epoch": 5.078781512605042, "grad_norm": 0.8074962356870891, "learning_rate": 8.507739595704695e-06, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.1489427387714386, "step": 4835, "valid_targets_mean": 2025.5, "valid_targets_min": 703 }, { "epoch": 5.084033613445378, "grad_norm": 0.8716776759288114, "learning_rate": 8.464904984962832e-06, "loss": 0.1634, "loss_nan_ranks": 0, "loss_rank_avg": 0.16994109749794006, "step": 4840, "valid_targets_mean": 2000.9, "valid_targets_min": 679 }, { "epoch": 5.089285714285714, "grad_norm": 0.8076509459810718, "learning_rate": 8.422149513590151e-06, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.17325329780578613, "step": 4845, "valid_targets_mean": 2370.3, "valid_targets_min": 537 }, { "epoch": 5.09453781512605, "grad_norm": 0.8070190471856774, "learning_rate": 8.37947347492115e-06, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.15762285888195038, "step": 4850, "valid_targets_mean": 2040.4, "valid_targets_min": 621 }, { "epoch": 5.099789915966387, "grad_norm": 0.74092533277044, "learning_rate": 8.33687716174532e-06, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.16209125518798828, "step": 4855, "valid_targets_mean": 2598.8, "valid_targets_min": 669 }, { "epoch": 5.105042016806722, "grad_norm": 0.860251504616201, "learning_rate": 8.294360866305192e-06, "loss": 0.1628, "loss_nan_ranks": 0, "loss_rank_avg": 0.15497906506061554, "step": 4860, "valid_targets_mean": 2211.9, "valid_targets_min": 1015 }, { "epoch": 5.110294117647059, "grad_norm": 0.7907729718003471, "learning_rate": 8.251924880294317e-06, "loss": 0.1666, "loss_nan_ranks": 0, "loss_rank_avg": 0.16414563357830048, "step": 4865, "valid_targets_mean": 2080.1, "valid_targets_min": 919 }, { "epoch": 5.1155462184873945, "grad_norm": 0.8047837776866085, "learning_rate": 8.20956949485527e-06, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.15285125374794006, "step": 4870, "valid_targets_mean": 1991.6, "valid_targets_min": 571 }, { "epoch": 5.120798319327731, "grad_norm": 0.7304681966773338, "learning_rate": 8.167295000577622e-06, "loss": 0.1693, "loss_nan_ranks": 0, "loss_rank_avg": 0.15932945907115936, "step": 4875, "valid_targets_mean": 2356.6, "valid_targets_min": 621 }, { "epoch": 5.126050420168067, "grad_norm": 0.7843064737707304, "learning_rate": 8.125101687496e-06, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.1509605348110199, "step": 4880, "valid_targets_mean": 2156.1, "valid_targets_min": 945 }, { "epoch": 5.131302521008403, "grad_norm": 0.6507131542748491, "learning_rate": 8.082989845088038e-06, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.168035089969635, "step": 4885, "valid_targets_mean": 3697.9, "valid_targets_min": 1139 }, { "epoch": 5.13655462184874, "grad_norm": 0.7983692941356186, "learning_rate": 8.040959762272441e-06, "loss": 0.1711, "loss_nan_ranks": 0, "loss_rank_avg": 0.17778906226158142, "step": 4890, "valid_targets_mean": 2277.1, "valid_targets_min": 596 }, { "epoch": 5.141806722689076, "grad_norm": 0.717526944817668, "learning_rate": 7.999011727406995e-06, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.1474049985408783, "step": 4895, "valid_targets_mean": 3174.6, "valid_targets_min": 753 }, { "epoch": 5.147058823529412, "grad_norm": 0.6501295927520986, "learning_rate": 7.957146028286524e-06, "loss": 0.159, "loss_nan_ranks": 0, "loss_rank_avg": 0.15974193811416626, "step": 4900, "valid_targets_mean": 3719.8, "valid_targets_min": 786 }, { "epoch": 5.152310924369748, "grad_norm": 0.7634163772813823, "learning_rate": 7.915362952141017e-06, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.13993379473686218, "step": 4905, "valid_targets_mean": 2612.3, "valid_targets_min": 679 }, { "epoch": 5.157563025210084, "grad_norm": 0.8229169359259055, "learning_rate": 7.873662785633594e-06, "loss": 0.1627, "loss_nan_ranks": 0, "loss_rank_avg": 0.17392058670520782, "step": 4910, "valid_targets_mean": 2420.1, "valid_targets_min": 685 }, { "epoch": 5.16281512605042, "grad_norm": 0.8391334241227872, "learning_rate": 7.832045814858538e-06, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.15847104787826538, "step": 4915, "valid_targets_mean": 2340.0, "valid_targets_min": 703 }, { "epoch": 5.168067226890757, "grad_norm": 0.7113772435226458, "learning_rate": 7.790512325339367e-06, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.17543965578079224, "step": 4920, "valid_targets_mean": 2999.2, "valid_targets_min": 1254 }, { "epoch": 5.173319327731092, "grad_norm": 0.8373320616460568, "learning_rate": 7.74906260202685e-06, "loss": 0.1666, "loss_nan_ranks": 0, "loss_rank_avg": 0.16569611430168152, "step": 4925, "valid_targets_mean": 2456.8, "valid_targets_min": 704 }, { "epoch": 5.178571428571429, "grad_norm": 0.756975477682416, "learning_rate": 7.707696929297053e-06, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.15648490190505981, "step": 4930, "valid_targets_mean": 2480.5, "valid_targets_min": 789 }, { "epoch": 5.1838235294117645, "grad_norm": 0.841074398063682, "learning_rate": 7.666415590949382e-06, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.16663537919521332, "step": 4935, "valid_targets_mean": 2205.2, "valid_targets_min": 817 }, { "epoch": 5.189075630252101, "grad_norm": 0.8588889722655582, "learning_rate": 7.625218870204676e-06, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.16082826256752014, "step": 4940, "valid_targets_mean": 2507.4, "valid_targets_min": 765 }, { "epoch": 5.194327731092437, "grad_norm": 0.7390042440173223, "learning_rate": 7.584107049703195e-06, "loss": 0.1645, "loss_nan_ranks": 0, "loss_rank_avg": 0.15865691006183624, "step": 4945, "valid_targets_mean": 2532.7, "valid_targets_min": 780 }, { "epoch": 5.199579831932773, "grad_norm": 0.7806217716341791, "learning_rate": 7.5430804115027615e-06, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.15922147035598755, "step": 4950, "valid_targets_mean": 2130.4, "valid_targets_min": 791 }, { "epoch": 5.204831932773109, "grad_norm": 0.6872497366416, "learning_rate": 7.502139237076744e-06, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.16006314754486084, "step": 4955, "valid_targets_mean": 3239.2, "valid_targets_min": 656 }, { "epoch": 5.2100840336134455, "grad_norm": 0.8265925780625734, "learning_rate": 7.461283807312194e-06, "loss": 0.159, "loss_nan_ranks": 0, "loss_rank_avg": 0.15462356805801392, "step": 4960, "valid_targets_mean": 2074.3, "valid_targets_min": 736 }, { "epoch": 5.215336134453781, "grad_norm": 0.8400103721164567, "learning_rate": 7.420514402507886e-06, "loss": 0.1716, "loss_nan_ranks": 0, "loss_rank_avg": 0.16285106539726257, "step": 4965, "valid_targets_mean": 2134.1, "valid_targets_min": 567 }, { "epoch": 5.220588235294118, "grad_norm": 0.7819781182832531, "learning_rate": 7.379831302372389e-06, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.15541312098503113, "step": 4970, "valid_targets_mean": 2262.2, "valid_targets_min": 567 }, { "epoch": 5.225840336134453, "grad_norm": 0.8105251128609028, "learning_rate": 7.3392347860221556e-06, "loss": 0.1707, "loss_nan_ranks": 0, "loss_rank_avg": 0.16982173919677734, "step": 4975, "valid_targets_mean": 2223.4, "valid_targets_min": 999 }, { "epoch": 5.23109243697479, "grad_norm": 0.6863440387762159, "learning_rate": 7.298725131979629e-06, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.15579064190387726, "step": 4980, "valid_targets_mean": 3175.9, "valid_targets_min": 1177 }, { "epoch": 5.236344537815126, "grad_norm": 0.7441930568222063, "learning_rate": 7.258302618171287e-06, "loss": 0.1701, "loss_nan_ranks": 0, "loss_rank_avg": 0.1511012315750122, "step": 4985, "valid_targets_mean": 2616.9, "valid_targets_min": 733 }, { "epoch": 5.241596638655462, "grad_norm": 0.7374029049491165, "learning_rate": 7.217967521925775e-06, "loss": 0.1621, "loss_nan_ranks": 0, "loss_rank_avg": 0.16436655819416046, "step": 4990, "valid_targets_mean": 2690.6, "valid_targets_min": 874 }, { "epoch": 5.246848739495798, "grad_norm": 0.7497430314524601, "learning_rate": 7.177720119971998e-06, "loss": 0.1527, "loss_nan_ranks": 0, "loss_rank_avg": 0.17379173636436462, "step": 4995, "valid_targets_mean": 2911.5, "valid_targets_min": 835 }, { "epoch": 5.2521008403361344, "grad_norm": 0.7942479630297596, "learning_rate": 7.137560688437184e-06, "loss": 0.1658, "loss_nan_ranks": 0, "loss_rank_avg": 0.1384781152009964, "step": 5000, "valid_targets_mean": 1960.1, "valid_targets_min": 765 }, { "epoch": 5.257352941176471, "grad_norm": 0.6952857832526612, "learning_rate": 7.097489502845047e-06, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.12435892224311829, "step": 5005, "valid_targets_mean": 2232.8, "valid_targets_min": 420 }, { "epoch": 5.262605042016807, "grad_norm": 0.7259264839559267, "learning_rate": 7.0575068381138525e-06, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.15408116579055786, "step": 5010, "valid_targets_mean": 2326.8, "valid_targets_min": 1105 }, { "epoch": 5.267857142857143, "grad_norm": 0.6907832100331577, "learning_rate": 7.0176129685545414e-06, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.1581760197877884, "step": 5015, "valid_targets_mean": 2910.8, "valid_targets_min": 643 }, { "epoch": 5.273109243697479, "grad_norm": 0.7359189102249872, "learning_rate": 6.977808167868867e-06, "loss": 0.1655, "loss_nan_ranks": 0, "loss_rank_avg": 0.1630137860774994, "step": 5020, "valid_targets_mean": 3007.1, "valid_targets_min": 1082 }, { "epoch": 5.2783613445378155, "grad_norm": 0.7813513338182236, "learning_rate": 6.9380927091475085e-06, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.16749534010887146, "step": 5025, "valid_targets_mean": 2539.6, "valid_targets_min": 793 }, { "epoch": 5.283613445378151, "grad_norm": 0.7597593894886342, "learning_rate": 6.898466864868165e-06, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.16621197760105133, "step": 5030, "valid_targets_mean": 2721.4, "valid_targets_min": 1009 }, { "epoch": 5.288865546218488, "grad_norm": 0.7182742303119539, "learning_rate": 6.858930906893751e-06, "loss": 0.1631, "loss_nan_ranks": 0, "loss_rank_avg": 0.15185761451721191, "step": 5035, "valid_targets_mean": 2491.1, "valid_targets_min": 754 }, { "epoch": 5.294117647058823, "grad_norm": 0.8593841083426136, "learning_rate": 6.819485106470454e-06, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.15788263082504272, "step": 5040, "valid_targets_mean": 1728.0, "valid_targets_min": 846 }, { "epoch": 5.29936974789916, "grad_norm": 0.8035500930290126, "learning_rate": 6.780129734225949e-06, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.15254664421081543, "step": 5045, "valid_targets_mean": 2170.8, "valid_targets_min": 841 }, { "epoch": 5.304621848739496, "grad_norm": 0.8459834255980975, "learning_rate": 6.740865060167483e-06, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.16684821248054504, "step": 5050, "valid_targets_mean": 1869.9, "valid_targets_min": 740 }, { "epoch": 5.309873949579832, "grad_norm": 0.7852698744711136, "learning_rate": 6.701691353680049e-06, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.1623380482196808, "step": 5055, "valid_targets_mean": 2586.2, "valid_targets_min": 728 }, { "epoch": 5.315126050420168, "grad_norm": 0.7811887298191118, "learning_rate": 6.662608883524542e-06, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.13154323399066925, "step": 5060, "valid_targets_mean": 1648.8, "valid_targets_min": 739 }, { "epoch": 5.320378151260504, "grad_norm": 0.660895377255489, "learning_rate": 6.6236179178359115e-06, "loss": 0.1642, "loss_nan_ranks": 0, "loss_rank_avg": 0.15457244217395782, "step": 5065, "valid_targets_mean": 3175.9, "valid_targets_min": 680 }, { "epoch": 5.32563025210084, "grad_norm": 0.7245039671860787, "learning_rate": 6.5847187241213e-06, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.14748461544513702, "step": 5070, "valid_targets_mean": 2657.9, "valid_targets_min": 878 }, { "epoch": 5.330882352941177, "grad_norm": 0.7753382710745726, "learning_rate": 6.5459115692582386e-06, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.16546081006526947, "step": 5075, "valid_targets_mean": 2395.2, "valid_targets_min": 798 }, { "epoch": 5.336134453781512, "grad_norm": 0.7698920766313514, "learning_rate": 6.507196719492819e-06, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.1609654426574707, "step": 5080, "valid_targets_mean": 2615.0, "valid_targets_min": 881 }, { "epoch": 5.341386554621849, "grad_norm": 0.8553168767751825, "learning_rate": 6.468574440437801e-06, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.15425896644592285, "step": 5085, "valid_targets_mean": 1917.0, "valid_targets_min": 647 }, { "epoch": 5.3466386554621845, "grad_norm": 0.7379979219387762, "learning_rate": 6.43004499707089e-06, "loss": 0.1704, "loss_nan_ranks": 0, "loss_rank_avg": 0.18386310338974, "step": 5090, "valid_targets_mean": 2954.1, "valid_targets_min": 917 }, { "epoch": 5.351890756302521, "grad_norm": 0.800532265924272, "learning_rate": 6.3916086537328545e-06, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.1512497365474701, "step": 5095, "valid_targets_mean": 2645.6, "valid_targets_min": 641 }, { "epoch": 5.357142857142857, "grad_norm": 0.7258456117778306, "learning_rate": 6.3532656741257145e-06, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.15273120999336243, "step": 5100, "valid_targets_mean": 2574.7, "valid_targets_min": 759 }, { "epoch": 5.362394957983193, "grad_norm": 0.732365954356259, "learning_rate": 6.315016321310965e-06, "loss": 0.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.16224431991577148, "step": 5105, "valid_targets_mean": 2581.6, "valid_targets_min": 835 }, { "epoch": 5.367647058823529, "grad_norm": 0.7789962344565333, "learning_rate": 6.276860857707727e-06, "loss": 0.1719, "loss_nan_ranks": 0, "loss_rank_avg": 0.17684108018875122, "step": 5110, "valid_targets_mean": 2496.4, "valid_targets_min": 776 }, { "epoch": 5.3728991596638656, "grad_norm": 0.8532814228814727, "learning_rate": 6.238799545090994e-06, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.1521385908126831, "step": 5115, "valid_targets_mean": 2414.0, "valid_targets_min": 713 }, { "epoch": 5.378151260504202, "grad_norm": 0.7899952744078172, "learning_rate": 6.20083264458981e-06, "loss": 0.1474, "loss_nan_ranks": 0, "loss_rank_avg": 0.1502818763256073, "step": 5120, "valid_targets_mean": 2204.8, "valid_targets_min": 716 }, { "epoch": 5.383403361344538, "grad_norm": 0.6387635570636864, "learning_rate": 6.162960416685469e-06, "loss": 0.1602, "loss_nan_ranks": 0, "loss_rank_avg": 0.1471373438835144, "step": 5125, "valid_targets_mean": 3084.1, "valid_targets_min": 1468 }, { "epoch": 5.388655462184874, "grad_norm": 0.8485693482893446, "learning_rate": 6.125183121209741e-06, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.1780264526605606, "step": 5130, "valid_targets_mean": 2274.9, "valid_targets_min": 1094 }, { "epoch": 5.39390756302521, "grad_norm": 0.7495677095087009, "learning_rate": 6.087501017343107e-06, "loss": 0.1644, "loss_nan_ranks": 0, "loss_rank_avg": 0.15651904046535492, "step": 5135, "valid_targets_mean": 2542.9, "valid_targets_min": 763 }, { "epoch": 5.399159663865547, "grad_norm": 0.7435758493446045, "learning_rate": 6.0499143636129384e-06, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.1455836445093155, "step": 5140, "valid_targets_mean": 2512.5, "valid_targets_min": 797 }, { "epoch": 5.404411764705882, "grad_norm": 0.8993390562265813, "learning_rate": 6.012423417891766e-06, "loss": 0.1672, "loss_nan_ranks": 0, "loss_rank_avg": 0.17336681485176086, "step": 5145, "valid_targets_mean": 2680.2, "valid_targets_min": 801 }, { "epoch": 5.409663865546219, "grad_norm": 0.8004525963625007, "learning_rate": 5.975028437395493e-06, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.15126681327819824, "step": 5150, "valid_targets_mean": 2013.7, "valid_targets_min": 790 }, { "epoch": 5.4149159663865545, "grad_norm": 0.7799255786777086, "learning_rate": 5.937729678681612e-06, "loss": 0.1576, "loss_nan_ranks": 0, "loss_rank_avg": 0.15724611282348633, "step": 5155, "valid_targets_mean": 2525.8, "valid_targets_min": 1280 }, { "epoch": 5.420168067226891, "grad_norm": 0.7841845158497852, "learning_rate": 5.9005273976474684e-06, "loss": 0.171, "loss_nan_ranks": 0, "loss_rank_avg": 0.15903203189373016, "step": 5160, "valid_targets_mean": 2379.1, "valid_targets_min": 1163 }, { "epoch": 5.425420168067227, "grad_norm": 0.6717665505168996, "learning_rate": 5.8634218495285126e-06, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.14495673775672913, "step": 5165, "valid_targets_mean": 2827.6, "valid_targets_min": 1100 }, { "epoch": 5.430672268907563, "grad_norm": 0.8298875239928819, "learning_rate": 5.8264132888965155e-06, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.14547504484653473, "step": 5170, "valid_targets_mean": 2200.4, "valid_targets_min": 744 }, { "epoch": 5.435924369747899, "grad_norm": 0.7078895304712665, "learning_rate": 5.789501969657853e-06, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.14443817734718323, "step": 5175, "valid_targets_mean": 2713.6, "valid_targets_min": 785 }, { "epoch": 5.4411764705882355, "grad_norm": 0.7468395911409705, "learning_rate": 5.752688145051761e-06, "loss": 0.1645, "loss_nan_ranks": 0, "loss_rank_avg": 0.15606167912483215, "step": 5180, "valid_targets_mean": 2896.7, "valid_targets_min": 933 }, { "epoch": 5.446428571428571, "grad_norm": 0.7339528998149712, "learning_rate": 5.715972067648561e-06, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.16431309282779694, "step": 5185, "valid_targets_mean": 2671.4, "valid_targets_min": 780 }, { "epoch": 5.451680672268908, "grad_norm": 0.7898995773556446, "learning_rate": 5.679353989347989e-06, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.14948245882987976, "step": 5190, "valid_targets_mean": 2137.9, "valid_targets_min": 623 }, { "epoch": 5.456932773109243, "grad_norm": 0.8149040646058742, "learning_rate": 5.642834161377408e-06, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.16367627680301666, "step": 5195, "valid_targets_mean": 2087.3, "valid_targets_min": 1040 }, { "epoch": 5.46218487394958, "grad_norm": 0.6719154088237885, "learning_rate": 5.606412834290121e-06, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.14343780279159546, "step": 5200, "valid_targets_mean": 3016.2, "valid_targets_min": 1041 }, { "epoch": 5.467436974789916, "grad_norm": 0.8508194897949711, "learning_rate": 5.570090257963645e-06, "loss": 0.1638, "loss_nan_ranks": 0, "loss_rank_avg": 0.16275382041931152, "step": 5205, "valid_targets_mean": 1842.1, "valid_targets_min": 1076 }, { "epoch": 5.472689075630252, "grad_norm": 0.7598842769868193, "learning_rate": 5.533866681597981e-06, "loss": 0.155, "loss_nan_ranks": 0, "loss_rank_avg": 0.1676841378211975, "step": 5210, "valid_targets_mean": 2668.4, "valid_targets_min": 900 }, { "epoch": 5.477941176470588, "grad_norm": 0.8473153688144975, "learning_rate": 5.497742353713928e-06, "loss": 0.1689, "loss_nan_ranks": 0, "loss_rank_avg": 0.17238308489322662, "step": 5215, "valid_targets_mean": 2029.6, "valid_targets_min": 670 }, { "epoch": 5.483193277310924, "grad_norm": 0.737492773817561, "learning_rate": 5.461717522151371e-06, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.15577836334705353, "step": 5220, "valid_targets_mean": 2799.9, "valid_targets_min": 782 }, { "epoch": 5.48844537815126, "grad_norm": 0.7013802768068832, "learning_rate": 5.4257924340675535e-06, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.16768768429756165, "step": 5225, "valid_targets_mean": 3200.6, "valid_targets_min": 1303 }, { "epoch": 5.493697478991597, "grad_norm": 0.6898526895385486, "learning_rate": 5.389967335935429e-06, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.15428847074508667, "step": 5230, "valid_targets_mean": 2979.0, "valid_targets_min": 735 }, { "epoch": 5.498949579831933, "grad_norm": 0.8269332396210477, "learning_rate": 5.3542424735419306e-06, "loss": 0.1662, "loss_nan_ranks": 0, "loss_rank_avg": 0.1691667139530182, "step": 5235, "valid_targets_mean": 2126.2, "valid_targets_min": 641 }, { "epoch": 5.504201680672269, "grad_norm": 0.7582781505938827, "learning_rate": 5.318618091986294e-06, "loss": 0.1595, "loss_nan_ranks": 0, "loss_rank_avg": 0.16203898191452026, "step": 5240, "valid_targets_mean": 2414.2, "valid_targets_min": 758 }, { "epoch": 5.509453781512605, "grad_norm": 0.964837540275934, "learning_rate": 5.283094435678398e-06, "loss": 0.1643, "loss_nan_ranks": 0, "loss_rank_avg": 0.18285033106803894, "step": 5245, "valid_targets_mean": 2520.3, "valid_targets_min": 814 }, { "epoch": 5.514705882352941, "grad_norm": 0.7407984840086744, "learning_rate": 5.2476717483370685e-06, "loss": 0.1691, "loss_nan_ranks": 0, "loss_rank_avg": 0.18044058978557587, "step": 5250, "valid_targets_mean": 2980.8, "valid_targets_min": 757 }, { "epoch": 5.519957983193278, "grad_norm": 0.670814241203273, "learning_rate": 5.212350272988394e-06, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.13862532377243042, "step": 5255, "valid_targets_mean": 2928.0, "valid_targets_min": 752 }, { "epoch": 5.525210084033613, "grad_norm": 0.7638249491401231, "learning_rate": 5.177130251964088e-06, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.15651783347129822, "step": 5260, "valid_targets_mean": 2388.1, "valid_targets_min": 620 }, { "epoch": 5.53046218487395, "grad_norm": 0.7464606207804972, "learning_rate": 5.1420119268998085e-06, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.15144014358520508, "step": 5265, "valid_targets_mean": 2414.2, "valid_targets_min": 739 }, { "epoch": 5.535714285714286, "grad_norm": 0.6723804956667677, "learning_rate": 5.106995538733488e-06, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.12311984598636627, "step": 5270, "valid_targets_mean": 2505.5, "valid_targets_min": 814 }, { "epoch": 5.540966386554622, "grad_norm": 0.7514104012472849, "learning_rate": 5.07208132770372e-06, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.16300344467163086, "step": 5275, "valid_targets_mean": 2621.9, "valid_targets_min": 1151 }, { "epoch": 5.546218487394958, "grad_norm": 0.8709704943028632, "learning_rate": 5.037269533348075e-06, "loss": 0.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.15614300966262817, "step": 5280, "valid_targets_mean": 2086.8, "valid_targets_min": 892 }, { "epoch": 5.551470588235294, "grad_norm": 0.8145404233606028, "learning_rate": 5.002560394501463e-06, "loss": 0.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.1704893410205841, "step": 5285, "valid_targets_mean": 2252.9, "valid_targets_min": 816 }, { "epoch": 5.55672268907563, "grad_norm": 0.7858067778473078, "learning_rate": 4.9679541492945135e-06, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.17581012845039368, "step": 5290, "valid_targets_mean": 2497.4, "valid_targets_min": 832 }, { "epoch": 5.561974789915967, "grad_norm": 0.7444934360144145, "learning_rate": 4.933451035151913e-06, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.16977301239967346, "step": 5295, "valid_targets_mean": 2621.8, "valid_targets_min": 734 }, { "epoch": 5.567226890756302, "grad_norm": 0.7002188781201552, "learning_rate": 4.899051288790806e-06, "loss": 0.1643, "loss_nan_ranks": 0, "loss_rank_avg": 0.15018996596336365, "step": 5300, "valid_targets_mean": 2713.4, "valid_targets_min": 839 }, { "epoch": 5.572478991596639, "grad_norm": 0.7598676053646428, "learning_rate": 4.86475514621916e-06, "loss": 0.165, "loss_nan_ranks": 0, "loss_rank_avg": 0.16991931200027466, "step": 5305, "valid_targets_mean": 2667.0, "valid_targets_min": 900 }, { "epoch": 5.5777310924369745, "grad_norm": 0.8820515115776142, "learning_rate": 4.830562842734112e-06, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.1688452661037445, "step": 5310, "valid_targets_mean": 2134.6, "valid_targets_min": 903 }, { "epoch": 5.582983193277311, "grad_norm": 0.7149756144412622, "learning_rate": 4.796474612920421e-06, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.15258319675922394, "step": 5315, "valid_targets_mean": 2937.4, "valid_targets_min": 513 }, { "epoch": 5.588235294117647, "grad_norm": 0.6941030908245607, "learning_rate": 4.762490690648813e-06, "loss": 0.1652, "loss_nan_ranks": 0, "loss_rank_avg": 0.17828604578971863, "step": 5320, "valid_targets_mean": 3366.6, "valid_targets_min": 613 }, { "epoch": 5.593487394957983, "grad_norm": 0.7755309453396569, "learning_rate": 4.728611309074374e-06, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.16606014966964722, "step": 5325, "valid_targets_mean": 2534.5, "valid_targets_min": 746 }, { "epoch": 5.598739495798319, "grad_norm": 0.7161574736206265, "learning_rate": 4.694836700634975e-06, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.1472625732421875, "step": 5330, "valid_targets_mean": 2363.2, "valid_targets_min": 864 }, { "epoch": 5.6039915966386555, "grad_norm": 0.9658673174845026, "learning_rate": 4.661167097049668e-06, "loss": 0.1695, "loss_nan_ranks": 0, "loss_rank_avg": 0.15956471860408783, "step": 5335, "valid_targets_mean": 2047.2, "valid_targets_min": 922 }, { "epoch": 5.609243697478991, "grad_norm": 0.8292596385955369, "learning_rate": 4.62760272931708e-06, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.16373419761657715, "step": 5340, "valid_targets_mean": 2055.4, "valid_targets_min": 873 }, { "epoch": 5.614495798319328, "grad_norm": 0.7872816299655447, "learning_rate": 4.594143827713844e-06, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.16614991426467896, "step": 5345, "valid_targets_mean": 2267.2, "valid_targets_min": 676 }, { "epoch": 5.619747899159664, "grad_norm": 0.6885239670075206, "learning_rate": 4.56079062179303e-06, "loss": 0.1614, "loss_nan_ranks": 0, "loss_rank_avg": 0.1568869948387146, "step": 5350, "valid_targets_mean": 3092.1, "valid_targets_min": 739 }, { "epoch": 5.625, "grad_norm": 0.7063945748122799, "learning_rate": 4.527543340382538e-06, "loss": 0.1653, "loss_nan_ranks": 0, "loss_rank_avg": 0.15817028284072876, "step": 5355, "valid_targets_mean": 3193.8, "valid_targets_min": 720 }, { "epoch": 5.630252100840336, "grad_norm": 0.7483586106813811, "learning_rate": 4.494402211583569e-06, "loss": 0.1674, "loss_nan_ranks": 0, "loss_rank_avg": 0.1763601005077362, "step": 5360, "valid_targets_mean": 2585.2, "valid_targets_min": 702 }, { "epoch": 5.635504201680672, "grad_norm": 0.7266651690365762, "learning_rate": 4.461367462769009e-06, "loss": 0.1649, "loss_nan_ranks": 0, "loss_rank_avg": 0.15703195333480835, "step": 5365, "valid_targets_mean": 2579.4, "valid_targets_min": 943 }, { "epoch": 5.640756302521009, "grad_norm": 0.7723418200616802, "learning_rate": 4.428439320581923e-06, "loss": 0.1672, "loss_nan_ranks": 0, "loss_rank_avg": 0.16179069876670837, "step": 5370, "valid_targets_mean": 2583.6, "valid_targets_min": 1207 }, { "epoch": 5.6460084033613445, "grad_norm": 0.6951598907006209, "learning_rate": 4.3956180109339705e-06, "loss": 0.1631, "loss_nan_ranks": 0, "loss_rank_avg": 0.15667061507701874, "step": 5375, "valid_targets_mean": 2790.9, "valid_targets_min": 985 }, { "epoch": 5.651260504201681, "grad_norm": 0.7579446080195453, "learning_rate": 4.362903759003849e-06, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.15197469294071198, "step": 5380, "valid_targets_mean": 2506.1, "valid_targets_min": 853 }, { "epoch": 5.656512605042017, "grad_norm": 0.7299857797114069, "learning_rate": 4.33029678923576e-06, "loss": 0.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.1476059854030609, "step": 5385, "valid_targets_mean": 2806.4, "valid_targets_min": 824 }, { "epoch": 5.661764705882353, "grad_norm": 0.7781274130758863, "learning_rate": 4.297797325337889e-06, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.1483781933784485, "step": 5390, "valid_targets_mean": 2407.4, "valid_targets_min": 1184 }, { "epoch": 5.667016806722689, "grad_norm": 0.7313088256357814, "learning_rate": 4.265405590280822e-06, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.15789197385311127, "step": 5395, "valid_targets_mean": 3041.6, "valid_targets_min": 1206 }, { "epoch": 5.6722689075630255, "grad_norm": 0.8103212447323822, "learning_rate": 4.233121806296072e-06, "loss": 0.1651, "loss_nan_ranks": 0, "loss_rank_avg": 0.17392036318778992, "step": 5400, "valid_targets_mean": 2288.4, "valid_targets_min": 533 }, { "epoch": 5.677521008403361, "grad_norm": 0.7595385849740667, "learning_rate": 4.200946194874514e-06, "loss": 0.1584, "loss_nan_ranks": 0, "loss_rank_avg": 0.15691381692886353, "step": 5405, "valid_targets_mean": 2395.4, "valid_targets_min": 914 }, { "epoch": 5.682773109243698, "grad_norm": 0.7278254832783921, "learning_rate": 4.168878976764872e-06, "loss": 0.164, "loss_nan_ranks": 0, "loss_rank_avg": 0.1525121033191681, "step": 5410, "valid_targets_mean": 2631.4, "valid_targets_min": 1157 }, { "epoch": 5.688025210084033, "grad_norm": 0.8021682749292429, "learning_rate": 4.136920371972228e-06, "loss": 0.1625, "loss_nan_ranks": 0, "loss_rank_avg": 0.14895716309547424, "step": 5415, "valid_targets_mean": 1936.1, "valid_targets_min": 912 }, { "epoch": 5.69327731092437, "grad_norm": 0.6953948453787546, "learning_rate": 4.105070599756482e-06, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.15940669178962708, "step": 5420, "valid_targets_mean": 2777.6, "valid_targets_min": 865 }, { "epoch": 5.698529411764706, "grad_norm": 0.770187756365488, "learning_rate": 4.073329878630856e-06, "loss": 0.1667, "loss_nan_ranks": 0, "loss_rank_avg": 0.16655011475086212, "step": 5425, "valid_targets_mean": 2557.6, "valid_targets_min": 770 }, { "epoch": 5.703781512605042, "grad_norm": 0.7698518711299432, "learning_rate": 4.041698426360425e-06, "loss": 0.1695, "loss_nan_ranks": 0, "loss_rank_avg": 0.1650160849094391, "step": 5430, "valid_targets_mean": 2342.6, "valid_targets_min": 682 }, { "epoch": 5.709033613445378, "grad_norm": 0.7840326454397952, "learning_rate": 4.010176459960569e-06, "loss": 0.1603, "loss_nan_ranks": 0, "loss_rank_avg": 0.161130890250206, "step": 5435, "valid_targets_mean": 2237.3, "valid_targets_min": 715 }, { "epoch": 5.714285714285714, "grad_norm": 0.6973943107045614, "learning_rate": 3.978764195695528e-06, "loss": 0.1572, "loss_nan_ranks": 0, "loss_rank_avg": 0.14485879242420197, "step": 5440, "valid_targets_mean": 2737.0, "valid_targets_min": 977 }, { "epoch": 5.71953781512605, "grad_norm": 0.8240293274129915, "learning_rate": 3.947461849076912e-06, "loss": 0.1688, "loss_nan_ranks": 0, "loss_rank_avg": 0.19433113932609558, "step": 5445, "valid_targets_mean": 2314.3, "valid_targets_min": 977 }, { "epoch": 5.724789915966387, "grad_norm": 0.8114689626823407, "learning_rate": 3.916269634862193e-06, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.15822897851467133, "step": 5450, "valid_targets_mean": 2607.1, "valid_targets_min": 636 }, { "epoch": 5.730042016806722, "grad_norm": 0.8364269359269342, "learning_rate": 3.885187767053269e-06, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.1558850109577179, "step": 5455, "valid_targets_mean": 1694.3, "valid_targets_min": 838 }, { "epoch": 5.735294117647059, "grad_norm": 0.8692400632474553, "learning_rate": 3.854216458894973e-06, "loss": 0.1636, "loss_nan_ranks": 0, "loss_rank_avg": 0.16702617704868317, "step": 5460, "valid_targets_mean": 2202.1, "valid_targets_min": 777 }, { "epoch": 5.740546218487395, "grad_norm": 0.7101368299314894, "learning_rate": 3.823355922873606e-06, "loss": 0.1624, "loss_nan_ranks": 0, "loss_rank_avg": 0.14841680228710175, "step": 5465, "valid_targets_mean": 2778.5, "valid_targets_min": 738 }, { "epoch": 5.745798319327731, "grad_norm": 0.7291139806638217, "learning_rate": 3.792606370715508e-06, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.1669558882713318, "step": 5470, "valid_targets_mean": 2786.6, "valid_targets_min": 1024 }, { "epoch": 5.751050420168067, "grad_norm": 0.8199168939791637, "learning_rate": 3.761968013385584e-06, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.15248140692710876, "step": 5475, "valid_targets_mean": 1965.8, "valid_targets_min": 655 }, { "epoch": 5.756302521008403, "grad_norm": 0.7220120926134376, "learning_rate": 3.731441061085843e-06, "loss": 0.1679, "loss_nan_ranks": 0, "loss_rank_avg": 0.15842077136039734, "step": 5480, "valid_targets_mean": 2855.1, "valid_targets_min": 1118 }, { "epoch": 5.76155462184874, "grad_norm": 0.7691870517732631, "learning_rate": 3.701025723253988e-06, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.14176911115646362, "step": 5485, "valid_targets_mean": 2196.8, "valid_targets_min": 640 }, { "epoch": 5.766806722689076, "grad_norm": 0.6895030971240736, "learning_rate": 3.67072220856197e-06, "loss": 0.1692, "loss_nan_ranks": 0, "loss_rank_avg": 0.15497374534606934, "step": 5490, "valid_targets_mean": 2655.5, "valid_targets_min": 1184 }, { "epoch": 5.772058823529412, "grad_norm": 0.7338262928726779, "learning_rate": 3.640530724914517e-06, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.16165027022361755, "step": 5495, "valid_targets_mean": 2627.9, "valid_targets_min": 949 }, { "epoch": 5.777310924369748, "grad_norm": 0.7406660843906033, "learning_rate": 3.61045147944777e-06, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.14221808314323425, "step": 5500, "valid_targets_mean": 2517.7, "valid_targets_min": 578 }, { "epoch": 5.782563025210084, "grad_norm": 0.7608572974428726, "learning_rate": 3.5804846785278315e-06, "loss": 0.159, "loss_nan_ranks": 0, "loss_rank_avg": 0.15930047631263733, "step": 5505, "valid_targets_mean": 2888.9, "valid_targets_min": 1200 }, { "epoch": 5.78781512605042, "grad_norm": 0.7935824693797842, "learning_rate": 3.5506305277493326e-06, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.1513899266719818, "step": 5510, "valid_targets_mean": 2279.6, "valid_targets_min": 597 }, { "epoch": 5.793067226890757, "grad_norm": 0.790428932578931, "learning_rate": 3.520889231934057e-06, "loss": 0.1624, "loss_nan_ranks": 0, "loss_rank_avg": 0.1564992070198059, "step": 5515, "valid_targets_mean": 2152.1, "valid_targets_min": 1278 }, { "epoch": 5.798319327731092, "grad_norm": 0.8386478323895583, "learning_rate": 3.4912609951295084e-06, "loss": 0.1692, "loss_nan_ranks": 0, "loss_rank_avg": 0.1771148443222046, "step": 5520, "valid_targets_mean": 2142.2, "valid_targets_min": 841 }, { "epoch": 5.803571428571429, "grad_norm": 0.8169074903755393, "learning_rate": 3.461746020607526e-06, "loss": 0.1659, "loss_nan_ranks": 0, "loss_rank_avg": 0.16074536740779877, "step": 5525, "valid_targets_mean": 2207.6, "valid_targets_min": 760 }, { "epoch": 5.8088235294117645, "grad_norm": 0.7542209212555967, "learning_rate": 3.432344510862895e-06, "loss": 0.1612, "loss_nan_ranks": 0, "loss_rank_avg": 0.17460983991622925, "step": 5530, "valid_targets_mean": 2285.8, "valid_targets_min": 721 }, { "epoch": 5.814075630252101, "grad_norm": 0.9980332994549753, "learning_rate": 3.403056667611917e-06, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.17128345370292664, "step": 5535, "valid_targets_mean": 2691.8, "valid_targets_min": 785 }, { "epoch": 5.819327731092437, "grad_norm": 0.7583521616551634, "learning_rate": 3.373882691791088e-06, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.15085886418819427, "step": 5540, "valid_targets_mean": 2659.0, "valid_targets_min": 748 }, { "epoch": 5.824579831932773, "grad_norm": 0.8477434832925683, "learning_rate": 3.344822783555679e-06, "loss": 0.1623, "loss_nan_ranks": 0, "loss_rank_avg": 0.16110014915466309, "step": 5545, "valid_targets_mean": 1985.5, "valid_targets_min": 697 }, { "epoch": 5.829831932773109, "grad_norm": 0.7643511912140655, "learning_rate": 3.315877142278363e-06, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.16038095951080322, "step": 5550, "valid_targets_mean": 2380.6, "valid_targets_min": 725 }, { "epoch": 5.8350840336134455, "grad_norm": 0.7518728544106923, "learning_rate": 3.287045966547866e-06, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.17358054220676422, "step": 5555, "valid_targets_mean": 2760.2, "valid_targets_min": 692 }, { "epoch": 5.840336134453781, "grad_norm": 0.7124048514016621, "learning_rate": 3.258329454167599e-06, "loss": 0.159, "loss_nan_ranks": 0, "loss_rank_avg": 0.1632152795791626, "step": 5560, "valid_targets_mean": 2886.0, "valid_targets_min": 710 }, { "epoch": 5.845588235294118, "grad_norm": 0.8638758876946544, "learning_rate": 3.2297278021542833e-06, "loss": 0.1732, "loss_nan_ranks": 0, "loss_rank_avg": 0.18239599466323853, "step": 5565, "valid_targets_mean": 2045.9, "valid_targets_min": 818 }, { "epoch": 5.850840336134453, "grad_norm": 0.8074069942626705, "learning_rate": 3.201241206736614e-06, "loss": 0.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.19121696054935455, "step": 5570, "valid_targets_mean": 2512.3, "valid_targets_min": 819 }, { "epoch": 5.85609243697479, "grad_norm": 0.8094730562236274, "learning_rate": 3.1728698633539266e-06, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.1697961837053299, "step": 5575, "valid_targets_mean": 2204.6, "valid_targets_min": 713 }, { "epoch": 5.8613445378151265, "grad_norm": 0.7593441846784588, "learning_rate": 3.1446139666548212e-06, "loss": 0.1631, "loss_nan_ranks": 0, "loss_rank_avg": 0.1595013290643692, "step": 5580, "valid_targets_mean": 2633.0, "valid_targets_min": 707 }, { "epoch": 5.866596638655462, "grad_norm": 0.7957651638135713, "learning_rate": 3.1164737104958707e-06, "loss": 0.1599, "loss_nan_ranks": 0, "loss_rank_avg": 0.15644320845603943, "step": 5585, "valid_targets_mean": 1890.6, "valid_targets_min": 797 }, { "epoch": 5.871848739495798, "grad_norm": 0.8090053281592035, "learning_rate": 3.0884492879402452e-06, "loss": 0.1633, "loss_nan_ranks": 0, "loss_rank_avg": 0.17713585495948792, "step": 5590, "valid_targets_mean": 2193.5, "valid_targets_min": 682 }, { "epoch": 5.8771008403361344, "grad_norm": 0.7500689718315519, "learning_rate": 3.0605408912564184e-06, "loss": 0.1647, "loss_nan_ranks": 0, "loss_rank_avg": 0.16628164052963257, "step": 5595, "valid_targets_mean": 2580.8, "valid_targets_min": 754 }, { "epoch": 5.882352941176471, "grad_norm": 0.8192677926893119, "learning_rate": 3.032748711916851e-06, "loss": 0.1657, "loss_nan_ranks": 0, "loss_rank_avg": 0.16836728155612946, "step": 5600, "valid_targets_mean": 2461.7, "valid_targets_min": 788 }, { "epoch": 5.887605042016807, "grad_norm": 0.7874830104284019, "learning_rate": 3.0050729405966495e-06, "loss": 0.1632, "loss_nan_ranks": 0, "loss_rank_avg": 0.16090510785579681, "step": 5605, "valid_targets_mean": 2267.6, "valid_targets_min": 244 }, { "epoch": 5.892857142857143, "grad_norm": 0.7833656235582289, "learning_rate": 2.9775137671722754e-06, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.1637769341468811, "step": 5610, "valid_targets_mean": 2443.2, "valid_targets_min": 713 }, { "epoch": 5.898109243697479, "grad_norm": 0.7228128266155345, "learning_rate": 2.9500713807202565e-06, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.15642684698104858, "step": 5615, "valid_targets_mean": 2638.7, "valid_targets_min": 683 }, { "epoch": 5.9033613445378155, "grad_norm": 0.6752375605078036, "learning_rate": 2.9227459695158543e-06, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.15065337717533112, "step": 5620, "valid_targets_mean": 3194.4, "valid_targets_min": 1263 }, { "epoch": 5.908613445378151, "grad_norm": 0.8638709102103872, "learning_rate": 2.895537721031809e-06, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.16943012177944183, "step": 5625, "valid_targets_mean": 1833.1, "valid_targets_min": 776 }, { "epoch": 5.913865546218488, "grad_norm": 0.7646968532660349, "learning_rate": 2.8684468219370364e-06, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.14894887804985046, "step": 5630, "valid_targets_mean": 2673.2, "valid_targets_min": 697 }, { "epoch": 5.919117647058823, "grad_norm": 0.7612881911075914, "learning_rate": 2.841473458095334e-06, "loss": 0.1668, "loss_nan_ranks": 0, "loss_rank_avg": 0.14882472157478333, "step": 5635, "valid_targets_mean": 2316.6, "valid_targets_min": 635 }, { "epoch": 5.92436974789916, "grad_norm": 0.7425817529470462, "learning_rate": 2.8146178145641355e-06, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.1679328829050064, "step": 5640, "valid_targets_mean": 2502.5, "valid_targets_min": 687 }, { "epoch": 5.929621848739496, "grad_norm": 0.9027720359549637, "learning_rate": 2.787880075593217e-06, "loss": 0.1669, "loss_nan_ranks": 0, "loss_rank_avg": 0.15756511688232422, "step": 5645, "valid_targets_mean": 2311.6, "valid_targets_min": 642 }, { "epoch": 5.934873949579832, "grad_norm": 0.6980735937613616, "learning_rate": 2.7612604246234355e-06, "loss": 0.1608, "loss_nan_ranks": 0, "loss_rank_avg": 0.16025885939598083, "step": 5650, "valid_targets_mean": 2912.9, "valid_targets_min": 854 }, { "epoch": 5.940126050420168, "grad_norm": 0.7529592237919616, "learning_rate": 2.7347590442854867e-06, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.17594562470912933, "step": 5655, "valid_targets_mean": 2683.8, "valid_targets_min": 1005 }, { "epoch": 5.945378151260504, "grad_norm": 0.7696301031774723, "learning_rate": 2.7083761163986433e-06, "loss": 0.1683, "loss_nan_ranks": 0, "loss_rank_avg": 0.17107313871383667, "step": 5660, "valid_targets_mean": 2896.2, "valid_targets_min": 732 }, { "epoch": 5.95063025210084, "grad_norm": 0.7798340627342268, "learning_rate": 2.682111821969493e-06, "loss": 0.1654, "loss_nan_ranks": 0, "loss_rank_avg": 0.16536115109920502, "step": 5665, "valid_targets_mean": 2587.5, "valid_targets_min": 873 }, { "epoch": 5.955882352941177, "grad_norm": 0.7149524883372318, "learning_rate": 2.6559663411907233e-06, "loss": 0.1604, "loss_nan_ranks": 0, "loss_rank_avg": 0.1709938943386078, "step": 5670, "valid_targets_mean": 2945.9, "valid_targets_min": 780 }, { "epoch": 5.961134453781512, "grad_norm": 0.7165019494853891, "learning_rate": 2.629939853439856e-06, "loss": 0.1664, "loss_nan_ranks": 0, "loss_rank_avg": 0.16053658723831177, "step": 5675, "valid_targets_mean": 2915.6, "valid_targets_min": 820 }, { "epoch": 5.966386554621849, "grad_norm": 0.9589101754966618, "learning_rate": 2.604032537278052e-06, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.15422767400741577, "step": 5680, "valid_targets_mean": 1772.9, "valid_targets_min": 622 }, { "epoch": 5.9716386554621845, "grad_norm": 0.7874586260627973, "learning_rate": 2.5782445704488447e-06, "loss": 0.1618, "loss_nan_ranks": 0, "loss_rank_avg": 0.14686915278434753, "step": 5685, "valid_targets_mean": 2175.2, "valid_targets_min": 662 }, { "epoch": 5.976890756302521, "grad_norm": 0.8291299717722125, "learning_rate": 2.5525761298769515e-06, "loss": 0.1672, "loss_nan_ranks": 0, "loss_rank_avg": 0.17729215323925018, "step": 5690, "valid_targets_mean": 2213.9, "valid_targets_min": 1434 }, { "epoch": 5.982142857142857, "grad_norm": 0.8550297198565612, "learning_rate": 2.527027391667054e-06, "loss": 0.1688, "loss_nan_ranks": 0, "loss_rank_avg": 0.18570925295352936, "step": 5695, "valid_targets_mean": 2631.9, "valid_targets_min": 840 }, { "epoch": 5.987394957983193, "grad_norm": 0.8225215202521778, "learning_rate": 2.501598531102587e-06, "loss": 0.1619, "loss_nan_ranks": 0, "loss_rank_avg": 0.1654691994190216, "step": 5700, "valid_targets_mean": 2116.9, "valid_targets_min": 721 }, { "epoch": 5.992647058823529, "grad_norm": 0.7818605889350404, "learning_rate": 2.47628972264452e-06, "loss": 0.1597, "loss_nan_ranks": 0, "loss_rank_avg": 0.15820591151714325, "step": 5705, "valid_targets_mean": 2376.9, "valid_targets_min": 775 }, { "epoch": 5.9978991596638656, "grad_norm": 0.7205251991716778, "learning_rate": 2.4511011399301944e-06, "loss": 0.1681, "loss_nan_ranks": 0, "loss_rank_avg": 0.16490915417671204, "step": 5710, "valid_targets_mean": 3045.2, "valid_targets_min": 921 }, { "epoch": 6.003151260504202, "grad_norm": 0.79777985742783, "learning_rate": 2.4260329557721107e-06, "loss": 0.1556, "loss_nan_ranks": 0, "loss_rank_avg": 0.16908371448516846, "step": 5715, "valid_targets_mean": 2234.9, "valid_targets_min": 789 }, { "epoch": 6.008403361344538, "grad_norm": 0.7056977699167971, "learning_rate": 2.4010853421567237e-06, "loss": 0.1435, "loss_nan_ranks": 0, "loss_rank_avg": 0.1342272162437439, "step": 5720, "valid_targets_mean": 2620.8, "valid_targets_min": 1276 }, { "epoch": 6.013655462184874, "grad_norm": 0.7206882042436742, "learning_rate": 2.376258470243309e-06, "loss": 0.1564, "loss_nan_ranks": 0, "loss_rank_avg": 0.1475621461868286, "step": 5725, "valid_targets_mean": 2910.7, "valid_targets_min": 998 }, { "epoch": 6.01890756302521, "grad_norm": 0.6958104794523656, "learning_rate": 2.351552510362758e-06, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.14622151851654053, "step": 5730, "valid_targets_mean": 3744.4, "valid_targets_min": 1153 }, { "epoch": 6.024159663865547, "grad_norm": 0.74834161850093, "learning_rate": 2.326967632016406e-06, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.1483282744884491, "step": 5735, "valid_targets_mean": 2573.9, "valid_targets_min": 791 }, { "epoch": 6.029411764705882, "grad_norm": 0.7566577246672258, "learning_rate": 2.302504003874888e-06, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.14986348152160645, "step": 5740, "valid_targets_mean": 2467.8, "valid_targets_min": 697 }, { "epoch": 6.034663865546219, "grad_norm": 0.7394059807325174, "learning_rate": 2.2781617937769675e-06, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.15996532142162323, "step": 5745, "valid_targets_mean": 3097.9, "valid_targets_min": 914 }, { "epoch": 6.0399159663865545, "grad_norm": 0.7291797979840863, "learning_rate": 2.2539411687283907e-06, "loss": 0.1588, "loss_nan_ranks": 0, "loss_rank_avg": 0.15175995230674744, "step": 5750, "valid_targets_mean": 2689.8, "valid_targets_min": 1214 }, { "epoch": 6.045168067226891, "grad_norm": 0.8021207951201383, "learning_rate": 2.229842294900744e-06, "loss": 0.1484, "loss_nan_ranks": 0, "loss_rank_avg": 0.15454252064228058, "step": 5755, "valid_targets_mean": 2140.5, "valid_targets_min": 829 }, { "epoch": 6.050420168067227, "grad_norm": 0.7912228519081135, "learning_rate": 2.205865337630302e-06, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.15131813287734985, "step": 5760, "valid_targets_mean": 2908.2, "valid_targets_min": 1220 }, { "epoch": 6.055672268907563, "grad_norm": 0.7907789459812723, "learning_rate": 2.182010461416899e-06, "loss": 0.1562, "loss_nan_ranks": 0, "loss_rank_avg": 0.1566312164068222, "step": 5765, "valid_targets_mean": 2503.7, "valid_targets_min": 757 }, { "epoch": 6.060924369747899, "grad_norm": 0.8839642676042035, "learning_rate": 2.158277829922817e-06, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.1570267528295517, "step": 5770, "valid_targets_mean": 1742.3, "valid_targets_min": 544 }, { "epoch": 6.0661764705882355, "grad_norm": 0.8625467723504546, "learning_rate": 2.1346676059716253e-06, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.14902624487876892, "step": 5775, "valid_targets_mean": 2078.1, "valid_targets_min": 754 }, { "epoch": 6.071428571428571, "grad_norm": 0.7087088554579924, "learning_rate": 2.1111799515471066e-06, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.13471050560474396, "step": 5780, "valid_targets_mean": 2473.5, "valid_targets_min": 697 }, { "epoch": 6.076680672268908, "grad_norm": 0.7327436066837598, "learning_rate": 2.0878150277921195e-06, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.13805945217609406, "step": 5785, "valid_targets_mean": 2741.4, "valid_targets_min": 704 }, { "epoch": 6.081932773109243, "grad_norm": 0.8315227818730387, "learning_rate": 2.064572995007492e-06, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.14630141854286194, "step": 5790, "valid_targets_mean": 2002.4, "valid_targets_min": 676 }, { "epoch": 6.08718487394958, "grad_norm": 0.8401948839242035, "learning_rate": 2.0414540126509274e-06, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.16226598620414734, "step": 5795, "valid_targets_mean": 2131.1, "valid_targets_min": 719 }, { "epoch": 6.092436974789916, "grad_norm": 0.8776927085638933, "learning_rate": 2.0184582393359253e-06, "loss": 0.1492, "loss_nan_ranks": 0, "loss_rank_avg": 0.15649349987506866, "step": 5800, "valid_targets_mean": 1861.4, "valid_targets_min": 761 }, { "epoch": 6.097689075630252, "grad_norm": 0.8211711286578806, "learning_rate": 1.99558583283066e-06, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.14332887530326843, "step": 5805, "valid_targets_mean": 2022.8, "valid_targets_min": 692 }, { "epoch": 6.102941176470588, "grad_norm": 0.732033944801811, "learning_rate": 1.9728369500569333e-06, "loss": 0.1415, "loss_nan_ranks": 0, "loss_rank_avg": 0.13911320269107819, "step": 5810, "valid_targets_mean": 2577.7, "valid_targets_min": 578 }, { "epoch": 6.108193277310924, "grad_norm": 0.8099862293022083, "learning_rate": 1.950211747089077e-06, "loss": 0.1567, "loss_nan_ranks": 0, "loss_rank_avg": 0.14890515804290771, "step": 5815, "valid_targets_mean": 2239.7, "valid_targets_min": 705 }, { "epoch": 6.11344537815126, "grad_norm": 0.8280954650156288, "learning_rate": 1.927710379152881e-06, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.15409252047538757, "step": 5820, "valid_targets_mean": 2037.0, "valid_targets_min": 605 }, { "epoch": 6.118697478991597, "grad_norm": 0.7720826623857413, "learning_rate": 1.9053330006245452e-06, "loss": 0.1487, "loss_nan_ranks": 0, "loss_rank_avg": 0.1435692012310028, "step": 5825, "valid_targets_mean": 2505.6, "valid_targets_min": 810 }, { "epoch": 6.123949579831933, "grad_norm": 0.8602830964405195, "learning_rate": 1.8830797650296006e-06, "loss": 0.1536, "loss_nan_ranks": 0, "loss_rank_avg": 0.15629276633262634, "step": 5830, "valid_targets_mean": 1843.5, "valid_targets_min": 807 }, { "epoch": 6.129201680672269, "grad_norm": 0.7886878487521178, "learning_rate": 1.8609508250418628e-06, "loss": 0.163, "loss_nan_ranks": 0, "loss_rank_avg": 0.17373371124267578, "step": 5835, "valid_targets_mean": 2652.3, "valid_targets_min": 1395 }, { "epoch": 6.1344537815126055, "grad_norm": 0.8219543982430842, "learning_rate": 1.8389463324823986e-06, "loss": 0.1471, "loss_nan_ranks": 0, "loss_rank_avg": 0.14603424072265625, "step": 5840, "valid_targets_mean": 2208.8, "valid_targets_min": 859 }, { "epoch": 6.139705882352941, "grad_norm": 0.8240205796466581, "learning_rate": 1.81706643831846e-06, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.1447804570198059, "step": 5845, "valid_targets_mean": 2197.1, "valid_targets_min": 787 }, { "epoch": 6.144957983193278, "grad_norm": 0.7863349767944662, "learning_rate": 1.7953112926624715e-06, "loss": 0.1574, "loss_nan_ranks": 0, "loss_rank_avg": 0.14369264245033264, "step": 5850, "valid_targets_mean": 2488.8, "valid_targets_min": 875 }, { "epoch": 6.150210084033613, "grad_norm": 0.7481918069687116, "learning_rate": 1.7736810447709852e-06, "loss": 0.1404, "loss_nan_ranks": 0, "loss_rank_avg": 0.14041663706302643, "step": 5855, "valid_targets_mean": 2419.5, "valid_targets_min": 631 }, { "epoch": 6.15546218487395, "grad_norm": 0.7548879647168044, "learning_rate": 1.7521758430436553e-06, "loss": 0.1568, "loss_nan_ranks": 0, "loss_rank_avg": 0.15782803297042847, "step": 5860, "valid_targets_mean": 2704.7, "valid_targets_min": 768 }, { "epoch": 6.160714285714286, "grad_norm": 0.8818736318364171, "learning_rate": 1.7307958350222366e-06, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.1596248298883438, "step": 5865, "valid_targets_mean": 2219.8, "valid_targets_min": 836 }, { "epoch": 6.165966386554622, "grad_norm": 0.8306669309571554, "learning_rate": 1.7095411673895545e-06, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.16560135781764984, "step": 5870, "valid_targets_mean": 2339.6, "valid_targets_min": 672 }, { "epoch": 6.171218487394958, "grad_norm": 0.7839020315929305, "learning_rate": 1.6884119859685034e-06, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.16316699981689453, "step": 5875, "valid_targets_mean": 2607.8, "valid_targets_min": 644 }, { "epoch": 6.176470588235294, "grad_norm": 0.7562882938551625, "learning_rate": 1.6674084357210562e-06, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.1440119594335556, "step": 5880, "valid_targets_mean": 2218.6, "valid_targets_min": 801 }, { "epoch": 6.18172268907563, "grad_norm": 0.7626842826181003, "learning_rate": 1.6465306607472608e-06, "loss": 0.1489, "loss_nan_ranks": 0, "loss_rank_avg": 0.13738971948623657, "step": 5885, "valid_targets_mean": 2323.1, "valid_targets_min": 917 }, { "epoch": 6.186974789915967, "grad_norm": 0.7942359627663949, "learning_rate": 1.625778804284246e-06, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.14948052167892456, "step": 5890, "valid_targets_mean": 2511.6, "valid_targets_min": 743 }, { "epoch": 6.192226890756302, "grad_norm": 0.8431028429315225, "learning_rate": 1.6051530087052558e-06, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.15867841243743896, "step": 5895, "valid_targets_mean": 2291.1, "valid_targets_min": 940 }, { "epoch": 6.197478991596639, "grad_norm": 0.8666438002772852, "learning_rate": 1.5846534155186511e-06, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.14912620186805725, "step": 5900, "valid_targets_mean": 1881.3, "valid_targets_min": 680 }, { "epoch": 6.2027310924369745, "grad_norm": 0.8110997063724646, "learning_rate": 1.564280165366956e-06, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.1503579318523407, "step": 5905, "valid_targets_mean": 2042.6, "valid_targets_min": 614 }, { "epoch": 6.207983193277311, "grad_norm": 0.7289206797878542, "learning_rate": 1.544033398025886e-06, "loss": 0.153, "loss_nan_ranks": 0, "loss_rank_avg": 0.15290409326553345, "step": 5910, "valid_targets_mean": 2841.8, "valid_targets_min": 650 }, { "epoch": 6.213235294117647, "grad_norm": 0.8826762189160628, "learning_rate": 1.5239132524033951e-06, "loss": 0.1446, "loss_nan_ranks": 0, "loss_rank_avg": 0.15168313682079315, "step": 5915, "valid_targets_mean": 2273.7, "valid_targets_min": 867 }, { "epoch": 6.218487394957983, "grad_norm": 0.6729261276809203, "learning_rate": 1.50391986653871e-06, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.1368652582168579, "step": 5920, "valid_targets_mean": 3169.6, "valid_targets_min": 790 }, { "epoch": 6.223739495798319, "grad_norm": 0.7965190893498632, "learning_rate": 1.4840533776013954e-06, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.1640886664390564, "step": 5925, "valid_targets_mean": 2498.8, "valid_targets_min": 625 }, { "epoch": 6.2289915966386555, "grad_norm": 0.7757965453046244, "learning_rate": 1.4643139218904035e-06, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.14865760505199432, "step": 5930, "valid_targets_mean": 2731.4, "valid_targets_min": 698 }, { "epoch": 6.234243697478991, "grad_norm": 0.7962903371122022, "learning_rate": 1.4447016348331477e-06, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.13591375946998596, "step": 5935, "valid_targets_mean": 2047.8, "valid_targets_min": 781 }, { "epoch": 6.239495798319328, "grad_norm": 0.7557635968086313, "learning_rate": 1.4252166509845777e-06, "loss": 0.1585, "loss_nan_ranks": 0, "loss_rank_avg": 0.15759332478046417, "step": 5940, "valid_targets_mean": 2775.9, "valid_targets_min": 875 }, { "epoch": 6.244747899159663, "grad_norm": 0.7204075261247243, "learning_rate": 1.4058591040262259e-06, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.14412742853164673, "step": 5945, "valid_targets_mean": 2885.9, "valid_targets_min": 632 }, { "epoch": 6.25, "grad_norm": 0.7821960625396808, "learning_rate": 1.3866291267653309e-06, "loss": 0.1514, "loss_nan_ranks": 0, "loss_rank_avg": 0.15519963204860687, "step": 5950, "valid_targets_mean": 2386.9, "valid_targets_min": 917 }, { "epoch": 6.255252100840336, "grad_norm": 0.7211652670433405, "learning_rate": 1.3675268511339067e-06, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.14521880447864532, "step": 5955, "valid_targets_mean": 2996.6, "valid_targets_min": 684 }, { "epoch": 6.260504201680672, "grad_norm": 0.8118712246185013, "learning_rate": 1.3485524081878288e-06, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.16166505217552185, "step": 5960, "valid_targets_mean": 2691.8, "valid_targets_min": 937 }, { "epoch": 6.265756302521009, "grad_norm": 0.859100591202131, "learning_rate": 1.3297059281059533e-06, "loss": 0.1561, "loss_nan_ranks": 0, "loss_rank_avg": 0.1694069802761078, "step": 5965, "valid_targets_mean": 2484.4, "valid_targets_min": 734 }, { "epoch": 6.2710084033613445, "grad_norm": 0.6880675870848753, "learning_rate": 1.3109875401892146e-06, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.13731975853443146, "step": 5970, "valid_targets_mean": 3048.2, "valid_targets_min": 728 }, { "epoch": 6.276260504201681, "grad_norm": 0.78207546197356, "learning_rate": 1.2923973728597373e-06, "loss": 0.1425, "loss_nan_ranks": 0, "loss_rank_avg": 0.13927319645881653, "step": 5975, "valid_targets_mean": 2147.8, "valid_targets_min": 725 }, { "epoch": 6.281512605042017, "grad_norm": 0.9014126476888846, "learning_rate": 1.2739355536599508e-06, "loss": 0.1429, "loss_nan_ranks": 0, "loss_rank_avg": 0.1446988582611084, "step": 5980, "valid_targets_mean": 1929.1, "valid_targets_min": 627 }, { "epoch": 6.286764705882353, "grad_norm": 0.7420292923016639, "learning_rate": 1.2556022092517362e-06, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.14270836114883423, "step": 5985, "valid_targets_mean": 2397.7, "valid_targets_min": 966 }, { "epoch": 6.292016806722689, "grad_norm": 0.7955077467970862, "learning_rate": 1.237397465415524e-06, "loss": 0.1453, "loss_nan_ranks": 0, "loss_rank_avg": 0.1445448398590088, "step": 5990, "valid_targets_mean": 2025.7, "valid_targets_min": 620 }, { "epoch": 6.2972689075630255, "grad_norm": 0.8287126470993438, "learning_rate": 1.2193214470494664e-06, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.1324065625667572, "step": 5995, "valid_targets_mean": 1985.8, "valid_targets_min": 867 }, { "epoch": 6.302521008403361, "grad_norm": 0.7561550704661556, "learning_rate": 1.201374278168541e-06, "loss": 0.1452, "loss_nan_ranks": 0, "loss_rank_avg": 0.15818336606025696, "step": 6000, "valid_targets_mean": 2369.2, "valid_targets_min": 806 }, { "epoch": 6.307773109243698, "grad_norm": 0.7629710579022473, "learning_rate": 1.1835560819037429e-06, "loss": 0.1427, "loss_nan_ranks": 0, "loss_rank_avg": 0.12634852528572083, "step": 6005, "valid_targets_mean": 2487.6, "valid_targets_min": 870 }, { "epoch": 6.313025210084033, "grad_norm": 0.8264383119430665, "learning_rate": 1.1658669805012112e-06, "loss": 0.144, "loss_nan_ranks": 0, "loss_rank_avg": 0.14036674797534943, "step": 6010, "valid_targets_mean": 1953.5, "valid_targets_min": 639 }, { "epoch": 6.31827731092437, "grad_norm": 0.8768123841384081, "learning_rate": 1.1483070953213904e-06, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.1594979465007782, "step": 6015, "valid_targets_mean": 2033.9, "valid_targets_min": 734 }, { "epoch": 6.323529411764706, "grad_norm": 0.8008028472783635, "learning_rate": 1.130876546838211e-06, "loss": 0.1592, "loss_nan_ranks": 0, "loss_rank_avg": 0.16434642672538757, "step": 6020, "valid_targets_mean": 2647.7, "valid_targets_min": 1279 }, { "epoch": 6.328781512605042, "grad_norm": 0.778716540961378, "learning_rate": 1.1135754546382627e-06, "loss": 0.1439, "loss_nan_ranks": 0, "loss_rank_avg": 0.15541379153728485, "step": 6025, "valid_targets_mean": 2563.2, "valid_targets_min": 700 }, { "epoch": 6.334033613445378, "grad_norm": 0.7658767727670047, "learning_rate": 1.0964039374199564e-06, "loss": 0.1476, "loss_nan_ranks": 0, "loss_rank_avg": 0.14019645750522614, "step": 6030, "valid_targets_mean": 2198.1, "valid_targets_min": 742 }, { "epoch": 6.339285714285714, "grad_norm": 0.7848881321896162, "learning_rate": 1.07936211299273e-06, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.15517699718475342, "step": 6035, "valid_targets_mean": 2547.2, "valid_targets_min": 825 }, { "epoch": 6.34453781512605, "grad_norm": 1.1562955954823186, "learning_rate": 1.0624500982762376e-06, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.1641463041305542, "step": 6040, "valid_targets_mean": 2856.1, "valid_targets_min": 933 }, { "epoch": 6.349789915966387, "grad_norm": 1.243869663850212, "learning_rate": 1.045668009299523e-06, "loss": 0.1615, "loss_nan_ranks": 0, "loss_rank_avg": 0.1688794195652008, "step": 6045, "valid_targets_mean": 1660.8, "valid_targets_min": 629 }, { "epoch": 6.355042016806722, "grad_norm": 0.9029029473166272, "learning_rate": 1.029015961200266e-06, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.16218698024749756, "step": 6050, "valid_targets_mean": 1781.9, "valid_targets_min": 678 }, { "epoch": 6.360294117647059, "grad_norm": 0.839913681660097, "learning_rate": 1.012494068223946e-06, "loss": 0.1545, "loss_nan_ranks": 0, "loss_rank_avg": 0.14709152281284332, "step": 6055, "valid_targets_mean": 1895.1, "valid_targets_min": 646 }, { "epoch": 6.3655462184873945, "grad_norm": 0.7974623565020086, "learning_rate": 9.961024437230948e-07, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.13561251759529114, "step": 6060, "valid_targets_mean": 2064.5, "valid_targets_min": 612 }, { "epoch": 6.370798319327731, "grad_norm": 0.709502267033278, "learning_rate": 9.798412001565038e-07, "loss": 0.1591, "loss_nan_ranks": 0, "loss_rank_avg": 0.16175958514213562, "step": 6065, "valid_targets_mean": 3175.9, "valid_targets_min": 780 }, { "epoch": 6.376050420168067, "grad_norm": 0.9037744133249849, "learning_rate": 9.63710449088453e-07, "loss": 0.1499, "loss_nan_ranks": 0, "loss_rank_avg": 0.15407252311706543, "step": 6070, "valid_targets_mean": 1908.1, "valid_targets_min": 703 }, { "epoch": 6.381302521008403, "grad_norm": 0.797641245566909, "learning_rate": 9.477103011879408e-07, "loss": 0.1475, "loss_nan_ranks": 0, "loss_rank_avg": 0.15560175478458405, "step": 6075, "valid_targets_mean": 2465.2, "valid_targets_min": 703 }, { "epoch": 6.38655462184874, "grad_norm": 0.7237125765315087, "learning_rate": 9.318408662279399e-07, "loss": 0.1527, "loss_nan_ranks": 0, "loss_rank_avg": 0.14476794004440308, "step": 6080, "valid_targets_mean": 2732.1, "valid_targets_min": 686 }, { "epoch": 6.391806722689076, "grad_norm": 0.7575017424625796, "learning_rate": 9.161022530846253e-07, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.13442182540893555, "step": 6085, "valid_targets_mean": 2915.2, "valid_targets_min": 1127 }, { "epoch": 6.397058823529412, "grad_norm": 0.8267114749782785, "learning_rate": 9.004945697366452e-07, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.14276978373527527, "step": 6090, "valid_targets_mean": 2019.4, "valid_targets_min": 909 }, { "epoch": 6.402310924369748, "grad_norm": 0.7237677872215658, "learning_rate": 8.850179232643641e-07, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.14779332280158997, "step": 6095, "valid_targets_mean": 2826.4, "valid_targets_min": 898 }, { "epoch": 6.407563025210084, "grad_norm": 0.8400966461486415, "learning_rate": 8.696724198491369e-07, "loss": 0.1537, "loss_nan_ranks": 0, "loss_rank_avg": 0.15353678166866302, "step": 6100, "valid_targets_mean": 2215.9, "valid_targets_min": 621 }, { "epoch": 6.41281512605042, "grad_norm": 0.7477003864167849, "learning_rate": 8.544581647725825e-07, "loss": 0.1461, "loss_nan_ranks": 0, "loss_rank_avg": 0.1523742377758026, "step": 6105, "valid_targets_mean": 2844.5, "valid_targets_min": 921 }, { "epoch": 6.418067226890757, "grad_norm": 0.8178307661739669, "learning_rate": 8.393752624158603e-07, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.14179328083992004, "step": 6110, "valid_targets_mean": 1932.0, "valid_targets_min": 740 }, { "epoch": 6.423319327731092, "grad_norm": 0.6634779755671151, "learning_rate": 8.244238162589435e-07, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.14001640677452087, "step": 6115, "valid_targets_mean": 3367.4, "valid_targets_min": 1289 }, { "epoch": 6.428571428571429, "grad_norm": 0.7620021165612041, "learning_rate": 8.096039288799251e-07, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.15005478262901306, "step": 6120, "valid_targets_mean": 2588.8, "valid_targets_min": 725 }, { "epoch": 6.4338235294117645, "grad_norm": 0.7934644918251871, "learning_rate": 7.949157019543064e-07, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.17349065840244293, "step": 6125, "valid_targets_mean": 2498.0, "valid_targets_min": 909 }, { "epoch": 6.439075630252101, "grad_norm": 0.7690205077229771, "learning_rate": 7.803592362542911e-07, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.16106484830379486, "step": 6130, "valid_targets_mean": 2574.9, "valid_targets_min": 1357 }, { "epoch": 6.444327731092437, "grad_norm": 0.8681115870866193, "learning_rate": 7.659346316481086e-07, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.14451289176940918, "step": 6135, "valid_targets_mean": 1931.4, "valid_targets_min": 679 }, { "epoch": 6.449579831932773, "grad_norm": 0.7601643918944068, "learning_rate": 7.516419870993296e-07, "loss": 0.1493, "loss_nan_ranks": 0, "loss_rank_avg": 0.15384207665920258, "step": 6140, "valid_targets_mean": 2423.4, "valid_targets_min": 718 }, { "epoch": 6.454831932773109, "grad_norm": 0.7370958836376663, "learning_rate": 7.374814006661667e-07, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.1404162049293518, "step": 6145, "valid_targets_mean": 2909.4, "valid_targets_min": 692 }, { "epoch": 6.4600840336134455, "grad_norm": 0.8042467319801916, "learning_rate": 7.234529695008241e-07, "loss": 0.1459, "loss_nan_ranks": 0, "loss_rank_avg": 0.15728093683719635, "step": 6150, "valid_targets_mean": 2223.1, "valid_targets_min": 979 }, { "epoch": 6.465336134453781, "grad_norm": 0.7816915471785587, "learning_rate": 7.095567898488175e-07, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.16815775632858276, "step": 6155, "valid_targets_mean": 2402.7, "valid_targets_min": 1133 }, { "epoch": 6.470588235294118, "grad_norm": 0.9016085189910406, "learning_rate": 6.957929570483224e-07, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.16057243943214417, "step": 6160, "valid_targets_mean": 2306.2, "valid_targets_min": 640 }, { "epoch": 6.475840336134453, "grad_norm": 0.7983769298179959, "learning_rate": 6.821615655295155e-07, "loss": 0.1605, "loss_nan_ranks": 0, "loss_rank_avg": 0.16977722942829132, "step": 6165, "valid_targets_mean": 2523.9, "valid_targets_min": 604 }, { "epoch": 6.48109243697479, "grad_norm": 0.8711158720727042, "learning_rate": 6.686627088139253e-07, "loss": 0.1579, "loss_nan_ranks": 0, "loss_rank_avg": 0.17021444439888, "step": 6170, "valid_targets_mean": 2276.9, "valid_targets_min": 618 }, { "epoch": 6.486344537815126, "grad_norm": 0.7653732434373907, "learning_rate": 6.552964795137895e-07, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.16731613874435425, "step": 6175, "valid_targets_mean": 2977.2, "valid_targets_min": 567 }, { "epoch": 6.491596638655462, "grad_norm": 0.7898921304427059, "learning_rate": 6.420629693314317e-07, "loss": 0.148, "loss_nan_ranks": 0, "loss_rank_avg": 0.14303874969482422, "step": 6180, "valid_targets_mean": 2086.4, "valid_targets_min": 722 }, { "epoch": 6.496848739495798, "grad_norm": 0.8022544168817034, "learning_rate": 6.289622690586151e-07, "loss": 0.1472, "loss_nan_ranks": 0, "loss_rank_avg": 0.15002703666687012, "step": 6185, "valid_targets_mean": 2577.0, "valid_targets_min": 967 }, { "epoch": 6.5021008403361344, "grad_norm": 0.7765235327781467, "learning_rate": 6.159944685759289e-07, "loss": 0.1598, "loss_nan_ranks": 0, "loss_rank_avg": 0.1665143221616745, "step": 6190, "valid_targets_mean": 2581.1, "valid_targets_min": 1206 }, { "epoch": 6.507352941176471, "grad_norm": 0.6652766905185039, "learning_rate": 6.031596568521792e-07, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.15390489995479584, "step": 6195, "valid_targets_mean": 3575.8, "valid_targets_min": 936 }, { "epoch": 6.512605042016807, "grad_norm": 0.823897053974955, "learning_rate": 5.904579219437567e-07, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.14515843987464905, "step": 6200, "valid_targets_mean": 2476.0, "valid_targets_min": 897 }, { "epoch": 6.517857142857143, "grad_norm": 0.8693729158649441, "learning_rate": 5.778893509940497e-07, "loss": 0.1456, "loss_nan_ranks": 0, "loss_rank_avg": 0.14359763264656067, "step": 6205, "valid_targets_mean": 1601.5, "valid_targets_min": 715 }, { "epoch": 6.523109243697479, "grad_norm": 0.7360524356141547, "learning_rate": 5.654540302328526e-07, "loss": 0.1464, "loss_nan_ranks": 0, "loss_rank_avg": 0.1544869840145111, "step": 6210, "valid_targets_mean": 3031.3, "valid_targets_min": 868 }, { "epoch": 6.5283613445378155, "grad_norm": 0.8214329921549752, "learning_rate": 5.531520449757465e-07, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.15624156594276428, "step": 6215, "valid_targets_mean": 2231.3, "valid_targets_min": 746 }, { "epoch": 6.533613445378151, "grad_norm": 0.7526069627643952, "learning_rate": 5.409834796235447e-07, "loss": 0.1503, "loss_nan_ranks": 0, "loss_rank_avg": 0.14001137018203735, "step": 6220, "valid_targets_mean": 2640.0, "valid_targets_min": 700 }, { "epoch": 6.538865546218488, "grad_norm": 0.8221429966093985, "learning_rate": 5.28948417661701e-07, "loss": 0.153, "loss_nan_ranks": 0, "loss_rank_avg": 0.1630651354789734, "step": 6225, "valid_targets_mean": 2143.7, "valid_targets_min": 668 }, { "epoch": 6.544117647058823, "grad_norm": 0.8173958277347929, "learning_rate": 5.170469416597223e-07, "loss": 0.1617, "loss_nan_ranks": 0, "loss_rank_avg": 0.14818143844604492, "step": 6230, "valid_targets_mean": 2997.8, "valid_targets_min": 1061 }, { "epoch": 6.54936974789916, "grad_norm": 0.7574217024984009, "learning_rate": 5.05279133270633e-07, "loss": 0.1438, "loss_nan_ranks": 0, "loss_rank_avg": 0.1506175696849823, "step": 6235, "valid_targets_mean": 2813.8, "valid_targets_min": 822 }, { "epoch": 6.554621848739496, "grad_norm": 0.8789551921829356, "learning_rate": 4.936450732303866e-07, "loss": 0.1648, "loss_nan_ranks": 0, "loss_rank_avg": 0.17505599558353424, "step": 6240, "valid_targets_mean": 2185.9, "valid_targets_min": 773 }, { "epoch": 6.559873949579832, "grad_norm": 0.7800209416470806, "learning_rate": 4.821448413573237e-07, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.1431932896375656, "step": 6245, "valid_targets_mean": 2216.9, "valid_targets_min": 759 }, { "epoch": 6.565126050420168, "grad_norm": 0.7715463308797006, "learning_rate": 4.70778516551631e-07, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.15793776512145996, "step": 6250, "valid_targets_mean": 2604.6, "valid_targets_min": 873 }, { "epoch": 6.570378151260504, "grad_norm": 0.7929402427060284, "learning_rate": 4.595461767947829e-07, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.17367711663246155, "step": 6255, "valid_targets_mean": 2793.5, "valid_targets_min": 890 }, { "epoch": 6.57563025210084, "grad_norm": 0.7558379818924563, "learning_rate": 4.484478991490249e-07, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.1597421020269394, "step": 6260, "valid_targets_mean": 2706.1, "valid_targets_min": 680 }, { "epoch": 6.580882352941177, "grad_norm": 0.8203283121654529, "learning_rate": 4.374837597568338e-07, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.13600069284439087, "step": 6265, "valid_targets_mean": 2013.9, "valid_targets_min": 725 }, { "epoch": 6.586134453781512, "grad_norm": 0.7685017317264076, "learning_rate": 4.266538338403936e-07, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.1418771594762802, "step": 6270, "valid_targets_mean": 2087.0, "valid_targets_min": 888 }, { "epoch": 6.591386554621849, "grad_norm": 0.7689705022584826, "learning_rate": 4.159581957010894e-07, "loss": 0.149, "loss_nan_ranks": 0, "loss_rank_avg": 0.15910068154335022, "step": 6275, "valid_targets_mean": 2749.8, "valid_targets_min": 694 }, { "epoch": 6.5966386554621845, "grad_norm": 0.8350274594286426, "learning_rate": 4.0539691871898545e-07, "loss": 0.1635, "loss_nan_ranks": 0, "loss_rank_avg": 0.14839161932468414, "step": 6280, "valid_targets_mean": 2080.6, "valid_targets_min": 941 }, { "epoch": 6.601890756302521, "grad_norm": 0.7123586297209112, "learning_rate": 3.949700753523344e-07, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.14631910622119904, "step": 6285, "valid_targets_mean": 2960.0, "valid_targets_min": 763 }, { "epoch": 6.607142857142857, "grad_norm": 0.7608218792468966, "learning_rate": 3.8467773713707134e-07, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.14922720193862915, "step": 6290, "valid_targets_mean": 2525.2, "valid_targets_min": 1231 }, { "epoch": 6.612394957983193, "grad_norm": 0.781295609634859, "learning_rate": 3.7451997468632486e-07, "loss": 0.142, "loss_nan_ranks": 0, "loss_rank_avg": 0.1524946689605713, "step": 6295, "valid_targets_mean": 2446.9, "valid_targets_min": 692 }, { "epoch": 6.617647058823529, "grad_norm": 1.3621692596047696, "learning_rate": 3.6449685768993327e-07, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.15170569717884064, "step": 6300, "valid_targets_mean": 2007.3, "valid_targets_min": 549 }, { "epoch": 6.6228991596638656, "grad_norm": 0.9081109225494257, "learning_rate": 3.5460845491396944e-07, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.154941126704216, "step": 6305, "valid_targets_mean": 2046.6, "valid_targets_min": 650 }, { "epoch": 6.628151260504202, "grad_norm": 0.7545604154002317, "learning_rate": 3.448548342002589e-07, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.15161868929862976, "step": 6310, "valid_targets_mean": 2837.8, "valid_targets_min": 973 }, { "epoch": 6.633403361344538, "grad_norm": 0.8680496469961246, "learning_rate": 3.352360624659312e-07, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.1834527552127838, "step": 6315, "valid_targets_mean": 2255.1, "valid_targets_min": 744 }, { "epoch": 6.6386554621848735, "grad_norm": 0.7171097775844976, "learning_rate": 3.2575220570294276e-07, "loss": 0.1529, "loss_nan_ranks": 0, "loss_rank_avg": 0.15503129363059998, "step": 6320, "valid_targets_mean": 2962.4, "valid_targets_min": 750 }, { "epoch": 6.64390756302521, "grad_norm": 0.6658600775544034, "learning_rate": 3.164033289776369e-07, "loss": 0.1423, "loss_nan_ranks": 0, "loss_rank_avg": 0.12674590945243835, "step": 6325, "valid_targets_mean": 2999.2, "valid_targets_min": 761 }, { "epoch": 6.649159663865547, "grad_norm": 0.7748035457490327, "learning_rate": 3.071894964302935e-07, "loss": 0.1477, "loss_nan_ranks": 0, "loss_rank_avg": 0.16250720620155334, "step": 6330, "valid_targets_mean": 2583.9, "valid_targets_min": 850 }, { "epoch": 6.654411764705882, "grad_norm": 0.7894017447041788, "learning_rate": 2.981107712746867e-07, "loss": 0.1448, "loss_nan_ranks": 0, "loss_rank_avg": 0.14615963399410248, "step": 6335, "valid_targets_mean": 2359.9, "valid_targets_min": 814 }, { "epoch": 6.659663865546219, "grad_norm": 0.7275796769976358, "learning_rate": 2.891672157976522e-07, "loss": 0.1389, "loss_nan_ranks": 0, "loss_rank_avg": 0.1456836611032486, "step": 6340, "valid_targets_mean": 2687.1, "valid_targets_min": 726 }, { "epoch": 6.6649159663865545, "grad_norm": 0.7464610444598423, "learning_rate": 2.803588913586608e-07, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.15692494809627533, "step": 6345, "valid_targets_mean": 2862.6, "valid_targets_min": 1185 }, { "epoch": 6.670168067226891, "grad_norm": 0.7409587755798085, "learning_rate": 2.716858583894033e-07, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.14683926105499268, "step": 6350, "valid_targets_mean": 2565.6, "valid_targets_min": 1187 }, { "epoch": 6.675420168067227, "grad_norm": 0.8489660086658728, "learning_rate": 2.6314817639335964e-07, "loss": 0.1486, "loss_nan_ranks": 0, "loss_rank_avg": 0.14783814549446106, "step": 6355, "valid_targets_mean": 2178.1, "valid_targets_min": 1163 }, { "epoch": 6.680672268907563, "grad_norm": 0.7446724408854097, "learning_rate": 2.547459039454103e-07, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.13613933324813843, "step": 6360, "valid_targets_mean": 2619.4, "valid_targets_min": 776 }, { "epoch": 6.685924369747899, "grad_norm": 0.7468301149926823, "learning_rate": 2.4647909869142117e-07, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.15531302988529205, "step": 6365, "valid_targets_mean": 2749.7, "valid_targets_min": 788 }, { "epoch": 6.6911764705882355, "grad_norm": 0.8038823609900482, "learning_rate": 2.3834781734784817e-07, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.14846262335777283, "step": 6370, "valid_targets_mean": 2125.0, "valid_targets_min": 852 }, { "epoch": 6.696428571428571, "grad_norm": 0.7769587079233549, "learning_rate": 2.3035211570135995e-07, "loss": 0.1528, "loss_nan_ranks": 0, "loss_rank_avg": 0.1341462880373001, "step": 6375, "valid_targets_mean": 1821.1, "valid_targets_min": 958 }, { "epoch": 6.701680672268908, "grad_norm": 0.7298168762864212, "learning_rate": 2.224920486084403e-07, "loss": 0.1586, "loss_nan_ranks": 0, "loss_rank_avg": 0.15344950556755066, "step": 6380, "valid_targets_mean": 2839.2, "valid_targets_min": 1147 }, { "epoch": 6.706932773109243, "grad_norm": 0.778338115342936, "learning_rate": 2.1476766999502408e-07, "loss": 0.1428, "loss_nan_ranks": 0, "loss_rank_avg": 0.13469842076301575, "step": 6385, "valid_targets_mean": 2178.6, "valid_targets_min": 776 }, { "epoch": 6.71218487394958, "grad_norm": 0.816451492189734, "learning_rate": 2.071790328561152e-07, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.15425826609134674, "step": 6390, "valid_targets_mean": 2324.4, "valid_targets_min": 841 }, { "epoch": 6.717436974789916, "grad_norm": 0.8201419970370695, "learning_rate": 1.997261892554403e-07, "loss": 0.1563, "loss_nan_ranks": 0, "loss_rank_avg": 0.15658767521381378, "step": 6395, "valid_targets_mean": 2310.4, "valid_targets_min": 912 }, { "epoch": 6.722689075630252, "grad_norm": 0.7500376618247141, "learning_rate": 1.9240919032506688e-07, "loss": 0.147, "loss_nan_ranks": 0, "loss_rank_avg": 0.14455173909664154, "step": 6400, "valid_targets_mean": 2628.5, "valid_targets_min": 474 }, { "epoch": 6.727941176470588, "grad_norm": 0.7584572682030627, "learning_rate": 1.8522808626507683e-07, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.15599125623703003, "step": 6405, "valid_targets_mean": 2658.8, "valid_targets_min": 420 }, { "epoch": 6.733193277310924, "grad_norm": 0.7357895023796207, "learning_rate": 1.781829263432111e-07, "loss": 0.1594, "loss_nan_ranks": 0, "loss_rank_avg": 0.14581039547920227, "step": 6410, "valid_targets_mean": 2959.5, "valid_targets_min": 713 }, { "epoch": 6.73844537815126, "grad_norm": 0.6891830564600709, "learning_rate": 1.7127375889452569e-07, "loss": 0.1528, "loss_nan_ranks": 0, "loss_rank_avg": 0.13923324644565582, "step": 6415, "valid_targets_mean": 2834.0, "valid_targets_min": 1194 }, { "epoch": 6.743697478991597, "grad_norm": 0.7199729752533398, "learning_rate": 1.6450063132107396e-07, "loss": 0.1479, "loss_nan_ranks": 0, "loss_rank_avg": 0.1373451054096222, "step": 6420, "valid_targets_mean": 2572.8, "valid_targets_min": 626 }, { "epoch": 6.748949579831933, "grad_norm": 0.7647019920185888, "learning_rate": 1.5786359009156928e-07, "loss": 0.1433, "loss_nan_ranks": 0, "loss_rank_avg": 0.15924891829490662, "step": 6425, "valid_targets_mean": 2990.7, "valid_targets_min": 793 }, { "epoch": 6.754201680672269, "grad_norm": 0.8310727483362449, "learning_rate": 1.5136268074107398e-07, "loss": 0.157, "loss_nan_ranks": 0, "loss_rank_avg": 0.1688929796218872, "step": 6430, "valid_targets_mean": 2370.5, "valid_targets_min": 738 }, { "epoch": 6.759453781512605, "grad_norm": 0.825061605955483, "learning_rate": 1.44997947870682e-07, "loss": 0.1639, "loss_nan_ranks": 0, "loss_rank_avg": 0.16266357898712158, "step": 6435, "valid_targets_mean": 2281.9, "valid_targets_min": 1074 }, { "epoch": 6.764705882352941, "grad_norm": 0.8533595418248784, "learning_rate": 1.3876943514721465e-07, "loss": 0.1525, "loss_nan_ranks": 0, "loss_rank_avg": 0.16743487119674683, "step": 6440, "valid_targets_mean": 2262.5, "valid_targets_min": 970 }, { "epoch": 6.769957983193278, "grad_norm": 0.7748683785377023, "learning_rate": 1.3267718530292296e-07, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.14080220460891724, "step": 6445, "valid_targets_mean": 2343.4, "valid_targets_min": 738 }, { "epoch": 6.775210084033613, "grad_norm": 0.8320606022762239, "learning_rate": 1.267212401351925e-07, "loss": 0.16, "loss_nan_ranks": 0, "loss_rank_avg": 0.1550496518611908, "step": 6450, "valid_targets_mean": 2402.6, "valid_targets_min": 857 }, { "epoch": 6.78046218487395, "grad_norm": 0.7474317684737926, "learning_rate": 1.2090164050625907e-07, "loss": 0.1736, "loss_nan_ranks": 0, "loss_rank_avg": 0.16620126366615295, "step": 6455, "valid_targets_mean": 3082.7, "valid_targets_min": 658 }, { "epoch": 6.785714285714286, "grad_norm": 0.9565980511087515, "learning_rate": 1.1521842634292013e-07, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.160188689827919, "step": 6460, "valid_targets_mean": 1479.5, "valid_targets_min": 642 }, { "epoch": 6.790966386554622, "grad_norm": 0.8532947647691757, "learning_rate": 1.0967163663627044e-07, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.15419529378414154, "step": 6465, "valid_targets_mean": 2052.6, "valid_targets_min": 642 }, { "epoch": 6.796218487394958, "grad_norm": 0.8255781206219238, "learning_rate": 1.0426130944143353e-07, "loss": 0.151, "loss_nan_ranks": 0, "loss_rank_avg": 0.14306730031967163, "step": 6470, "valid_targets_mean": 1963.2, "valid_targets_min": 830 }, { "epoch": 6.801470588235294, "grad_norm": 0.8837049669576724, "learning_rate": 9.898748187729513e-08, "loss": 0.1549, "loss_nan_ranks": 0, "loss_rank_avg": 0.15094450116157532, "step": 6475, "valid_targets_mean": 2181.6, "valid_targets_min": 919 }, { "epoch": 6.80672268907563, "grad_norm": 0.7790666833598698, "learning_rate": 9.385019012625007e-08, "loss": 0.1469, "loss_nan_ranks": 0, "loss_rank_avg": 0.14933770895004272, "step": 6480, "valid_targets_mean": 2469.9, "valid_targets_min": 1015 }, { "epoch": 6.811974789915967, "grad_norm": 0.9087222050552412, "learning_rate": 8.884946943395811e-08, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.16928185522556305, "step": 6485, "valid_targets_mean": 1823.7, "valid_targets_min": 808 }, { "epoch": 6.817226890756302, "grad_norm": 0.7419966743487549, "learning_rate": 8.398535410910402e-08, "loss": 0.161, "loss_nan_ranks": 0, "loss_rank_avg": 0.16752246022224426, "step": 6490, "valid_targets_mean": 3067.3, "valid_targets_min": 796 }, { "epoch": 6.822478991596639, "grad_norm": 0.7768443736140654, "learning_rate": 7.925787752314674e-08, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.14006970822811127, "step": 6495, "valid_targets_mean": 2286.3, "valid_targets_min": 837 }, { "epoch": 6.8277310924369745, "grad_norm": 0.7839422460590042, "learning_rate": 7.466707211010838e-08, "loss": 0.1526, "loss_nan_ranks": 0, "loss_rank_avg": 0.15227356553077698, "step": 6500, "valid_targets_mean": 2435.8, "valid_targets_min": 794 }, { "epoch": 6.832983193277311, "grad_norm": 0.8085913813487312, "learning_rate": 7.02129693663478e-08, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.14806930720806122, "step": 6505, "valid_targets_mean": 2763.4, "valid_targets_min": 809 }, { "epoch": 6.838235294117647, "grad_norm": 0.830479023779582, "learning_rate": 6.589559985033189e-08, "loss": 0.1577, "loss_nan_ranks": 0, "loss_rank_avg": 0.15857365727424622, "step": 6510, "valid_targets_mean": 2199.1, "valid_targets_min": 697 }, { "epoch": 6.843487394957983, "grad_norm": 0.7805037615428879, "learning_rate": 6.171499318244234e-08, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.1644633412361145, "step": 6515, "valid_targets_mean": 2826.9, "valid_targets_min": 1091 }, { "epoch": 6.848739495798319, "grad_norm": 0.8243868421023237, "learning_rate": 5.767117804476696e-08, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.1619555652141571, "step": 6520, "valid_targets_mean": 2291.1, "valid_targets_min": 785 }, { "epoch": 6.8539915966386555, "grad_norm": 0.6718196143534856, "learning_rate": 5.376418218089541e-08, "loss": 0.1468, "loss_nan_ranks": 0, "loss_rank_avg": 0.1486797034740448, "step": 6525, "valid_targets_mean": 3316.1, "valid_targets_min": 645 }, { "epoch": 6.859243697478991, "grad_norm": 0.7639600711267872, "learning_rate": 4.99940323957393e-08, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.15114453434944153, "step": 6530, "valid_targets_mean": 2355.1, "valid_targets_min": 930 }, { "epoch": 6.864495798319328, "grad_norm": 0.7434040074285687, "learning_rate": 4.63607545553435e-08, "loss": 0.1491, "loss_nan_ranks": 0, "loss_rank_avg": 0.16190582513809204, "step": 6535, "valid_targets_mean": 2631.9, "valid_targets_min": 997 }, { "epoch": 6.869747899159664, "grad_norm": 0.7576726635038536, "learning_rate": 4.2864373586706254e-08, "loss": 0.1539, "loss_nan_ranks": 0, "loss_rank_avg": 0.1667475700378418, "step": 6540, "valid_targets_mean": 3037.7, "valid_targets_min": 1256 }, { "epoch": 6.875, "grad_norm": 0.7949042840267881, "learning_rate": 3.950491347761487e-08, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.15799729526042938, "step": 6545, "valid_targets_mean": 2813.3, "valid_targets_min": 981 }, { "epoch": 6.880252100840336, "grad_norm": 0.7599470557620672, "learning_rate": 3.628239727647254e-08, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.14834260940551758, "step": 6550, "valid_targets_mean": 2786.1, "valid_targets_min": 551 }, { "epoch": 6.885504201680672, "grad_norm": 0.7438096344765326, "learning_rate": 3.319684709215176e-08, "loss": 0.1488, "loss_nan_ranks": 0, "loss_rank_avg": 0.1484309434890747, "step": 6555, "valid_targets_mean": 2842.8, "valid_targets_min": 675 }, { "epoch": 6.890756302521009, "grad_norm": 0.8034592781374419, "learning_rate": 3.024828409383007e-08, "loss": 0.1601, "loss_nan_ranks": 0, "loss_rank_avg": 0.1651192605495453, "step": 6560, "valid_targets_mean": 2401.8, "valid_targets_min": 1118 }, { "epoch": 6.8960084033613445, "grad_norm": 0.7481979263488755, "learning_rate": 2.743672851085233e-08, "loss": 0.1447, "loss_nan_ranks": 0, "loss_rank_avg": 0.13949503004550934, "step": 6565, "valid_targets_mean": 2675.6, "valid_targets_min": 799 }, { "epoch": 6.901260504201681, "grad_norm": 0.8092072610442079, "learning_rate": 2.4762199632588634e-08, "loss": 0.1466, "loss_nan_ranks": 0, "loss_rank_avg": 0.17036761343479156, "step": 6570, "valid_targets_mean": 2485.1, "valid_targets_min": 909 }, { "epoch": 6.906512605042017, "grad_norm": 0.8049873065525076, "learning_rate": 2.2224715808309983e-08, "loss": 0.156, "loss_nan_ranks": 0, "loss_rank_avg": 0.15256905555725098, "step": 6575, "valid_targets_mean": 2644.2, "valid_targets_min": 814 }, { "epoch": 6.911764705882353, "grad_norm": 0.8617962635473019, "learning_rate": 1.9824294447043923e-08, "loss": 0.1571, "loss_nan_ranks": 0, "loss_rank_avg": 0.15142729878425598, "step": 6580, "valid_targets_mean": 2083.2, "valid_targets_min": 512 }, { "epoch": 6.917016806722689, "grad_norm": 0.8008776691217604, "learning_rate": 1.7560952017481313e-08, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.1459037810564041, "step": 6585, "valid_targets_mean": 2554.2, "valid_targets_min": 952 }, { "epoch": 6.9222689075630255, "grad_norm": 0.7191951703364022, "learning_rate": 1.5434704047836424e-08, "loss": 0.1475, "loss_nan_ranks": 0, "loss_rank_avg": 0.145742267370224, "step": 6590, "valid_targets_mean": 2792.4, "valid_targets_min": 651 }, { "epoch": 6.927521008403361, "grad_norm": 0.7871859947545846, "learning_rate": 1.344556512576256e-08, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.1482214331626892, "step": 6595, "valid_targets_mean": 2457.0, "valid_targets_min": 700 }, { "epoch": 6.932773109243698, "grad_norm": 0.7643202727978451, "learning_rate": 1.1593548898236606e-08, "loss": 0.162, "loss_nan_ranks": 0, "loss_rank_avg": 0.15590517222881317, "step": 6600, "valid_targets_mean": 2423.8, "valid_targets_min": 791 }, { "epoch": 6.938025210084033, "grad_norm": 0.8242802199893152, "learning_rate": 9.878668071474639e-09, "loss": 0.1556, "loss_nan_ranks": 0, "loss_rank_avg": 0.1575925648212433, "step": 6605, "valid_targets_mean": 2134.1, "valid_targets_min": 719 }, { "epoch": 6.94327731092437, "grad_norm": 0.7939290019589629, "learning_rate": 8.3009344108409e-09, "loss": 0.1626, "loss_nan_ranks": 0, "loss_rank_avg": 0.1599077582359314, "step": 6610, "valid_targets_mean": 2462.1, "valid_targets_min": 1122 }, { "epoch": 6.948529411764706, "grad_norm": 0.8359337734301073, "learning_rate": 6.860358740763406e-09, "loss": 0.1607, "loss_nan_ranks": 0, "loss_rank_avg": 0.15786179900169373, "step": 6615, "valid_targets_mean": 2346.8, "valid_targets_min": 628 }, { "epoch": 6.953781512605042, "grad_norm": 0.8230966514103626, "learning_rate": 5.55695094467179e-09, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.15767702460289001, "step": 6620, "valid_targets_mean": 2301.7, "valid_targets_min": 667 }, { "epoch": 6.959033613445378, "grad_norm": 0.8839955512653498, "learning_rate": 4.3907199649151355e-09, "loss": 0.1555, "loss_nan_ranks": 0, "loss_rank_avg": 0.14466795325279236, "step": 6625, "valid_targets_mean": 1904.7, "valid_targets_min": 721 }, { "epoch": 6.964285714285714, "grad_norm": 0.7315947556803873, "learning_rate": 3.361673802708687e-09, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.1519755721092224, "step": 6630, "valid_targets_mean": 2944.4, "valid_targets_min": 659 }, { "epoch": 6.96953781512605, "grad_norm": 0.9022304224894817, "learning_rate": 2.469819518080563e-09, "loss": 0.1613, "loss_nan_ranks": 0, "loss_rank_avg": 0.1760965883731842, "step": 6635, "valid_targets_mean": 2122.0, "valid_targets_min": 750 }, { "epoch": 6.974789915966387, "grad_norm": 0.9761476002877811, "learning_rate": 1.7151632298140209e-09, "loss": 0.1531, "loss_nan_ranks": 0, "loss_rank_avg": 0.14784833788871765, "step": 6640, "valid_targets_mean": 2816.7, "valid_targets_min": 1127 }, { "epoch": 6.980042016806722, "grad_norm": 0.7716322233500594, "learning_rate": 1.0977101154163727e-09, "loss": 0.1524, "loss_nan_ranks": 0, "loss_rank_avg": 0.155085951089859, "step": 6645, "valid_targets_mean": 2472.3, "valid_targets_min": 1348 }, { "epoch": 6.985294117647059, "grad_norm": 0.8463421638101505, "learning_rate": 6.174644110767958e-10, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.16529741883277893, "step": 6650, "valid_targets_mean": 2150.7, "valid_targets_min": 842 }, { "epoch": 6.990546218487395, "grad_norm": 0.7405547503921337, "learning_rate": 2.744294116419077e-10, "loss": 0.146, "loss_nan_ranks": 0, "loss_rank_avg": 0.13631612062454224, "step": 6655, "valid_targets_mean": 2381.4, "valid_targets_min": 791 }, { "epoch": 6.995798319327731, "grad_norm": 0.8184309324867913, "learning_rate": 6.860747058468064e-11, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.15874159336090088, "step": 6660, "valid_targets_mean": 2120.4, "valid_targets_min": 680 }, { "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.1511024534702301, "step": 6664, "total_flos": 1189037529694208.0, "train_loss": 0.22791378844041926, "train_runtime": 28576.9639, "train_samples_per_second": 3.731, "train_steps_per_second": 0.233, "valid_targets_mean": 3122.5, "valid_targets_min": 647 } ], "logging_steps": 5, "max_steps": 6664, "num_input_tokens_seen": 0, "num_train_epochs": 7, "save_steps": 200, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1189037529694208.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }