{ "best_global_step": null, "best_metric": null, "best_model_checkpoint": null, "epoch": 6.0, "eval_steps": 500, "global_step": 2442, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.012285012285012284, "grad_norm": 20.35053560709185, "learning_rate": 6.530612244897961e-07, "loss": 1.0266, "loss_nan_ranks": 0, "loss_rank_avg": 1.016836166381836, "step": 5, "valid_targets_mean": 1221.5, "valid_targets_min": 648 }, { "epoch": 0.02457002457002457, "grad_norm": 16.603510355056123, "learning_rate": 1.469387755102041e-06, "loss": 0.9886, "loss_nan_ranks": 0, "loss_rank_avg": 0.9607698917388916, "step": 10, "valid_targets_mean": 1451.9, "valid_targets_min": 971 }, { "epoch": 0.036855036855036855, "grad_norm": 16.816054244261874, "learning_rate": 2.285714285714286e-06, "loss": 0.972, "loss_nan_ranks": 0, "loss_rank_avg": 0.965086042881012, "step": 15, "valid_targets_mean": 1169.6, "valid_targets_min": 739 }, { "epoch": 0.04914004914004914, "grad_norm": 10.473733849996067, "learning_rate": 3.1020408163265307e-06, "loss": 0.8641, "loss_nan_ranks": 0, "loss_rank_avg": 0.829804003238678, "step": 20, "valid_targets_mean": 1340.2, "valid_targets_min": 853 }, { "epoch": 0.06142506142506143, "grad_norm": 6.719886648102692, "learning_rate": 3.9183673469387755e-06, "loss": 0.779, "loss_nan_ranks": 0, "loss_rank_avg": 0.7282828092575073, "step": 25, "valid_targets_mean": 1187.4, "valid_targets_min": 699 }, { "epoch": 0.07371007371007371, "grad_norm": 4.642242575672464, "learning_rate": 4.734693877551021e-06, "loss": 0.6757, "loss_nan_ranks": 0, "loss_rank_avg": 0.6520389914512634, "step": 30, "valid_targets_mean": 1321.6, "valid_targets_min": 568 }, { "epoch": 0.085995085995086, "grad_norm": 2.7965705811975607, "learning_rate": 5.551020408163266e-06, "loss": 0.6122, "loss_nan_ranks": 0, "loss_rank_avg": 0.5742930173873901, "step": 35, "valid_targets_mean": 1361.1, "valid_targets_min": 654 }, { "epoch": 0.09828009828009827, "grad_norm": 1.9647310620540863, "learning_rate": 6.36734693877551e-06, "loss": 0.5417, "loss_nan_ranks": 0, "loss_rank_avg": 0.5204732418060303, "step": 40, "valid_targets_mean": 1321.1, "valid_targets_min": 574 }, { "epoch": 0.11056511056511056, "grad_norm": 1.6336158421098663, "learning_rate": 7.183673469387755e-06, "loss": 0.4913, "loss_nan_ranks": 0, "loss_rank_avg": 0.48145467042922974, "step": 45, "valid_targets_mean": 1290.8, "valid_targets_min": 531 }, { "epoch": 0.12285012285012285, "grad_norm": 1.6098593343945324, "learning_rate": 8.000000000000001e-06, "loss": 0.4652, "loss_nan_ranks": 0, "loss_rank_avg": 0.45056235790252686, "step": 50, "valid_targets_mean": 1294.9, "valid_targets_min": 783 }, { "epoch": 0.13513513513513514, "grad_norm": 1.487675000715524, "learning_rate": 8.816326530612247e-06, "loss": 0.4215, "loss_nan_ranks": 0, "loss_rank_avg": 0.41585201025009155, "step": 55, "valid_targets_mean": 1332.2, "valid_targets_min": 794 }, { "epoch": 0.14742014742014742, "grad_norm": 1.5044656855552325, "learning_rate": 9.63265306122449e-06, "loss": 0.4064, "loss_nan_ranks": 0, "loss_rank_avg": 0.3813883662223816, "step": 60, "valid_targets_mean": 1311.1, "valid_targets_min": 693 }, { "epoch": 0.1597051597051597, "grad_norm": 1.3262454599596, "learning_rate": 1.0448979591836737e-05, "loss": 0.3753, "loss_nan_ranks": 0, "loss_rank_avg": 0.36576443910598755, "step": 65, "valid_targets_mean": 1226.4, "valid_targets_min": 624 }, { "epoch": 0.171990171990172, "grad_norm": 1.1566857700781938, "learning_rate": 1.126530612244898e-05, "loss": 0.372, "loss_nan_ranks": 0, "loss_rank_avg": 0.37514474987983704, "step": 70, "valid_targets_mean": 1539.2, "valid_targets_min": 768 }, { "epoch": 0.18427518427518427, "grad_norm": 1.2676859471136912, "learning_rate": 1.2081632653061225e-05, "loss": 0.3477, "loss_nan_ranks": 0, "loss_rank_avg": 0.33851388096809387, "step": 75, "valid_targets_mean": 1114.2, "valid_targets_min": 661 }, { "epoch": 0.19656019656019655, "grad_norm": 1.3741420718567798, "learning_rate": 1.2897959183673469e-05, "loss": 0.3266, "loss_nan_ranks": 0, "loss_rank_avg": 0.3353644013404846, "step": 80, "valid_targets_mean": 1143.4, "valid_targets_min": 712 }, { "epoch": 0.20884520884520885, "grad_norm": 1.107327074899049, "learning_rate": 1.3714285714285716e-05, "loss": 0.3201, "loss_nan_ranks": 0, "loss_rank_avg": 0.31138500571250916, "step": 85, "valid_targets_mean": 1249.1, "valid_targets_min": 590 }, { "epoch": 0.22113022113022113, "grad_norm": 1.2916481544068563, "learning_rate": 1.4530612244897961e-05, "loss": 0.3025, "loss_nan_ranks": 0, "loss_rank_avg": 0.30402475595474243, "step": 90, "valid_targets_mean": 1252.0, "valid_targets_min": 649 }, { "epoch": 0.2334152334152334, "grad_norm": 1.2219729652086049, "learning_rate": 1.5346938775510204e-05, "loss": 0.3136, "loss_nan_ranks": 0, "loss_rank_avg": 0.31273770332336426, "step": 95, "valid_targets_mean": 1185.1, "valid_targets_min": 631 }, { "epoch": 0.2457002457002457, "grad_norm": 1.0254894202707463, "learning_rate": 1.616326530612245e-05, "loss": 0.3132, "loss_nan_ranks": 0, "loss_rank_avg": 0.2911428213119507, "step": 100, "valid_targets_mean": 1281.2, "valid_targets_min": 940 }, { "epoch": 0.257985257985258, "grad_norm": 1.19134839145044, "learning_rate": 1.6979591836734695e-05, "loss": 0.3108, "loss_nan_ranks": 0, "loss_rank_avg": 0.3086431920528412, "step": 105, "valid_targets_mean": 1279.0, "valid_targets_min": 711 }, { "epoch": 0.2702702702702703, "grad_norm": 1.051295827944603, "learning_rate": 1.779591836734694e-05, "loss": 0.2949, "loss_nan_ranks": 0, "loss_rank_avg": 0.3161376118659973, "step": 110, "valid_targets_mean": 1383.6, "valid_targets_min": 897 }, { "epoch": 0.28255528255528256, "grad_norm": 1.001465215723732, "learning_rate": 1.8612244897959185e-05, "loss": 0.2868, "loss_nan_ranks": 0, "loss_rank_avg": 0.27010855078697205, "step": 115, "valid_targets_mean": 1363.2, "valid_targets_min": 813 }, { "epoch": 0.29484029484029484, "grad_norm": 1.0939416312953611, "learning_rate": 1.942857142857143e-05, "loss": 0.2882, "loss_nan_ranks": 0, "loss_rank_avg": 0.29551124572753906, "step": 120, "valid_targets_mean": 1317.6, "valid_targets_min": 710 }, { "epoch": 0.3071253071253071, "grad_norm": 1.017797618825815, "learning_rate": 2.0244897959183672e-05, "loss": 0.2896, "loss_nan_ranks": 0, "loss_rank_avg": 0.27586787939071655, "step": 125, "valid_targets_mean": 1418.5, "valid_targets_min": 941 }, { "epoch": 0.3194103194103194, "grad_norm": 1.2127705134680413, "learning_rate": 2.106122448979592e-05, "loss": 0.2911, "loss_nan_ranks": 0, "loss_rank_avg": 0.2948208451271057, "step": 130, "valid_targets_mean": 1013.2, "valid_targets_min": 663 }, { "epoch": 0.3316953316953317, "grad_norm": 1.1881461995379652, "learning_rate": 2.1877551020408166e-05, "loss": 0.2837, "loss_nan_ranks": 0, "loss_rank_avg": 0.30349838733673096, "step": 135, "valid_targets_mean": 1376.4, "valid_targets_min": 727 }, { "epoch": 0.343980343980344, "grad_norm": 1.0220364541266478, "learning_rate": 2.269387755102041e-05, "loss": 0.2945, "loss_nan_ranks": 0, "loss_rank_avg": 0.31276723742485046, "step": 140, "valid_targets_mean": 1266.6, "valid_targets_min": 637 }, { "epoch": 0.35626535626535627, "grad_norm": 1.0259584649302287, "learning_rate": 2.3510204081632656e-05, "loss": 0.2735, "loss_nan_ranks": 0, "loss_rank_avg": 0.28521037101745605, "step": 145, "valid_targets_mean": 1381.8, "valid_targets_min": 724 }, { "epoch": 0.36855036855036855, "grad_norm": 1.387643384965655, "learning_rate": 2.4326530612244898e-05, "loss": 0.2848, "loss_nan_ranks": 0, "loss_rank_avg": 0.28743278980255127, "step": 150, "valid_targets_mean": 1333.6, "valid_targets_min": 646 }, { "epoch": 0.3808353808353808, "grad_norm": 1.104844187565239, "learning_rate": 2.5142857142857143e-05, "loss": 0.2726, "loss_nan_ranks": 0, "loss_rank_avg": 0.267228364944458, "step": 155, "valid_targets_mean": 1163.2, "valid_targets_min": 700 }, { "epoch": 0.3931203931203931, "grad_norm": 1.0781870060932552, "learning_rate": 2.5959183673469392e-05, "loss": 0.2835, "loss_nan_ranks": 0, "loss_rank_avg": 0.2731441855430603, "step": 160, "valid_targets_mean": 1182.2, "valid_targets_min": 800 }, { "epoch": 0.40540540540540543, "grad_norm": 1.2518533850963875, "learning_rate": 2.6775510204081637e-05, "loss": 0.273, "loss_nan_ranks": 0, "loss_rank_avg": 0.2699888348579407, "step": 165, "valid_targets_mean": 1239.4, "valid_targets_min": 713 }, { "epoch": 0.4176904176904177, "grad_norm": 1.168759326203342, "learning_rate": 2.7591836734693882e-05, "loss": 0.2688, "loss_nan_ranks": 0, "loss_rank_avg": 0.26571792364120483, "step": 170, "valid_targets_mean": 1398.9, "valid_targets_min": 598 }, { "epoch": 0.42997542997543, "grad_norm": 0.9396552751253561, "learning_rate": 2.8408163265306124e-05, "loss": 0.2762, "loss_nan_ranks": 0, "loss_rank_avg": 0.2691813111305237, "step": 175, "valid_targets_mean": 1485.3, "valid_targets_min": 872 }, { "epoch": 0.44226044226044225, "grad_norm": 1.2096875417684458, "learning_rate": 2.922448979591837e-05, "loss": 0.2787, "loss_nan_ranks": 0, "loss_rank_avg": 0.2808350920677185, "step": 180, "valid_targets_mean": 1162.1, "valid_targets_min": 721 }, { "epoch": 0.45454545454545453, "grad_norm": 1.1999093025296843, "learning_rate": 3.0040816326530614e-05, "loss": 0.2667, "loss_nan_ranks": 0, "loss_rank_avg": 0.2688295841217041, "step": 185, "valid_targets_mean": 1101.2, "valid_targets_min": 516 }, { "epoch": 0.4668304668304668, "grad_norm": 1.1647181597312102, "learning_rate": 3.085714285714286e-05, "loss": 0.2624, "loss_nan_ranks": 0, "loss_rank_avg": 0.2831493616104126, "step": 190, "valid_targets_mean": 1266.9, "valid_targets_min": 619 }, { "epoch": 0.47911547911547914, "grad_norm": 1.0284185612708663, "learning_rate": 3.1673469387755105e-05, "loss": 0.2602, "loss_nan_ranks": 0, "loss_rank_avg": 0.24393121898174286, "step": 195, "valid_targets_mean": 1164.9, "valid_targets_min": 756 }, { "epoch": 0.4914004914004914, "grad_norm": 1.0003942487517488, "learning_rate": 3.2489795918367346e-05, "loss": 0.2523, "loss_nan_ranks": 0, "loss_rank_avg": 0.22005441784858704, "step": 200, "valid_targets_mean": 1244.3, "valid_targets_min": 618 }, { "epoch": 0.5036855036855037, "grad_norm": 1.0107391467706224, "learning_rate": 3.3306122448979595e-05, "loss": 0.2636, "loss_nan_ranks": 0, "loss_rank_avg": 0.2617947459220886, "step": 205, "valid_targets_mean": 1234.1, "valid_targets_min": 874 }, { "epoch": 0.515970515970516, "grad_norm": 1.2118728098280296, "learning_rate": 3.4122448979591843e-05, "loss": 0.2615, "loss_nan_ranks": 0, "loss_rank_avg": 0.2575775384902954, "step": 210, "valid_targets_mean": 1321.1, "valid_targets_min": 861 }, { "epoch": 0.5282555282555282, "grad_norm": 0.9892491299567787, "learning_rate": 3.4938775510204085e-05, "loss": 0.249, "loss_nan_ranks": 0, "loss_rank_avg": 0.2387700229883194, "step": 215, "valid_targets_mean": 1299.9, "valid_targets_min": 1000 }, { "epoch": 0.5405405405405406, "grad_norm": 1.0482471985131325, "learning_rate": 3.575510204081633e-05, "loss": 0.2583, "loss_nan_ranks": 0, "loss_rank_avg": 0.2581407427787781, "step": 220, "valid_targets_mean": 1370.2, "valid_targets_min": 783 }, { "epoch": 0.5528255528255528, "grad_norm": 1.0295148997419448, "learning_rate": 3.6571428571428576e-05, "loss": 0.2548, "loss_nan_ranks": 0, "loss_rank_avg": 0.24649953842163086, "step": 225, "valid_targets_mean": 1169.7, "valid_targets_min": 696 }, { "epoch": 0.5651105651105651, "grad_norm": 0.9681847418509463, "learning_rate": 3.738775510204082e-05, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.27282947301864624, "step": 230, "valid_targets_mean": 1279.6, "valid_targets_min": 809 }, { "epoch": 0.5773955773955773, "grad_norm": 0.9238070431221829, "learning_rate": 3.8204081632653066e-05, "loss": 0.252, "loss_nan_ranks": 0, "loss_rank_avg": 0.24655944108963013, "step": 235, "valid_targets_mean": 1360.4, "valid_targets_min": 725 }, { "epoch": 0.5896805896805897, "grad_norm": 0.9098797568997322, "learning_rate": 3.902040816326531e-05, "loss": 0.2625, "loss_nan_ranks": 0, "loss_rank_avg": 0.23307578265666962, "step": 240, "valid_targets_mean": 1383.3, "valid_targets_min": 631 }, { "epoch": 0.601965601965602, "grad_norm": 1.006785214329797, "learning_rate": 3.983673469387755e-05, "loss": 0.2594, "loss_nan_ranks": 0, "loss_rank_avg": 0.26228320598602295, "step": 245, "valid_targets_mean": 1284.8, "valid_targets_min": 679 }, { "epoch": 0.6142506142506142, "grad_norm": 1.0525191631080537, "learning_rate": 3.9999672841332876e-05, "loss": 0.2549, "loss_nan_ranks": 0, "loss_rank_avg": 0.23748120665550232, "step": 250, "valid_targets_mean": 1343.1, "valid_targets_min": 643 }, { "epoch": 0.6265356265356266, "grad_norm": 1.0681183261616904, "learning_rate": 3.999834377759164e-05, "loss": 0.2604, "loss_nan_ranks": 0, "loss_rank_avg": 0.25798824429512024, "step": 255, "valid_targets_mean": 1271.4, "valid_targets_min": 582 }, { "epoch": 0.6388206388206388, "grad_norm": 1.039669566160986, "learning_rate": 3.999599242924703e-05, "loss": 0.2573, "loss_nan_ranks": 0, "loss_rank_avg": 0.26076722145080566, "step": 260, "valid_targets_mean": 1133.4, "valid_targets_min": 577 }, { "epoch": 0.6511056511056511, "grad_norm": 1.0724973460550207, "learning_rate": 3.999261891649637e-05, "loss": 0.2576, "loss_nan_ranks": 0, "loss_rank_avg": 0.23584957420825958, "step": 265, "valid_targets_mean": 1405.9, "valid_targets_min": 979 }, { "epoch": 0.6633906633906634, "grad_norm": 0.9104706365824741, "learning_rate": 3.9988223411788436e-05, "loss": 0.2593, "loss_nan_ranks": 0, "loss_rank_avg": 0.2530933618545532, "step": 270, "valid_targets_mean": 1466.0, "valid_targets_min": 753 }, { "epoch": 0.6756756756756757, "grad_norm": 1.0963583541448956, "learning_rate": 3.998280613981468e-05, "loss": 0.247, "loss_nan_ranks": 0, "loss_rank_avg": 0.2414504736661911, "step": 275, "valid_targets_mean": 1352.9, "valid_targets_min": 819 }, { "epoch": 0.687960687960688, "grad_norm": 0.9882989853095971, "learning_rate": 3.9976367377497725e-05, "loss": 0.2519, "loss_nan_ranks": 0, "loss_rank_avg": 0.24604278802871704, "step": 280, "valid_targets_mean": 1113.4, "valid_targets_min": 631 }, { "epoch": 0.7002457002457002, "grad_norm": 0.995524650089483, "learning_rate": 3.99689074539772e-05, "loss": 0.2503, "loss_nan_ranks": 0, "loss_rank_avg": 0.24476918578147888, "step": 285, "valid_targets_mean": 1168.4, "valid_targets_min": 599 }, { "epoch": 0.7125307125307125, "grad_norm": 0.9891596679542455, "learning_rate": 3.9960426750592936e-05, "loss": 0.2454, "loss_nan_ranks": 0, "loss_rank_avg": 0.25576359033584595, "step": 290, "valid_targets_mean": 1179.9, "valid_targets_min": 833 }, { "epoch": 0.7248157248157249, "grad_norm": 0.9551067978223167, "learning_rate": 3.995092570086546e-05, "loss": 0.2498, "loss_nan_ranks": 0, "loss_rank_avg": 0.2365557849407196, "step": 295, "valid_targets_mean": 1248.8, "valid_targets_min": 681 }, { "epoch": 0.7371007371007371, "grad_norm": 0.8993619363801122, "learning_rate": 3.9940404790473825e-05, "loss": 0.2459, "loss_nan_ranks": 0, "loss_rank_avg": 0.230590358376503, "step": 300, "valid_targets_mean": 1189.8, "valid_targets_min": 656 }, { "epoch": 0.7493857493857494, "grad_norm": 0.9950400883383362, "learning_rate": 3.992886455723082e-05, "loss": 0.2491, "loss_nan_ranks": 0, "loss_rank_avg": 0.25279349088668823, "step": 305, "valid_targets_mean": 1129.0, "valid_targets_min": 546 }, { "epoch": 0.7616707616707616, "grad_norm": 0.8527006472613714, "learning_rate": 3.991630559105541e-05, "loss": 0.2356, "loss_nan_ranks": 0, "loss_rank_avg": 0.22874727845191956, "step": 310, "valid_targets_mean": 1332.6, "valid_targets_min": 828 }, { "epoch": 0.773955773955774, "grad_norm": 1.0419255233532783, "learning_rate": 3.990272853394268e-05, "loss": 0.2446, "loss_nan_ranks": 0, "loss_rank_avg": 0.22870038449764252, "step": 315, "valid_targets_mean": 1102.8, "valid_targets_min": 692 }, { "epoch": 0.7862407862407862, "grad_norm": 0.8716345618424153, "learning_rate": 3.988813407993089e-05, "loss": 0.2261, "loss_nan_ranks": 0, "loss_rank_avg": 0.23537375032901764, "step": 320, "valid_targets_mean": 1293.5, "valid_targets_min": 848 }, { "epoch": 0.7985257985257985, "grad_norm": 0.8810969006097469, "learning_rate": 3.987252297506613e-05, "loss": 0.24, "loss_nan_ranks": 0, "loss_rank_avg": 0.24338498711585999, "step": 325, "valid_targets_mean": 1233.5, "valid_targets_min": 659 }, { "epoch": 0.8108108108108109, "grad_norm": 0.9626770961212678, "learning_rate": 3.9855896017364075e-05, "loss": 0.2354, "loss_nan_ranks": 0, "loss_rank_avg": 0.2470875233411789, "step": 330, "valid_targets_mean": 1239.8, "valid_targets_min": 559 }, { "epoch": 0.8230958230958231, "grad_norm": 0.9176247579572656, "learning_rate": 3.983825405676927e-05, "loss": 0.2432, "loss_nan_ranks": 0, "loss_rank_avg": 0.23234277963638306, "step": 335, "valid_targets_mean": 1354.6, "valid_targets_min": 898 }, { "epoch": 0.8353808353808354, "grad_norm": 0.8965361140622664, "learning_rate": 3.981959799511161e-05, "loss": 0.24, "loss_nan_ranks": 0, "loss_rank_avg": 0.23358391225337982, "step": 340, "valid_targets_mean": 1369.1, "valid_targets_min": 613 }, { "epoch": 0.8476658476658476, "grad_norm": 1.073981004545888, "learning_rate": 3.979992878606032e-05, "loss": 0.2499, "loss_nan_ranks": 0, "loss_rank_avg": 0.2327095866203308, "step": 345, "valid_targets_mean": 1122.8, "valid_targets_min": 683 }, { "epoch": 0.85995085995086, "grad_norm": 1.0151351479751622, "learning_rate": 3.977924743507513e-05, "loss": 0.2483, "loss_nan_ranks": 0, "loss_rank_avg": 0.23525191843509674, "step": 350, "valid_targets_mean": 1256.2, "valid_targets_min": 592 }, { "epoch": 0.8722358722358723, "grad_norm": 0.9282381133656055, "learning_rate": 3.975755499935492e-05, "loss": 0.2541, "loss_nan_ranks": 0, "loss_rank_avg": 0.27992555499076843, "step": 355, "valid_targets_mean": 1211.7, "valid_targets_min": 597 }, { "epoch": 0.8845208845208845, "grad_norm": 0.7744300003477048, "learning_rate": 3.973485258778368e-05, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.2320326268672943, "step": 360, "valid_targets_mean": 1523.9, "valid_targets_min": 696 }, { "epoch": 0.8968058968058968, "grad_norm": 0.8915272025257586, "learning_rate": 3.971114136087379e-05, "loss": 0.2398, "loss_nan_ranks": 0, "loss_rank_avg": 0.23646889626979828, "step": 365, "valid_targets_mean": 1359.6, "valid_targets_min": 834 }, { "epoch": 0.9090909090909091, "grad_norm": 0.9986391400817158, "learning_rate": 3.968642253070675e-05, "loss": 0.2347, "loss_nan_ranks": 0, "loss_rank_avg": 0.23117730021476746, "step": 370, "valid_targets_mean": 1226.4, "valid_targets_min": 601 }, { "epoch": 0.9213759213759214, "grad_norm": 1.0663907580975795, "learning_rate": 3.966069736087116e-05, "loss": 0.2464, "loss_nan_ranks": 0, "loss_rank_avg": 0.2413148581981659, "step": 375, "valid_targets_mean": 1369.7, "valid_targets_min": 569 }, { "epoch": 0.9336609336609336, "grad_norm": 0.9688455896189119, "learning_rate": 3.963396716639818e-05, "loss": 0.2346, "loss_nan_ranks": 0, "loss_rank_avg": 0.2318524718284607, "step": 380, "valid_targets_mean": 1273.9, "valid_targets_min": 855 }, { "epoch": 0.9459459459459459, "grad_norm": 0.9406165224783458, "learning_rate": 3.960623331369427e-05, "loss": 0.2352, "loss_nan_ranks": 0, "loss_rank_avg": 0.20918339490890503, "step": 385, "valid_targets_mean": 1067.1, "valid_targets_min": 833 }, { "epoch": 0.9582309582309583, "grad_norm": 0.8493184795160157, "learning_rate": 3.957749722047138e-05, "loss": 0.2309, "loss_nan_ranks": 0, "loss_rank_avg": 0.23976099491119385, "step": 390, "valid_targets_mean": 1263.5, "valid_targets_min": 639 }, { "epoch": 0.9705159705159705, "grad_norm": 0.8446197614217856, "learning_rate": 3.9547760355674405e-05, "loss": 0.2222, "loss_nan_ranks": 0, "loss_rank_avg": 0.2245807945728302, "step": 395, "valid_targets_mean": 1357.5, "valid_targets_min": 860 }, { "epoch": 0.9828009828009828, "grad_norm": 0.9002227045931153, "learning_rate": 3.951702423940621e-05, "loss": 0.2343, "loss_nan_ranks": 0, "loss_rank_avg": 0.2399313747882843, "step": 400, "valid_targets_mean": 1242.1, "valid_targets_min": 668 }, { "epoch": 0.995085995085995, "grad_norm": 0.9146265445163199, "learning_rate": 3.948529044284981e-05, "loss": 0.2268, "loss_nan_ranks": 0, "loss_rank_avg": 0.24605955183506012, "step": 405, "valid_targets_mean": 1379.3, "valid_targets_min": 605 }, { "epoch": 1.0073710073710074, "grad_norm": 0.8846119726465934, "learning_rate": 3.9452560588188135e-05, "loss": 0.2383, "loss_nan_ranks": 0, "loss_rank_avg": 0.21427395939826965, "step": 410, "valid_targets_mean": 1292.4, "valid_targets_min": 625 }, { "epoch": 1.0196560196560196, "grad_norm": 0.8429800757595586, "learning_rate": 3.9418836348521045e-05, "loss": 0.2308, "loss_nan_ranks": 0, "loss_rank_avg": 0.22194769978523254, "step": 415, "valid_targets_mean": 1537.8, "valid_targets_min": 854 }, { "epoch": 1.031941031941032, "grad_norm": 1.0879669131500758, "learning_rate": 3.9384119447779854e-05, "loss": 0.2216, "loss_nan_ranks": 0, "loss_rank_avg": 0.21954546868801117, "step": 420, "valid_targets_mean": 1291.0, "valid_targets_min": 679 }, { "epoch": 1.0442260442260443, "grad_norm": 0.91150482238475, "learning_rate": 3.934841166063919e-05, "loss": 0.218, "loss_nan_ranks": 0, "loss_rank_avg": 0.21371571719646454, "step": 425, "valid_targets_mean": 1232.7, "valid_targets_min": 555 }, { "epoch": 1.0565110565110565, "grad_norm": 0.9859894476975108, "learning_rate": 3.931171481242625e-05, "loss": 0.2078, "loss_nan_ranks": 0, "loss_rank_avg": 0.20356549322605133, "step": 430, "valid_targets_mean": 1253.1, "valid_targets_min": 685 }, { "epoch": 1.0687960687960687, "grad_norm": 0.929488975303167, "learning_rate": 3.927403077902753e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.22038447856903076, "step": 435, "valid_targets_mean": 1190.2, "valid_targets_min": 696 }, { "epoch": 1.0810810810810811, "grad_norm": 0.9198148139807539, "learning_rate": 3.9235361486792905e-05, "loss": 0.2213, "loss_nan_ranks": 0, "loss_rank_avg": 0.23593559861183167, "step": 440, "valid_targets_mean": 1318.4, "valid_targets_min": 859 }, { "epoch": 1.0933660933660934, "grad_norm": 0.865539205726412, "learning_rate": 3.9195708912437176e-05, "loss": 0.2166, "loss_nan_ranks": 0, "loss_rank_avg": 0.199513241648674, "step": 445, "valid_targets_mean": 1262.8, "valid_targets_min": 832 }, { "epoch": 1.1056511056511056, "grad_norm": 0.8862960683914471, "learning_rate": 3.915507508293901e-05, "loss": 0.2114, "loss_nan_ranks": 0, "loss_rank_avg": 0.2223977893590927, "step": 450, "valid_targets_mean": 1404.8, "valid_targets_min": 928 }, { "epoch": 1.117936117936118, "grad_norm": 0.8859574165063384, "learning_rate": 3.911346207543734e-05, "loss": 0.2101, "loss_nan_ranks": 0, "loss_rank_avg": 0.21623465418815613, "step": 455, "valid_targets_mean": 1318.5, "valid_targets_min": 676 }, { "epoch": 1.1302211302211302, "grad_norm": 1.0054461891918525, "learning_rate": 3.907087201712515e-05, "loss": 0.2314, "loss_nan_ranks": 0, "loss_rank_avg": 0.23490525782108307, "step": 460, "valid_targets_mean": 1302.8, "valid_targets_min": 516 }, { "epoch": 1.1425061425061425, "grad_norm": 0.8741596133273296, "learning_rate": 3.902730708514078e-05, "loss": 0.2061, "loss_nan_ranks": 0, "loss_rank_avg": 0.18964213132858276, "step": 465, "valid_targets_mean": 1216.9, "valid_targets_min": 707 }, { "epoch": 1.154791154791155, "grad_norm": 0.9441571131207358, "learning_rate": 3.8982769506456616e-05, "loss": 0.2135, "loss_nan_ranks": 0, "loss_rank_avg": 0.23256821930408478, "step": 470, "valid_targets_mean": 1205.5, "valid_targets_min": 633 }, { "epoch": 1.1670761670761671, "grad_norm": 0.8475920842038459, "learning_rate": 3.893726155776524e-05, "loss": 0.2165, "loss_nan_ranks": 0, "loss_rank_avg": 0.19832265377044678, "step": 475, "valid_targets_mean": 1206.9, "valid_targets_min": 552 }, { "epoch": 1.1793611793611793, "grad_norm": 0.9251072573203696, "learning_rate": 3.8890785565363046e-05, "loss": 0.2103, "loss_nan_ranks": 0, "loss_rank_avg": 0.2146698236465454, "step": 480, "valid_targets_mean": 1227.5, "valid_targets_min": 772 }, { "epoch": 1.1916461916461916, "grad_norm": 0.9740444472309585, "learning_rate": 3.884334390503136e-05, "loss": 0.2194, "loss_nan_ranks": 0, "loss_rank_avg": 0.21822363138198853, "step": 485, "valid_targets_mean": 1097.0, "valid_targets_min": 623 }, { "epoch": 1.203931203931204, "grad_norm": 0.8370410301775648, "learning_rate": 3.8794939001914955e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.22085630893707275, "step": 490, "valid_targets_mean": 1390.9, "valid_targets_min": 721 }, { "epoch": 1.2162162162162162, "grad_norm": 0.9186018225806699, "learning_rate": 3.87455733303981e-05, "loss": 0.2189, "loss_nan_ranks": 0, "loss_rank_avg": 0.2234152853488922, "step": 495, "valid_targets_mean": 1152.8, "valid_targets_min": 559 }, { "epoch": 1.2285012285012284, "grad_norm": 0.8405706051298435, "learning_rate": 3.869524941397805e-05, "loss": 0.2137, "loss_nan_ranks": 0, "loss_rank_avg": 0.21818791329860687, "step": 500, "valid_targets_mean": 1246.1, "valid_targets_min": 702 }, { "epoch": 1.2407862407862407, "grad_norm": 0.9209574543994296, "learning_rate": 3.8643969825136095e-05, "loss": 0.2152, "loss_nan_ranks": 0, "loss_rank_avg": 0.21757091581821442, "step": 505, "valid_targets_mean": 1152.7, "valid_targets_min": 599 }, { "epoch": 1.253071253071253, "grad_norm": 0.8067547007661393, "learning_rate": 3.8591737185206024e-05, "loss": 0.2153, "loss_nan_ranks": 0, "loss_rank_avg": 0.203495055437088, "step": 510, "valid_targets_mean": 1283.2, "valid_targets_min": 680 }, { "epoch": 1.2653562653562653, "grad_norm": 0.8723905147518646, "learning_rate": 3.853855416424011e-05, "loss": 0.2124, "loss_nan_ranks": 0, "loss_rank_avg": 0.22284701466560364, "step": 515, "valid_targets_mean": 1208.0, "valid_targets_min": 666 }, { "epoch": 1.2776412776412776, "grad_norm": 0.8107646956453654, "learning_rate": 3.848442348087267e-05, "loss": 0.2131, "loss_nan_ranks": 0, "loss_rank_avg": 0.20091310143470764, "step": 520, "valid_targets_mean": 1367.6, "valid_targets_min": 764 }, { "epoch": 1.28992628992629, "grad_norm": 0.8840227552984795, "learning_rate": 3.842934790218106e-05, "loss": 0.2109, "loss_nan_ranks": 0, "loss_rank_avg": 0.21159666776657104, "step": 525, "valid_targets_mean": 1263.2, "valid_targets_min": 856 }, { "epoch": 1.3022113022113022, "grad_norm": 0.9823970363721356, "learning_rate": 3.837333024354422e-05, "loss": 0.2136, "loss_nan_ranks": 0, "loss_rank_avg": 0.22919949889183044, "step": 530, "valid_targets_mean": 1240.1, "valid_targets_min": 563 }, { "epoch": 1.3144963144963144, "grad_norm": 1.735042209364941, "learning_rate": 3.8316373368498794e-05, "loss": 0.1981, "loss_nan_ranks": 0, "loss_rank_avg": 0.21260014176368713, "step": 535, "valid_targets_mean": 1401.2, "valid_targets_min": 604 }, { "epoch": 1.3267813267813269, "grad_norm": 0.8022885779180352, "learning_rate": 3.82584801885927e-05, "loss": 0.2155, "loss_nan_ranks": 0, "loss_rank_avg": 0.21027901768684387, "step": 540, "valid_targets_mean": 1354.0, "valid_targets_min": 695 }, { "epoch": 1.339066339066339, "grad_norm": 0.7971643641976438, "learning_rate": 3.8199653663236336e-05, "loss": 0.2175, "loss_nan_ranks": 0, "loss_rank_avg": 0.22587084770202637, "step": 545, "valid_targets_mean": 1381.9, "valid_targets_min": 957 }, { "epoch": 1.3513513513513513, "grad_norm": 0.8515238470974948, "learning_rate": 3.813989679955128e-05, "loss": 0.2102, "loss_nan_ranks": 0, "loss_rank_avg": 0.20897898077964783, "step": 550, "valid_targets_mean": 1361.9, "valid_targets_min": 826 }, { "epoch": 1.3636363636363638, "grad_norm": 0.8555526583280557, "learning_rate": 3.8079212652216595e-05, "loss": 0.2045, "loss_nan_ranks": 0, "loss_rank_avg": 0.20616090297698975, "step": 555, "valid_targets_mean": 1297.0, "valid_targets_min": 602 }, { "epoch": 1.375921375921376, "grad_norm": 0.8964923469359567, "learning_rate": 3.8017604323312616e-05, "loss": 0.2068, "loss_nan_ranks": 0, "loss_rank_avg": 0.20442214608192444, "step": 560, "valid_targets_mean": 1286.3, "valid_targets_min": 717 }, { "epoch": 1.3882063882063882, "grad_norm": 1.0497145720091325, "learning_rate": 3.795507496216246e-05, "loss": 0.2201, "loss_nan_ranks": 0, "loss_rank_avg": 0.22913996875286102, "step": 565, "valid_targets_mean": 1299.9, "valid_targets_min": 755 }, { "epoch": 1.4004914004914004, "grad_norm": 0.8618095265826493, "learning_rate": 3.789162776517098e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.2160976678133011, "step": 570, "valid_targets_mean": 1281.5, "valid_targets_min": 677 }, { "epoch": 1.4127764127764126, "grad_norm": 0.8211183730608299, "learning_rate": 3.78272659756614e-05, "loss": 0.2173, "loss_nan_ranks": 0, "loss_rank_avg": 0.23328492045402527, "step": 575, "valid_targets_mean": 1361.1, "valid_targets_min": 699 }, { "epoch": 1.425061425061425, "grad_norm": 0.8273749298069341, "learning_rate": 3.776199288370948e-05, "loss": 0.2199, "loss_nan_ranks": 0, "loss_rank_avg": 0.23211979866027832, "step": 580, "valid_targets_mean": 1328.4, "valid_targets_min": 851 }, { "epoch": 1.4373464373464373, "grad_norm": 0.8559553834741782, "learning_rate": 3.7695811825975386e-05, "loss": 0.2052, "loss_nan_ranks": 0, "loss_rank_avg": 0.19386297464370728, "step": 585, "valid_targets_mean": 1047.1, "valid_targets_min": 571 }, { "epoch": 1.4496314496314495, "grad_norm": 0.7737724552422564, "learning_rate": 3.76287261855331e-05, "loss": 0.2065, "loss_nan_ranks": 0, "loss_rank_avg": 0.20705577731132507, "step": 590, "valid_targets_mean": 1450.2, "valid_targets_min": 906 }, { "epoch": 1.461916461916462, "grad_norm": 0.7544548232380602, "learning_rate": 3.7560739391697465e-05, "loss": 0.2157, "loss_nan_ranks": 0, "loss_rank_avg": 0.18719275295734406, "step": 595, "valid_targets_mean": 1226.5, "valid_targets_min": 600 }, { "epoch": 1.4742014742014742, "grad_norm": 0.8636863005403776, "learning_rate": 3.749185491984891e-05, "loss": 0.2099, "loss_nan_ranks": 0, "loss_rank_avg": 0.20051462948322296, "step": 600, "valid_targets_mean": 1257.8, "valid_targets_min": 772 }, { "epoch": 1.4864864864864864, "grad_norm": 0.7920583706263344, "learning_rate": 3.7422076291255785e-05, "loss": 0.1975, "loss_nan_ranks": 0, "loss_rank_avg": 0.19033858180046082, "step": 605, "valid_targets_mean": 1164.7, "valid_targets_min": 677 }, { "epoch": 1.4987714987714988, "grad_norm": 0.8334219155321024, "learning_rate": 3.7351407072894356e-05, "loss": 0.2082, "loss_nan_ranks": 0, "loss_rank_avg": 0.20213520526885986, "step": 610, "valid_targets_mean": 1286.6, "valid_targets_min": 957 }, { "epoch": 1.511056511056511, "grad_norm": 0.9313275078782892, "learning_rate": 3.7279850877266486e-05, "loss": 0.2194, "loss_nan_ranks": 0, "loss_rank_avg": 0.22305332124233246, "step": 615, "valid_targets_mean": 1265.1, "valid_targets_min": 727 }, { "epoch": 1.5233415233415233, "grad_norm": 0.8208145495971357, "learning_rate": 3.720741136221491e-05, "loss": 0.2074, "loss_nan_ranks": 0, "loss_rank_avg": 0.21243973076343536, "step": 620, "valid_targets_mean": 1292.1, "valid_targets_min": 704 }, { "epoch": 1.5356265356265357, "grad_norm": 0.8307696500817636, "learning_rate": 3.713409223073636e-05, "loss": 0.214, "loss_nan_ranks": 0, "loss_rank_avg": 0.21302366256713867, "step": 625, "valid_targets_mean": 1229.5, "valid_targets_min": 501 }, { "epoch": 1.547911547911548, "grad_norm": 0.8467719298005856, "learning_rate": 3.705989723079214e-05, "loss": 0.2172, "loss_nan_ranks": 0, "loss_rank_avg": 0.22414334118366241, "step": 630, "valid_targets_mean": 1386.8, "valid_targets_min": 516 }, { "epoch": 1.5601965601965602, "grad_norm": 0.8338920310244855, "learning_rate": 3.698483015511665e-05, "loss": 0.2093, "loss_nan_ranks": 0, "loss_rank_avg": 0.21425983309745789, "step": 635, "valid_targets_mean": 1345.6, "valid_targets_min": 608 }, { "epoch": 1.5724815724815726, "grad_norm": 0.847033756979806, "learning_rate": 3.690889484102344e-05, "loss": 0.2073, "loss_nan_ranks": 0, "loss_rank_avg": 0.19102904200553894, "step": 640, "valid_targets_mean": 1151.4, "valid_targets_min": 587 }, { "epoch": 1.5847665847665846, "grad_norm": 0.8357252424027696, "learning_rate": 3.683209517020908e-05, "loss": 0.2107, "loss_nan_ranks": 0, "loss_rank_avg": 0.22609484195709229, "step": 645, "valid_targets_mean": 1317.7, "valid_targets_min": 678 }, { "epoch": 1.597051597051597, "grad_norm": 0.8978628194123708, "learning_rate": 3.675443506855473e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.25122907757759094, "step": 650, "valid_targets_mean": 1355.8, "valid_targets_min": 749 }, { "epoch": 1.6093366093366095, "grad_norm": 0.8144918816074354, "learning_rate": 3.6675918505925456e-05, "loss": 0.2125, "loss_nan_ranks": 0, "loss_rank_avg": 0.19278162717819214, "step": 655, "valid_targets_mean": 1167.2, "valid_targets_min": 622 }, { "epoch": 1.6216216216216215, "grad_norm": 0.8678549604409258, "learning_rate": 3.6596549495967276e-05, "loss": 0.212, "loss_nan_ranks": 0, "loss_rank_avg": 0.2218804657459259, "step": 660, "valid_targets_mean": 1284.0, "valid_targets_min": 749 }, { "epoch": 1.633906633906634, "grad_norm": 0.8353937245559396, "learning_rate": 3.651633209590202e-05, "loss": 0.2123, "loss_nan_ranks": 0, "loss_rank_avg": 0.18236777186393738, "step": 665, "valid_targets_mean": 1267.4, "valid_targets_min": 532 }, { "epoch": 1.6461916461916462, "grad_norm": 0.7951973802311657, "learning_rate": 3.6435270406319914e-05, "loss": 0.2258, "loss_nan_ranks": 0, "loss_rank_avg": 0.2141144722700119, "step": 670, "valid_targets_mean": 1371.6, "valid_targets_min": 691 }, { "epoch": 1.6584766584766584, "grad_norm": 0.8471980022480241, "learning_rate": 3.635336857096997e-05, "loss": 0.2086, "loss_nan_ranks": 0, "loss_rank_avg": 0.2074558138847351, "step": 675, "valid_targets_mean": 1272.0, "valid_targets_min": 863 }, { "epoch": 1.6707616707616708, "grad_norm": 0.7615407401541552, "learning_rate": 3.627063077654815e-05, "loss": 0.2102, "loss_nan_ranks": 0, "loss_rank_avg": 0.20035895705223083, "step": 680, "valid_targets_mean": 1336.2, "valid_targets_min": 538 }, { "epoch": 1.683046683046683, "grad_norm": 0.8588070921853436, "learning_rate": 3.618706125248337e-05, "loss": 0.2054, "loss_nan_ranks": 0, "loss_rank_avg": 0.20719598233699799, "step": 685, "valid_targets_mean": 1390.2, "valid_targets_min": 747 }, { "epoch": 1.6953316953316953, "grad_norm": 0.8305147911432151, "learning_rate": 3.6102664270721275e-05, "loss": 0.2149, "loss_nan_ranks": 0, "loss_rank_avg": 0.21375998854637146, "step": 690, "valid_targets_mean": 1308.5, "valid_targets_min": 655 }, { "epoch": 1.7076167076167077, "grad_norm": 0.7458152286575466, "learning_rate": 3.601744414550589e-05, "loss": 0.206, "loss_nan_ranks": 0, "loss_rank_avg": 0.20337368547916412, "step": 695, "valid_targets_mean": 1402.0, "valid_targets_min": 563 }, { "epoch": 1.71990171990172, "grad_norm": 0.8430079820292512, "learning_rate": 3.593140523315906e-05, "loss": 0.2147, "loss_nan_ranks": 0, "loss_rank_avg": 0.2111029326915741, "step": 700, "valid_targets_mean": 1263.1, "valid_targets_min": 618 }, { "epoch": 1.7321867321867321, "grad_norm": 0.8587637085294313, "learning_rate": 3.584455193185778e-05, "loss": 0.2138, "loss_nan_ranks": 0, "loss_rank_avg": 0.20514604449272156, "step": 705, "valid_targets_mean": 1260.1, "valid_targets_min": 641 }, { "epoch": 1.7444717444717446, "grad_norm": 0.8419086609463237, "learning_rate": 3.575688868140933e-05, "loss": 0.2184, "loss_nan_ranks": 0, "loss_rank_avg": 0.20621389150619507, "step": 710, "valid_targets_mean": 1387.4, "valid_targets_min": 796 }, { "epoch": 1.7567567567567568, "grad_norm": 0.7702914519938786, "learning_rate": 3.566841996302438e-05, "loss": 0.209, "loss_nan_ranks": 0, "loss_rank_avg": 0.20190760493278503, "step": 715, "valid_targets_mean": 1362.8, "valid_targets_min": 639 }, { "epoch": 1.769041769041769, "grad_norm": 0.8055966192320041, "learning_rate": 3.557915029908787e-05, "loss": 0.2151, "loss_nan_ranks": 0, "loss_rank_avg": 0.2246687412261963, "step": 720, "valid_targets_mean": 1284.2, "valid_targets_min": 775 }, { "epoch": 1.7813267813267815, "grad_norm": 0.7810151508322989, "learning_rate": 3.548908425292784e-05, "loss": 0.209, "loss_nan_ranks": 0, "loss_rank_avg": 0.19987574219703674, "step": 725, "valid_targets_mean": 1195.1, "valid_targets_min": 765 }, { "epoch": 1.7936117936117935, "grad_norm": 0.7745765687362091, "learning_rate": 3.5398226428582165e-05, "loss": 0.2051, "loss_nan_ranks": 0, "loss_rank_avg": 0.1902502477169037, "step": 730, "valid_targets_mean": 1208.6, "valid_targets_min": 576 }, { "epoch": 1.805896805896806, "grad_norm": 0.7740403978164567, "learning_rate": 3.530658147056321e-05, "loss": 0.2059, "loss_nan_ranks": 0, "loss_rank_avg": 0.21077097952365875, "step": 735, "valid_targets_mean": 1501.9, "valid_targets_min": 748 }, { "epoch": 1.8181818181818183, "grad_norm": 0.8831871306665532, "learning_rate": 3.521415406362041e-05, "loss": 0.2102, "loss_nan_ranks": 0, "loss_rank_avg": 0.22450268268585205, "step": 740, "valid_targets_mean": 1230.2, "valid_targets_min": 695 }, { "epoch": 1.8304668304668303, "grad_norm": 0.8075930439615072, "learning_rate": 3.512094893250076e-05, "loss": 0.2122, "loss_nan_ranks": 0, "loss_rank_avg": 0.2014818787574768, "step": 745, "valid_targets_mean": 1086.2, "valid_targets_min": 592 }, { "epoch": 1.8427518427518428, "grad_norm": 0.9351262133752251, "learning_rate": 3.5026970841707366e-05, "loss": 0.2097, "loss_nan_ranks": 0, "loss_rank_avg": 0.22045360505580902, "step": 750, "valid_targets_mean": 1351.4, "valid_targets_min": 936 }, { "epoch": 1.855036855036855, "grad_norm": 0.8524642243083412, "learning_rate": 3.493222459525579e-05, "loss": 0.198, "loss_nan_ranks": 0, "loss_rank_avg": 0.2044043391942978, "step": 755, "valid_targets_mean": 1232.6, "valid_targets_min": 750 }, { "epoch": 1.8673218673218672, "grad_norm": 0.8233788904636303, "learning_rate": 3.483671503642858e-05, "loss": 0.2055, "loss_nan_ranks": 0, "loss_rank_avg": 0.20760342478752136, "step": 760, "valid_targets_mean": 1309.0, "valid_targets_min": 681 }, { "epoch": 1.8796068796068797, "grad_norm": 0.7752715357533787, "learning_rate": 3.474044704752761e-05, "loss": 0.209, "loss_nan_ranks": 0, "loss_rank_avg": 0.20890532433986664, "step": 765, "valid_targets_mean": 1293.1, "valid_targets_min": 868 }, { "epoch": 1.8918918918918919, "grad_norm": 0.697679262289484, "learning_rate": 3.464342554962454e-05, "loss": 0.1996, "loss_nan_ranks": 0, "loss_rank_avg": 0.20702123641967773, "step": 770, "valid_targets_mean": 1639.2, "valid_targets_min": 1076 }, { "epoch": 1.904176904176904, "grad_norm": 0.7414242700794923, "learning_rate": 3.4545655502309254e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.18738913536071777, "step": 775, "valid_targets_mean": 1272.2, "valid_targets_min": 690 }, { "epoch": 1.9164619164619165, "grad_norm": 0.9334643511915244, "learning_rate": 3.444714190343633e-05, "loss": 0.2068, "loss_nan_ranks": 0, "loss_rank_avg": 0.201995387673378, "step": 780, "valid_targets_mean": 1324.6, "valid_targets_min": 655 }, { "epoch": 1.9287469287469288, "grad_norm": 0.8252648993168636, "learning_rate": 3.434788978886957e-05, "loss": 0.2086, "loss_nan_ranks": 0, "loss_rank_avg": 0.21050789952278137, "step": 785, "valid_targets_mean": 1299.9, "valid_targets_min": 582 }, { "epoch": 1.941031941031941, "grad_norm": 0.9170958801978001, "learning_rate": 3.424790423222455e-05, "loss": 0.1949, "loss_nan_ranks": 0, "loss_rank_avg": 0.20576564967632294, "step": 790, "valid_targets_mean": 1248.1, "valid_targets_min": 578 }, { "epoch": 1.9533169533169534, "grad_norm": 0.8198947258723515, "learning_rate": 3.414719034460928e-05, "loss": 0.199, "loss_nan_ranks": 0, "loss_rank_avg": 0.20504584908485413, "step": 795, "valid_targets_mean": 1324.3, "valid_targets_min": 854 }, { "epoch": 1.9656019656019657, "grad_norm": 0.8253301027208539, "learning_rate": 3.404575327436294e-05, "loss": 0.2024, "loss_nan_ranks": 0, "loss_rank_avg": 0.1956181824207306, "step": 800, "valid_targets_mean": 1276.2, "valid_targets_min": 620 }, { "epoch": 1.9778869778869779, "grad_norm": 0.8661318138286722, "learning_rate": 3.3943598206792665e-05, "loss": 0.1978, "loss_nan_ranks": 0, "loss_rank_avg": 0.1938505470752716, "step": 805, "valid_targets_mean": 1168.2, "valid_targets_min": 665 }, { "epoch": 1.9901719901719903, "grad_norm": 0.8202639838791619, "learning_rate": 3.384073036390857e-05, "loss": 0.2013, "loss_nan_ranks": 0, "loss_rank_avg": 0.2048560529947281, "step": 810, "valid_targets_mean": 1392.2, "valid_targets_min": 720 }, { "epoch": 2.0024570024570023, "grad_norm": 0.7431550083256849, "learning_rate": 3.373715500415667e-05, "loss": 0.2027, "loss_nan_ranks": 0, "loss_rank_avg": 0.17889058589935303, "step": 815, "valid_targets_mean": 1384.7, "valid_targets_min": 758 }, { "epoch": 2.0147420147420148, "grad_norm": 0.8960360020207319, "learning_rate": 3.363287742215023e-05, "loss": 0.1729, "loss_nan_ranks": 0, "loss_rank_avg": 0.1715434193611145, "step": 820, "valid_targets_mean": 1223.9, "valid_targets_min": 806 }, { "epoch": 2.027027027027027, "grad_norm": 0.8448839647298884, "learning_rate": 3.352790294839898e-05, "loss": 0.1839, "loss_nan_ranks": 0, "loss_rank_avg": 0.17698851227760315, "step": 825, "valid_targets_mean": 1208.3, "valid_targets_min": 608 }, { "epoch": 2.039312039312039, "grad_norm": 0.8771397300799911, "learning_rate": 3.3422236949036726e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.1854882389307022, "step": 830, "valid_targets_mean": 1115.2, "valid_targets_min": 527 }, { "epoch": 2.0515970515970516, "grad_norm": 0.9375067706527694, "learning_rate": 3.331588482554697e-05, "loss": 0.1765, "loss_nan_ranks": 0, "loss_rank_avg": 0.1746768355369568, "step": 835, "valid_targets_mean": 1309.6, "valid_targets_min": 753 }, { "epoch": 2.063882063882064, "grad_norm": 0.9320660058665986, "learning_rate": 3.320885201448684e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.1711595505475998, "step": 840, "valid_targets_mean": 1270.1, "valid_targets_min": 865 }, { "epoch": 2.076167076167076, "grad_norm": 0.9625843914370038, "learning_rate": 3.310114398720917e-05, "loss": 0.1812, "loss_nan_ranks": 0, "loss_rank_avg": 0.17891713976860046, "step": 845, "valid_targets_mean": 1182.7, "valid_targets_min": 713 }, { "epoch": 2.0884520884520885, "grad_norm": 0.8667658013763913, "learning_rate": 3.299276624958281e-05, "loss": 0.1858, "loss_nan_ranks": 0, "loss_rank_avg": 0.19869863986968994, "step": 850, "valid_targets_mean": 1383.4, "valid_targets_min": 672 }, { "epoch": 2.100737100737101, "grad_norm": 0.7829119159941206, "learning_rate": 3.288372434171116e-05, "loss": 0.1767, "loss_nan_ranks": 0, "loss_rank_avg": 0.1694278120994568, "step": 855, "valid_targets_mean": 1320.6, "valid_targets_min": 742 }, { "epoch": 2.113022113022113, "grad_norm": 1.0847289260076243, "learning_rate": 3.2774023837648986e-05, "loss": 0.1836, "loss_nan_ranks": 0, "loss_rank_avg": 0.20229297876358032, "step": 860, "valid_targets_mean": 1242.6, "valid_targets_min": 591 }, { "epoch": 2.1253071253071254, "grad_norm": 0.7918900295560403, "learning_rate": 3.26636703451175e-05, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.16940709948539734, "step": 865, "valid_targets_mean": 1091.4, "valid_targets_min": 536 }, { "epoch": 2.1375921375921374, "grad_norm": 0.8050057115605104, "learning_rate": 3.2552669505217646e-05, "loss": 0.1804, "loss_nan_ranks": 0, "loss_rank_avg": 0.18291515111923218, "step": 870, "valid_targets_mean": 1270.8, "valid_targets_min": 640 }, { "epoch": 2.14987714987715, "grad_norm": 0.8294882963284373, "learning_rate": 3.24410269921418e-05, "loss": 0.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.16050593554973602, "step": 875, "valid_targets_mean": 1112.7, "valid_targets_min": 807 }, { "epoch": 2.1621621621621623, "grad_norm": 0.8227131541030049, "learning_rate": 3.232874851288367e-05, "loss": 0.1809, "loss_nan_ranks": 0, "loss_rank_avg": 0.1674197018146515, "step": 880, "valid_targets_mean": 1254.1, "valid_targets_min": 706 }, { "epoch": 2.1744471744471743, "grad_norm": 0.8557010633720166, "learning_rate": 3.221583980694659e-05, "loss": 0.1827, "loss_nan_ranks": 0, "loss_rank_avg": 0.17029841244220734, "step": 885, "valid_targets_mean": 1191.7, "valid_targets_min": 742 }, { "epoch": 2.1867321867321867, "grad_norm": 0.7837923417661988, "learning_rate": 3.21023066460501e-05, "loss": 0.175, "loss_nan_ranks": 0, "loss_rank_avg": 0.18245768547058105, "step": 890, "valid_targets_mean": 1483.2, "valid_targets_min": 826 }, { "epoch": 2.199017199017199, "grad_norm": 0.8390698587520268, "learning_rate": 3.198815483383492e-05, "loss": 0.1809, "loss_nan_ranks": 0, "loss_rank_avg": 0.17464491724967957, "step": 895, "valid_targets_mean": 1178.8, "valid_targets_min": 474 }, { "epoch": 2.211302211302211, "grad_norm": 0.8929645135048639, "learning_rate": 3.1873390205566295e-05, "loss": 0.1809, "loss_nan_ranks": 0, "loss_rank_avg": 0.19350141286849976, "step": 900, "valid_targets_mean": 1195.6, "valid_targets_min": 647 }, { "epoch": 2.2235872235872236, "grad_norm": 0.800799760583441, "learning_rate": 3.175801862783565e-05, "loss": 0.1802, "loss_nan_ranks": 0, "loss_rank_avg": 0.18399956822395325, "step": 905, "valid_targets_mean": 1394.0, "valid_targets_min": 762 }, { "epoch": 2.235872235872236, "grad_norm": 0.861812106568346, "learning_rate": 3.164204599826077e-05, "loss": 0.1794, "loss_nan_ranks": 0, "loss_rank_avg": 0.18631041049957275, "step": 910, "valid_targets_mean": 1266.8, "valid_targets_min": 707 }, { "epoch": 2.248157248157248, "grad_norm": 0.8136719833422565, "learning_rate": 3.1525478245184245e-05, "loss": 0.1776, "loss_nan_ranks": 0, "loss_rank_avg": 0.2019607126712799, "step": 915, "valid_targets_mean": 1316.0, "valid_targets_min": 760 }, { "epoch": 2.2604422604422605, "grad_norm": 0.7104387985554499, "learning_rate": 3.140832132737051e-05, "loss": 0.1754, "loss_nan_ranks": 0, "loss_rank_avg": 0.17880454659461975, "step": 920, "valid_targets_mean": 1386.5, "valid_targets_min": 745 }, { "epoch": 2.2727272727272725, "grad_norm": 0.723347779565406, "learning_rate": 3.129058123370116e-05, "loss": 0.1823, "loss_nan_ranks": 0, "loss_rank_avg": 0.1798139065504074, "step": 925, "valid_targets_mean": 1418.9, "valid_targets_min": 806 }, { "epoch": 2.285012285012285, "grad_norm": 0.8227450691436261, "learning_rate": 3.117226398286887e-05, "loss": 0.1764, "loss_nan_ranks": 0, "loss_rank_avg": 0.17978253960609436, "step": 930, "valid_targets_mean": 1198.0, "valid_targets_min": 637 }, { "epoch": 2.2972972972972974, "grad_norm": 0.8181621906002657, "learning_rate": 3.105337562306968e-05, "loss": 0.185, "loss_nan_ranks": 0, "loss_rank_avg": 0.18528032302856445, "step": 935, "valid_targets_mean": 1467.1, "valid_targets_min": 939 }, { "epoch": 2.30958230958231, "grad_norm": 0.8628823590456987, "learning_rate": 3.0933922231693854e-05, "loss": 0.1788, "loss_nan_ranks": 0, "loss_rank_avg": 0.18646690249443054, "step": 940, "valid_targets_mean": 1327.8, "valid_targets_min": 768 }, { "epoch": 2.321867321867322, "grad_norm": 0.8312067805411888, "learning_rate": 3.08139099150152e-05, "loss": 0.189, "loss_nan_ranks": 0, "loss_rank_avg": 0.19820252060890198, "step": 945, "valid_targets_mean": 1358.0, "valid_targets_min": 902 }, { "epoch": 2.3341523341523343, "grad_norm": 0.7391010728907489, "learning_rate": 3.069334480787893e-05, "loss": 0.1789, "loss_nan_ranks": 0, "loss_rank_avg": 0.17447155714035034, "step": 950, "valid_targets_mean": 1403.9, "valid_targets_min": 564 }, { "epoch": 2.3464373464373462, "grad_norm": 0.8098616372815506, "learning_rate": 3.057223307338806e-05, "loss": 0.1828, "loss_nan_ranks": 0, "loss_rank_avg": 0.18852627277374268, "step": 955, "valid_targets_mean": 1456.1, "valid_targets_min": 823 }, { "epoch": 2.3587223587223587, "grad_norm": 0.8698102007694762, "learning_rate": 3.0450580902588346e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.18752536177635193, "step": 960, "valid_targets_mean": 1266.6, "valid_targets_min": 777 }, { "epoch": 2.371007371007371, "grad_norm": 0.7876664418489986, "learning_rate": 3.032839451415182e-05, "loss": 0.1836, "loss_nan_ranks": 0, "loss_rank_avg": 0.1748538315296173, "step": 965, "valid_targets_mean": 1193.6, "valid_targets_min": 457 }, { "epoch": 2.383292383292383, "grad_norm": 0.7113855892489315, "learning_rate": 3.0205680154058904e-05, "loss": 0.1775, "loss_nan_ranks": 0, "loss_rank_avg": 0.1739535927772522, "step": 970, "valid_targets_mean": 1514.7, "valid_targets_min": 697 }, { "epoch": 2.3955773955773956, "grad_norm": 0.8142211234131692, "learning_rate": 3.0082444095279117e-05, "loss": 0.1758, "loss_nan_ranks": 0, "loss_rank_avg": 0.1813521385192871, "step": 975, "valid_targets_mean": 1334.5, "valid_targets_min": 708 }, { "epoch": 2.407862407862408, "grad_norm": 0.8197074469826403, "learning_rate": 2.9958692637450406e-05, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.16367939114570618, "step": 980, "valid_targets_mean": 1228.6, "valid_targets_min": 643 }, { "epoch": 2.42014742014742, "grad_norm": 0.8541938784954854, "learning_rate": 2.983443210655714e-05, "loss": 0.1735, "loss_nan_ranks": 0, "loss_rank_avg": 0.17588171362876892, "step": 985, "valid_targets_mean": 1190.8, "valid_targets_min": 682 }, { "epoch": 2.4324324324324325, "grad_norm": 0.7846425314619295, "learning_rate": 2.9709668854606706e-05, "loss": 0.1882, "loss_nan_ranks": 0, "loss_rank_avg": 0.18857240676879883, "step": 990, "valid_targets_mean": 1355.1, "valid_targets_min": 614 }, { "epoch": 2.444717444717445, "grad_norm": 0.7576298642207422, "learning_rate": 2.9584409259304828e-05, "loss": 0.1844, "loss_nan_ranks": 0, "loss_rank_avg": 0.17525619268417358, "step": 995, "valid_targets_mean": 1319.9, "valid_targets_min": 770 }, { "epoch": 2.457002457002457, "grad_norm": 0.8880135398527781, "learning_rate": 2.945865972372954e-05, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.1825505644083023, "step": 1000, "valid_targets_mean": 1444.0, "valid_targets_min": 958 }, { "epoch": 2.4692874692874693, "grad_norm": 0.744044465614355, "learning_rate": 2.9332426676003858e-05, "loss": 0.1837, "loss_nan_ranks": 0, "loss_rank_avg": 0.17693683505058289, "step": 1005, "valid_targets_mean": 1339.9, "valid_targets_min": 802 }, { "epoch": 2.4815724815724813, "grad_norm": 0.7799185661658911, "learning_rate": 2.920571656896722e-05, "loss": 0.178, "loss_nan_ranks": 0, "loss_rank_avg": 0.17789432406425476, "step": 1010, "valid_targets_mean": 1302.0, "valid_targets_min": 782 }, { "epoch": 2.493857493857494, "grad_norm": 0.8361418168804058, "learning_rate": 2.907853587984558e-05, "loss": 0.1792, "loss_nan_ranks": 0, "loss_rank_avg": 0.18084871768951416, "step": 1015, "valid_targets_mean": 1297.5, "valid_targets_min": 685 }, { "epoch": 2.506142506142506, "grad_norm": 0.8486435962691962, "learning_rate": 2.8950891109920333e-05, "loss": 0.1785, "loss_nan_ranks": 0, "loss_rank_avg": 0.18357740342617035, "step": 1020, "valid_targets_mean": 1246.6, "valid_targets_min": 770 }, { "epoch": 2.5184275184275187, "grad_norm": 0.807405719311044, "learning_rate": 2.882278878419597e-05, "loss": 0.1764, "loss_nan_ranks": 0, "loss_rank_avg": 0.1806846410036087, "step": 1025, "valid_targets_mean": 1253.2, "valid_targets_min": 579 }, { "epoch": 2.5307125307125307, "grad_norm": 0.8520779946572644, "learning_rate": 2.8694235451066538e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.1823638379573822, "step": 1030, "valid_targets_mean": 1461.3, "valid_targets_min": 856 }, { "epoch": 2.542997542997543, "grad_norm": 1.0429862912852512, "learning_rate": 2.8565237681980876e-05, "loss": 0.1734, "loss_nan_ranks": 0, "loss_rank_avg": 0.17990875244140625, "step": 1035, "valid_targets_mean": 1360.1, "valid_targets_min": 836 }, { "epoch": 2.555282555282555, "grad_norm": 0.7262570397634495, "learning_rate": 2.843580207110672e-05, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.1686376929283142, "step": 1040, "valid_targets_mean": 1346.9, "valid_targets_min": 736 }, { "epoch": 2.5675675675675675, "grad_norm": 0.7531761897578519, "learning_rate": 2.830593523499361e-05, "loss": 0.1803, "loss_nan_ranks": 0, "loss_rank_avg": 0.18114441633224487, "step": 1045, "valid_targets_mean": 1371.8, "valid_targets_min": 771 }, { "epoch": 2.57985257985258, "grad_norm": 0.793803225751772, "learning_rate": 2.8175643812234627e-05, "loss": 0.1778, "loss_nan_ranks": 0, "loss_rank_avg": 0.17945504188537598, "step": 1050, "valid_targets_mean": 1413.5, "valid_targets_min": 826 }, { "epoch": 2.592137592137592, "grad_norm": 0.9123261601174015, "learning_rate": 2.8044934463127108e-05, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.1872619390487671, "step": 1055, "valid_targets_mean": 1261.8, "valid_targets_min": 759 }, { "epoch": 2.6044226044226044, "grad_norm": 0.7979823264894937, "learning_rate": 2.7913813869332112e-05, "loss": 0.1753, "loss_nan_ranks": 0, "loss_rank_avg": 0.1702994406223297, "step": 1060, "valid_targets_mean": 1177.8, "valid_targets_min": 654 }, { "epoch": 2.616707616707617, "grad_norm": 0.7996971813748655, "learning_rate": 2.7782288733532915e-05, "loss": 0.1797, "loss_nan_ranks": 0, "loss_rank_avg": 0.1733815222978592, "step": 1065, "valid_targets_mean": 1196.7, "valid_targets_min": 671 }, { "epoch": 2.628992628992629, "grad_norm": 0.8323833609213411, "learning_rate": 2.7650365779092346e-05, "loss": 0.1765, "loss_nan_ranks": 0, "loss_rank_avg": 0.17033511400222778, "step": 1070, "valid_targets_mean": 1238.1, "valid_targets_min": 632 }, { "epoch": 2.6412776412776413, "grad_norm": 0.8537456313959788, "learning_rate": 2.751805174970912e-05, "loss": 0.1815, "loss_nan_ranks": 0, "loss_rank_avg": 0.1890188306570053, "step": 1075, "valid_targets_mean": 1366.6, "valid_targets_min": 724 }, { "epoch": 2.6535626535626538, "grad_norm": 0.8217031611080989, "learning_rate": 2.7385353409073093e-05, "loss": 0.183, "loss_nan_ranks": 0, "loss_rank_avg": 0.1882573664188385, "step": 1080, "valid_targets_mean": 1193.4, "valid_targets_min": 626 }, { "epoch": 2.6658476658476657, "grad_norm": 0.8348829168323537, "learning_rate": 2.725227754051953e-05, "loss": 0.1816, "loss_nan_ranks": 0, "loss_rank_avg": 0.18410508334636688, "step": 1085, "valid_targets_mean": 1281.5, "valid_targets_min": 711 }, { "epoch": 2.678132678132678, "grad_norm": 0.8190757683782894, "learning_rate": 2.711883094668234e-05, "loss": 0.1741, "loss_nan_ranks": 0, "loss_rank_avg": 0.16918015480041504, "step": 1090, "valid_targets_mean": 1204.8, "valid_targets_min": 571 }, { "epoch": 2.69041769041769, "grad_norm": 0.7763515026478695, "learning_rate": 2.698502044914633e-05, "loss": 0.173, "loss_nan_ranks": 0, "loss_rank_avg": 0.18051014840602875, "step": 1095, "valid_targets_mean": 1259.6, "valid_targets_min": 814 }, { "epoch": 2.7027027027027026, "grad_norm": 0.8114087614186496, "learning_rate": 2.685085288809853e-05, "loss": 0.1812, "loss_nan_ranks": 0, "loss_rank_avg": 0.18935176730155945, "step": 1100, "valid_targets_mean": 1320.4, "valid_targets_min": 763 }, { "epoch": 2.714987714987715, "grad_norm": 0.7857431478660847, "learning_rate": 2.671633512197848e-05, "loss": 0.181, "loss_nan_ranks": 0, "loss_rank_avg": 0.18005716800689697, "step": 1105, "valid_targets_mean": 1404.3, "valid_targets_min": 1088 }, { "epoch": 2.7272727272727275, "grad_norm": 0.7736276544807723, "learning_rate": 2.658147402712768e-05, "loss": 0.1784, "loss_nan_ranks": 0, "loss_rank_avg": 0.1820794641971588, "step": 1110, "valid_targets_mean": 1390.3, "valid_targets_min": 968 }, { "epoch": 2.7395577395577395, "grad_norm": 0.9867019712115244, "learning_rate": 2.6446276497438064e-05, "loss": 0.1768, "loss_nan_ranks": 0, "loss_rank_avg": 0.18605422973632812, "step": 1115, "valid_targets_mean": 1098.2, "valid_targets_min": 700 }, { "epoch": 2.751842751842752, "grad_norm": 0.84967200704623, "learning_rate": 2.6310749443999593e-05, "loss": 0.1841, "loss_nan_ranks": 0, "loss_rank_avg": 0.1918058693408966, "step": 1120, "valid_targets_mean": 1148.2, "valid_targets_min": 782 }, { "epoch": 2.764127764127764, "grad_norm": 0.8505940380680246, "learning_rate": 2.617489979474699e-05, "loss": 0.1784, "loss_nan_ranks": 0, "loss_rank_avg": 0.18517403304576874, "step": 1125, "valid_targets_mean": 1168.7, "valid_targets_min": 620 }, { "epoch": 2.7764127764127764, "grad_norm": 0.7530757761401906, "learning_rate": 2.6038734494105562e-05, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.1890183687210083, "step": 1130, "valid_targets_mean": 1517.5, "valid_targets_min": 865 }, { "epoch": 2.788697788697789, "grad_norm": 0.8401579570867019, "learning_rate": 2.590226050263625e-05, "loss": 0.1733, "loss_nan_ranks": 0, "loss_rank_avg": 0.16918352246284485, "step": 1135, "valid_targets_mean": 1212.0, "valid_targets_min": 710 }, { "epoch": 2.800982800982801, "grad_norm": 0.8601827378880036, "learning_rate": 2.5765484796679768e-05, "loss": 0.1774, "loss_nan_ranks": 0, "loss_rank_avg": 0.1912257969379425, "step": 1140, "valid_targets_mean": 1214.9, "valid_targets_min": 674 }, { "epoch": 2.8132678132678133, "grad_norm": 0.8033832037490392, "learning_rate": 2.5628414368000035e-05, "loss": 0.183, "loss_nan_ranks": 0, "loss_rank_avg": 0.17666852474212646, "step": 1145, "valid_targets_mean": 1377.9, "valid_targets_min": 784 }, { "epoch": 2.8255528255528253, "grad_norm": 0.7512530664621442, "learning_rate": 2.5491056223426746e-05, "loss": 0.184, "loss_nan_ranks": 0, "loss_rank_avg": 0.18542739748954773, "step": 1150, "valid_targets_mean": 1384.6, "valid_targets_min": 873 }, { "epoch": 2.8378378378378377, "grad_norm": 0.8782223426492971, "learning_rate": 2.5353417384497166e-05, "loss": 0.179, "loss_nan_ranks": 0, "loss_rank_avg": 0.1851997822523117, "step": 1155, "valid_targets_mean": 1129.2, "valid_targets_min": 631 }, { "epoch": 2.85012285012285, "grad_norm": 0.8625211224696377, "learning_rate": 2.5215504887097243e-05, "loss": 0.1826, "loss_nan_ranks": 0, "loss_rank_avg": 0.20872226357460022, "step": 1160, "valid_targets_mean": 1269.6, "valid_targets_min": 683 }, { "epoch": 2.8624078624078626, "grad_norm": 0.7562673187162171, "learning_rate": 2.5077325781101918e-05, "loss": 0.1833, "loss_nan_ranks": 0, "loss_rank_avg": 0.17310750484466553, "step": 1165, "valid_targets_mean": 1283.8, "valid_targets_min": 582 }, { "epoch": 2.8746928746928746, "grad_norm": 0.8744562203843028, "learning_rate": 2.493888713001476e-05, "loss": 0.1796, "loss_nan_ranks": 0, "loss_rank_avg": 0.18026913702487946, "step": 1170, "valid_targets_mean": 1212.1, "valid_targets_min": 691 }, { "epoch": 2.886977886977887, "grad_norm": 0.7979652681313569, "learning_rate": 2.480019601060687e-05, "loss": 0.1787, "loss_nan_ranks": 0, "loss_rank_avg": 0.19717931747436523, "step": 1175, "valid_targets_mean": 1335.1, "valid_targets_min": 830 }, { "epoch": 2.899262899262899, "grad_norm": 0.7494625305278567, "learning_rate": 2.4661259512555176e-05, "loss": 0.1813, "loss_nan_ranks": 0, "loss_rank_avg": 0.1821805238723755, "step": 1180, "valid_targets_mean": 1392.2, "valid_targets_min": 1080 }, { "epoch": 2.9115479115479115, "grad_norm": 0.8592457680594853, "learning_rate": 2.4522084738079933e-05, "loss": 0.1782, "loss_nan_ranks": 0, "loss_rank_avg": 0.19203343987464905, "step": 1185, "valid_targets_mean": 1296.5, "valid_targets_min": 773 }, { "epoch": 2.923832923832924, "grad_norm": 0.787142547780488, "learning_rate": 2.4382678801581762e-05, "loss": 0.1747, "loss_nan_ranks": 0, "loss_rank_avg": 0.16595681011676788, "step": 1190, "valid_targets_mean": 1291.5, "valid_targets_min": 633 }, { "epoch": 2.9361179361179364, "grad_norm": 0.7237730028951334, "learning_rate": 2.4243048829277916e-05, "loss": 0.1829, "loss_nan_ranks": 0, "loss_rank_avg": 0.16514533758163452, "step": 1195, "valid_targets_mean": 1309.0, "valid_targets_min": 615 }, { "epoch": 2.9484029484029484, "grad_norm": 0.8443033469283165, "learning_rate": 2.410320195883802e-05, "loss": 0.172, "loss_nan_ranks": 0, "loss_rank_avg": 0.18028348684310913, "step": 1200, "valid_targets_mean": 1211.9, "valid_targets_min": 576 }, { "epoch": 2.960687960687961, "grad_norm": 0.8259230182106898, "learning_rate": 2.396314533901918e-05, "loss": 0.1762, "loss_nan_ranks": 0, "loss_rank_avg": 0.17320460081100464, "step": 1205, "valid_targets_mean": 1226.4, "valid_targets_min": 605 }, { "epoch": 2.972972972972973, "grad_norm": 0.7764557250016658, "learning_rate": 2.3822886129300603e-05, "loss": 0.18, "loss_nan_ranks": 0, "loss_rank_avg": 0.18336926400661469, "step": 1210, "valid_targets_mean": 1345.6, "valid_targets_min": 898 }, { "epoch": 2.9852579852579852, "grad_norm": 0.8960330072091445, "learning_rate": 2.368243149951755e-05, "loss": 0.1823, "loss_nan_ranks": 0, "loss_rank_avg": 0.18257874250411987, "step": 1215, "valid_targets_mean": 1147.5, "valid_targets_min": 623 }, { "epoch": 2.9975429975429977, "grad_norm": 0.7570835868850769, "learning_rate": 2.3541788629494865e-05, "loss": 0.1805, "loss_nan_ranks": 0, "loss_rank_avg": 0.17076748609542847, "step": 1220, "valid_targets_mean": 1296.3, "valid_targets_min": 635 }, { "epoch": 3.0098280098280097, "grad_norm": 0.72326162291509, "learning_rate": 2.3400964708679944e-05, "loss": 0.1534, "loss_nan_ranks": 0, "loss_rank_avg": 0.13778720796108246, "step": 1225, "valid_targets_mean": 1254.6, "valid_targets_min": 651 }, { "epoch": 3.022113022113022, "grad_norm": 0.8572240220731201, "learning_rate": 2.325996693577522e-05, "loss": 0.1583, "loss_nan_ranks": 0, "loss_rank_avg": 0.15546341240406036, "step": 1230, "valid_targets_mean": 1392.1, "valid_targets_min": 799 }, { "epoch": 3.0343980343980346, "grad_norm": 0.8406897333538058, "learning_rate": 2.311880251837019e-05, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.1490376889705658, "step": 1235, "valid_targets_mean": 1217.6, "valid_targets_min": 696 }, { "epoch": 3.0466830466830466, "grad_norm": 0.8128667720747944, "learning_rate": 2.2977478672572933e-05, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.15579545497894287, "step": 1240, "valid_targets_mean": 1323.8, "valid_targets_min": 666 }, { "epoch": 3.058968058968059, "grad_norm": 0.8117066580399452, "learning_rate": 2.2836002622641297e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.16121074557304382, "step": 1245, "valid_targets_mean": 1316.7, "valid_targets_min": 695 }, { "epoch": 3.0712530712530715, "grad_norm": 0.8662224455967267, "learning_rate": 2.269438160061354e-05, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.1444993019104004, "step": 1250, "valid_targets_mean": 1238.2, "valid_targets_min": 810 }, { "epoch": 3.0835380835380835, "grad_norm": 0.8817439219548429, "learning_rate": 2.2552622845938698e-05, "loss": 0.1533, "loss_nan_ranks": 0, "loss_rank_avg": 0.15430381894111633, "step": 1255, "valid_targets_mean": 1404.1, "valid_targets_min": 857 }, { "epoch": 3.095823095823096, "grad_norm": 0.8477302153623169, "learning_rate": 2.2410733605106462e-05, "loss": 0.1564, "loss_nan_ranks": 0, "loss_rank_avg": 0.1634480059146881, "step": 1260, "valid_targets_mean": 1147.9, "valid_targets_min": 604 }, { "epoch": 3.108108108108108, "grad_norm": 0.8243597226463298, "learning_rate": 2.2268721131276805e-05, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.15756012499332428, "step": 1265, "valid_targets_mean": 1393.2, "valid_targets_min": 747 }, { "epoch": 3.1203931203931203, "grad_norm": 0.8937269373033379, "learning_rate": 2.2126592683909154e-05, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.15642580389976501, "step": 1270, "valid_targets_mean": 1184.4, "valid_targets_min": 614 }, { "epoch": 3.1326781326781328, "grad_norm": 0.8160928913633115, "learning_rate": 2.1984355528391342e-05, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.15530337393283844, "step": 1275, "valid_targets_mean": 1350.1, "valid_targets_min": 758 }, { "epoch": 3.1449631449631448, "grad_norm": 0.8916891912210628, "learning_rate": 2.1842016935668188e-05, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.17001807689666748, "step": 1280, "valid_targets_mean": 1380.8, "valid_targets_min": 746 }, { "epoch": 3.157248157248157, "grad_norm": 0.8639371441585546, "learning_rate": 2.169958418186982e-05, "loss": 0.1606, "loss_nan_ranks": 0, "loss_rank_avg": 0.15526992082595825, "step": 1285, "valid_targets_mean": 1277.1, "valid_targets_min": 738 }, { "epoch": 3.1695331695331697, "grad_norm": 0.8130627821075446, "learning_rate": 2.1557064547939754e-05, "loss": 0.1556, "loss_nan_ranks": 0, "loss_rank_avg": 0.14274147152900696, "step": 1290, "valid_targets_mean": 1234.9, "valid_targets_min": 810 }, { "epoch": 3.1818181818181817, "grad_norm": 0.7746615359719721, "learning_rate": 2.1414465319262666e-05, "loss": 0.1547, "loss_nan_ranks": 0, "loss_rank_avg": 0.14222201704978943, "step": 1295, "valid_targets_mean": 1286.1, "valid_targets_min": 681 }, { "epoch": 3.194103194103194, "grad_norm": 0.7520776877457452, "learning_rate": 2.1271793785291997e-05, "loss": 0.1498, "loss_nan_ranks": 0, "loss_rank_avg": 0.1390017867088318, "step": 1300, "valid_targets_mean": 1272.8, "valid_targets_min": 602 }, { "epoch": 3.2063882063882065, "grad_norm": 0.8462893075712905, "learning_rate": 2.1129057239177337e-05, "loss": 0.1551, "loss_nan_ranks": 0, "loss_rank_avg": 0.15616267919540405, "step": 1305, "valid_targets_mean": 1242.9, "valid_targets_min": 748 }, { "epoch": 3.2186732186732185, "grad_norm": 0.8539575906844962, "learning_rate": 2.0986262977391577e-05, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.1531214714050293, "step": 1310, "valid_targets_mean": 1199.8, "valid_targets_min": 728 }, { "epoch": 3.230958230958231, "grad_norm": 0.8428538051981783, "learning_rate": 2.084341829935796e-05, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.1577906310558319, "step": 1315, "valid_targets_mean": 1258.8, "valid_targets_min": 664 }, { "epoch": 3.2432432432432434, "grad_norm": 0.84603528658779, "learning_rate": 2.0700530507076916e-05, "loss": 0.1472, "loss_nan_ranks": 0, "loss_rank_avg": 0.14432299137115479, "step": 1320, "valid_targets_mean": 1210.4, "valid_targets_min": 807 }, { "epoch": 3.2555282555282554, "grad_norm": 0.9102137746252226, "learning_rate": 2.0557606904752833e-05, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.15487079322338104, "step": 1325, "valid_targets_mean": 1167.1, "valid_targets_min": 474 }, { "epoch": 3.267813267813268, "grad_norm": 0.8050078740673396, "learning_rate": 2.0414654798420622e-05, "loss": 0.1443, "loss_nan_ranks": 0, "loss_rank_avg": 0.15707707405090332, "step": 1330, "valid_targets_mean": 1354.5, "valid_targets_min": 772 }, { "epoch": 3.2800982800982803, "grad_norm": 0.8353880109503813, "learning_rate": 2.02716814955723e-05, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.14280740916728973, "step": 1335, "valid_targets_mean": 1208.4, "valid_targets_min": 597 }, { "epoch": 3.2923832923832923, "grad_norm": 0.8659682584614259, "learning_rate": 2.0128694304783406e-05, "loss": 0.1551, "loss_nan_ranks": 0, "loss_rank_avg": 0.15830692648887634, "step": 1340, "valid_targets_mean": 1201.9, "valid_targets_min": 730 }, { "epoch": 3.3046683046683047, "grad_norm": 0.8379988002065017, "learning_rate": 1.9985700535339406e-05, "loss": 0.1569, "loss_nan_ranks": 0, "loss_rank_avg": 0.1467028260231018, "step": 1345, "valid_targets_mean": 1127.9, "valid_targets_min": 845 }, { "epoch": 3.3169533169533167, "grad_norm": 1.1917573647951119, "learning_rate": 1.984270749686207e-05, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.13254572451114655, "step": 1350, "valid_targets_mean": 1263.1, "valid_targets_min": 536 }, { "epoch": 3.329238329238329, "grad_norm": 0.8655024458620978, "learning_rate": 1.9699722498935786e-05, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.15300899744033813, "step": 1355, "valid_targets_mean": 1207.4, "valid_targets_min": 563 }, { "epoch": 3.3415233415233416, "grad_norm": 0.7847387083906133, "learning_rate": 1.9556752850733933e-05, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.13689152896404266, "step": 1360, "valid_targets_mean": 1255.2, "valid_targets_min": 706 }, { "epoch": 3.3538083538083536, "grad_norm": 0.8693425075316302, "learning_rate": 1.9413805860645242e-05, "loss": 0.1609, "loss_nan_ranks": 0, "loss_rank_avg": 0.17255070805549622, "step": 1365, "valid_targets_mean": 1268.3, "valid_targets_min": 692 }, { "epoch": 3.366093366093366, "grad_norm": 0.8576356082893154, "learning_rate": 1.9270888835900165e-05, "loss": 0.1616, "loss_nan_ranks": 0, "loss_rank_avg": 0.1623215675354004, "step": 1370, "valid_targets_mean": 1256.3, "valid_targets_min": 700 }, { "epoch": 3.3783783783783785, "grad_norm": 0.8842690706850099, "learning_rate": 1.9128009082197417e-05, "loss": 0.1504, "loss_nan_ranks": 0, "loss_rank_avg": 0.14834919571876526, "step": 1375, "valid_targets_mean": 1141.1, "valid_targets_min": 685 }, { "epoch": 3.3906633906633905, "grad_norm": 0.803567248692513, "learning_rate": 1.8985173903330428e-05, "loss": 0.1521, "loss_nan_ranks": 0, "loss_rank_avg": 0.15296560525894165, "step": 1380, "valid_targets_mean": 1291.1, "valid_targets_min": 494 }, { "epoch": 3.402948402948403, "grad_norm": 0.8228636441386455, "learning_rate": 1.884239060081407e-05, "loss": 0.1442, "loss_nan_ranks": 0, "loss_rank_avg": 0.14132916927337646, "step": 1385, "valid_targets_mean": 1182.8, "valid_targets_min": 808 }, { "epoch": 3.4152334152334154, "grad_norm": 0.8389934209523321, "learning_rate": 1.869966647351135e-05, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.1495848149061203, "step": 1390, "valid_targets_mean": 1253.1, "valid_targets_min": 667 }, { "epoch": 3.4275184275184274, "grad_norm": 0.7601245259644186, "learning_rate": 1.8557008817260343e-05, "loss": 0.1554, "loss_nan_ranks": 0, "loss_rank_avg": 0.14485347270965576, "step": 1395, "valid_targets_mean": 1379.3, "valid_targets_min": 871 }, { "epoch": 3.43980343980344, "grad_norm": 0.8713323917939153, "learning_rate": 1.8414424924501222e-05, "loss": 0.1596, "loss_nan_ranks": 0, "loss_rank_avg": 0.1464325487613678, "step": 1400, "valid_targets_mean": 1344.7, "valid_targets_min": 681 }, { "epoch": 3.4520884520884523, "grad_norm": 0.8116825428322517, "learning_rate": 1.827192208390347e-05, "loss": 0.1482, "loss_nan_ranks": 0, "loss_rank_avg": 0.14812307059764862, "step": 1405, "valid_targets_mean": 1292.6, "valid_targets_min": 532 }, { "epoch": 3.4643734643734643, "grad_norm": 0.830495465611543, "learning_rate": 1.812950757999334e-05, "loss": 0.1553, "loss_nan_ranks": 0, "loss_rank_avg": 0.14193110167980194, "step": 1410, "valid_targets_mean": 1182.0, "valid_targets_min": 516 }, { "epoch": 3.4766584766584767, "grad_norm": 0.8420966729919014, "learning_rate": 1.7987188692781417e-05, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.15079256892204285, "step": 1415, "valid_targets_mean": 1302.2, "valid_targets_min": 828 }, { "epoch": 3.488943488943489, "grad_norm": 0.805934689519132, "learning_rate": 1.784497269739052e-05, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.14082270860671997, "step": 1420, "valid_targets_mean": 1309.8, "valid_targets_min": 477 }, { "epoch": 3.501228501228501, "grad_norm": 0.9110728170126068, "learning_rate": 1.770286686368381e-05, "loss": 0.1516, "loss_nan_ranks": 0, "loss_rank_avg": 0.15163275599479675, "step": 1425, "valid_targets_mean": 1216.3, "valid_targets_min": 755 }, { "epoch": 3.5135135135135136, "grad_norm": 1.010011400261342, "learning_rate": 1.756087845589312e-05, "loss": 0.1557, "loss_nan_ranks": 0, "loss_rank_avg": 0.1431485116481781, "step": 1430, "valid_targets_mean": 1191.9, "valid_targets_min": 599 }, { "epoch": 3.5257985257985256, "grad_norm": 0.8232817829751108, "learning_rate": 1.7419014732247683e-05, "loss": 0.1573, "loss_nan_ranks": 0, "loss_rank_avg": 0.16463416814804077, "step": 1435, "valid_targets_mean": 1286.1, "valid_targets_min": 736 }, { "epoch": 3.538083538083538, "grad_norm": 0.9408275175657097, "learning_rate": 1.7277282944603047e-05, "loss": 0.1611, "loss_nan_ranks": 0, "loss_rank_avg": 0.1658443808555603, "step": 1440, "valid_targets_mean": 1391.1, "valid_targets_min": 700 }, { "epoch": 3.5503685503685505, "grad_norm": 0.8964394826069799, "learning_rate": 1.713569033807041e-05, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.14551150798797607, "step": 1445, "valid_targets_mean": 1158.6, "valid_targets_min": 516 }, { "epoch": 3.562653562653563, "grad_norm": 0.6983703036178323, "learning_rate": 1.6994244150646244e-05, "loss": 0.1494, "loss_nan_ranks": 0, "loss_rank_avg": 0.13444580137729645, "step": 1450, "valid_targets_mean": 1367.5, "valid_targets_min": 618 }, { "epoch": 3.574938574938575, "grad_norm": 0.8407855929126276, "learning_rate": 1.6852951612842278e-05, "loss": 0.1542, "loss_nan_ranks": 0, "loss_rank_avg": 0.15283367037773132, "step": 1455, "valid_targets_mean": 1407.4, "valid_targets_min": 922 }, { "epoch": 3.5872235872235874, "grad_norm": 0.8242889096179601, "learning_rate": 1.671181994731595e-05, "loss": 0.1511, "loss_nan_ranks": 0, "loss_rank_avg": 0.146068274974823, "step": 1460, "valid_targets_mean": 1294.8, "valid_targets_min": 755 }, { "epoch": 3.5995085995085994, "grad_norm": 0.8648972544384124, "learning_rate": 1.6570856368501108e-05, "loss": 0.1578, "loss_nan_ranks": 0, "loss_rank_avg": 0.17492206394672394, "step": 1465, "valid_targets_mean": 1290.1, "valid_targets_min": 640 }, { "epoch": 3.611793611793612, "grad_norm": 0.8457602915141741, "learning_rate": 1.643006808223931e-05, "loss": 0.1505, "loss_nan_ranks": 0, "loss_rank_avg": 0.14468783140182495, "step": 1470, "valid_targets_mean": 1287.5, "valid_targets_min": 576 }, { "epoch": 3.6240786240786242, "grad_norm": 0.8532991002467062, "learning_rate": 1.6289462285411387e-05, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.1533271074295044, "step": 1475, "valid_targets_mean": 1243.2, "valid_targets_min": 754 }, { "epoch": 3.6363636363636362, "grad_norm": 0.8803826617627987, "learning_rate": 1.614904616556962e-05, "loss": 0.1445, "loss_nan_ranks": 0, "loss_rank_avg": 0.14523166418075562, "step": 1480, "valid_targets_mean": 1301.2, "valid_targets_min": 684 }, { "epoch": 3.6486486486486487, "grad_norm": 0.8542006788844356, "learning_rate": 1.6008826900570294e-05, "loss": 0.1506, "loss_nan_ranks": 0, "loss_rank_avg": 0.14371222257614136, "step": 1485, "valid_targets_mean": 1139.2, "valid_targets_min": 699 }, { "epoch": 3.6609336609336607, "grad_norm": 0.8745016942367656, "learning_rate": 1.586881165820675e-05, "loss": 0.1548, "loss_nan_ranks": 0, "loss_rank_avg": 0.154458150267601, "step": 1490, "valid_targets_mean": 1155.7, "valid_targets_min": 621 }, { "epoch": 3.673218673218673, "grad_norm": 0.8703992302998022, "learning_rate": 1.5729007595843037e-05, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.14299608767032623, "step": 1495, "valid_targets_mean": 1268.3, "valid_targets_min": 776 }, { "epoch": 3.6855036855036856, "grad_norm": 0.8095249679573774, "learning_rate": 1.5589421860047986e-05, "loss": 0.1544, "loss_nan_ranks": 0, "loss_rank_avg": 0.15553806722164154, "step": 1500, "valid_targets_mean": 1325.9, "valid_targets_min": 868 }, { "epoch": 3.697788697788698, "grad_norm": 0.8758318030682021, "learning_rate": 1.5450061586229903e-05, "loss": 0.1552, "loss_nan_ranks": 0, "loss_rank_avg": 0.15329515933990479, "step": 1505, "valid_targets_mean": 1132.9, "valid_targets_min": 679 }, { "epoch": 3.71007371007371, "grad_norm": 0.8363686738335151, "learning_rate": 1.5310933898271864e-05, "loss": 0.1515, "loss_nan_ranks": 0, "loss_rank_avg": 0.15566831827163696, "step": 1510, "valid_targets_mean": 1268.0, "valid_targets_min": 627 }, { "epoch": 3.7223587223587224, "grad_norm": 0.9279177914708184, "learning_rate": 1.5172045908167462e-05, "loss": 0.149, "loss_nan_ranks": 0, "loss_rank_avg": 0.14874522387981415, "step": 1515, "valid_targets_mean": 1278.6, "valid_targets_min": 619 }, { "epoch": 3.7346437346437344, "grad_norm": 0.8889669951596095, "learning_rate": 1.5033404715657344e-05, "loss": 0.152, "loss_nan_ranks": 0, "loss_rank_avg": 0.1446603238582611, "step": 1520, "valid_targets_mean": 1261.3, "valid_targets_min": 639 }, { "epoch": 3.746928746928747, "grad_norm": 0.9294511912472954, "learning_rate": 1.4895017407866217e-05, "loss": 0.1575, "loss_nan_ranks": 0, "loss_rank_avg": 0.15708409249782562, "step": 1525, "valid_targets_mean": 1087.5, "valid_targets_min": 578 }, { "epoch": 3.7592137592137593, "grad_norm": 0.7974453732071705, "learning_rate": 1.4756891058940606e-05, "loss": 0.1559, "loss_nan_ranks": 0, "loss_rank_avg": 0.16070222854614258, "step": 1530, "valid_targets_mean": 1359.7, "valid_targets_min": 631 }, { "epoch": 3.7714987714987718, "grad_norm": 0.7840160517261555, "learning_rate": 1.4619032729687223e-05, "loss": 0.1519, "loss_nan_ranks": 0, "loss_rank_avg": 0.15777051448822021, "step": 1535, "valid_targets_mean": 1339.7, "valid_targets_min": 703 }, { "epoch": 3.7837837837837838, "grad_norm": 0.8550911396739045, "learning_rate": 1.4481449467212004e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.14654958248138428, "step": 1540, "valid_targets_mean": 1197.9, "valid_targets_min": 661 }, { "epoch": 3.796068796068796, "grad_norm": 1.0416276131378706, "learning_rate": 1.4344148304559926e-05, "loss": 0.1508, "loss_nan_ranks": 0, "loss_rank_avg": 0.1543717384338379, "step": 1545, "valid_targets_mean": 1387.0, "valid_targets_min": 930 }, { "epoch": 3.808353808353808, "grad_norm": 0.7971903127956029, "learning_rate": 1.4207136260355426e-05, "loss": 0.1501, "loss_nan_ranks": 0, "loss_rank_avg": 0.15580767393112183, "step": 1550, "valid_targets_mean": 1369.1, "valid_targets_min": 844 }, { "epoch": 3.8206388206388207, "grad_norm": 0.8302888094156373, "learning_rate": 1.4070420338443667e-05, "loss": 0.1558, "loss_nan_ranks": 0, "loss_rank_avg": 0.15264888107776642, "step": 1555, "valid_targets_mean": 1372.4, "valid_targets_min": 652 }, { "epoch": 3.832923832923833, "grad_norm": 0.8113952097335243, "learning_rate": 1.3934007527532494e-05, "loss": 0.1541, "loss_nan_ranks": 0, "loss_rank_avg": 0.15965667366981506, "step": 1560, "valid_targets_mean": 1547.5, "valid_targets_min": 1012 }, { "epoch": 3.845208845208845, "grad_norm": 0.8016515224809283, "learning_rate": 1.3797904800835174e-05, "loss": 0.1517, "loss_nan_ranks": 0, "loss_rank_avg": 0.14814619719982147, "step": 1565, "valid_targets_mean": 1327.5, "valid_targets_min": 680 }, { "epoch": 3.8574938574938575, "grad_norm": 0.8101546175320481, "learning_rate": 1.3662119115713968e-05, "loss": 0.1543, "loss_nan_ranks": 0, "loss_rank_avg": 0.13531778752803802, "step": 1570, "valid_targets_mean": 1317.8, "valid_targets_min": 946 }, { "epoch": 3.8697788697788695, "grad_norm": 0.8752081945344778, "learning_rate": 1.3526657413324427e-05, "loss": 0.1483, "loss_nan_ranks": 0, "loss_rank_avg": 0.1407470703125, "step": 1575, "valid_targets_mean": 1331.0, "valid_targets_min": 755 }, { "epoch": 3.882063882063882, "grad_norm": 0.8025227410206387, "learning_rate": 1.3391526618260636e-05, "loss": 0.1509, "loss_nan_ranks": 0, "loss_rank_avg": 0.15067920088768005, "step": 1580, "valid_targets_mean": 1262.4, "valid_targets_min": 640 }, { "epoch": 3.8943488943488944, "grad_norm": 0.8935145822922234, "learning_rate": 1.3256733638201172e-05, "loss": 0.1518, "loss_nan_ranks": 0, "loss_rank_avg": 0.15884637832641602, "step": 1585, "valid_targets_mean": 1158.1, "valid_targets_min": 683 }, { "epoch": 3.906633906633907, "grad_norm": 0.7708791703581477, "learning_rate": 1.3122285363556053e-05, "loss": 0.15, "loss_nan_ranks": 0, "loss_rank_avg": 0.14581814408302307, "step": 1590, "valid_targets_mean": 1297.9, "valid_targets_min": 552 }, { "epoch": 3.918918918918919, "grad_norm": 0.8888029980587986, "learning_rate": 1.2988188667114487e-05, "loss": 0.1509, "loss_nan_ranks": 0, "loss_rank_avg": 0.1706969141960144, "step": 1595, "valid_targets_mean": 1370.7, "valid_targets_min": 749 }, { "epoch": 3.9312039312039313, "grad_norm": 0.8292708834052593, "learning_rate": 1.2854450403693526e-05, "loss": 0.154, "loss_nan_ranks": 0, "loss_rank_avg": 0.15968310832977295, "step": 1600, "valid_targets_mean": 1313.7, "valid_targets_min": 670 }, { "epoch": 3.9434889434889433, "grad_norm": 0.788269813578671, "learning_rate": 1.272107740978769e-05, "loss": 0.1535, "loss_nan_ranks": 0, "loss_rank_avg": 0.1440616101026535, "step": 1605, "valid_targets_mean": 1278.4, "valid_targets_min": 612 }, { "epoch": 3.9557739557739557, "grad_norm": 0.8037047070644282, "learning_rate": 1.2588076503219475e-05, "loss": 0.1532, "loss_nan_ranks": 0, "loss_rank_avg": 0.1564336121082306, "step": 1610, "valid_targets_mean": 1324.2, "valid_targets_min": 792 }, { "epoch": 3.968058968058968, "grad_norm": 0.7845890150943812, "learning_rate": 1.2455454482790859e-05, "loss": 0.1565, "loss_nan_ranks": 0, "loss_rank_avg": 0.1552063524723053, "step": 1615, "valid_targets_mean": 1362.6, "valid_targets_min": 680 }, { "epoch": 3.98034398034398, "grad_norm": 0.7747181055399516, "learning_rate": 1.2323218127935714e-05, "loss": 0.1481, "loss_nan_ranks": 0, "loss_rank_avg": 0.1518639624118805, "step": 1620, "valid_targets_mean": 1321.4, "valid_targets_min": 706 }, { "epoch": 3.9926289926289926, "grad_norm": 0.8558446375986389, "learning_rate": 1.2191374198373309e-05, "loss": 0.1523, "loss_nan_ranks": 0, "loss_rank_avg": 0.1543593853712082, "step": 1625, "valid_targets_mean": 1155.8, "valid_targets_min": 693 }, { "epoch": 4.004914004914005, "grad_norm": 0.781627123143895, "learning_rate": 1.2059929433762734e-05, "loss": 0.1497, "loss_nan_ranks": 0, "loss_rank_avg": 0.13371559977531433, "step": 1630, "valid_targets_mean": 1401.8, "valid_targets_min": 710 }, { "epoch": 4.017199017199017, "grad_norm": 0.7723114766334374, "learning_rate": 1.1928890553358352e-05, "loss": 0.1353, "loss_nan_ranks": 0, "loss_rank_avg": 0.135203018784523, "step": 1635, "valid_targets_mean": 1515.5, "valid_targets_min": 987 }, { "epoch": 4.0294840294840295, "grad_norm": 0.8735823383942167, "learning_rate": 1.1798264255666387e-05, "loss": 0.1315, "loss_nan_ranks": 0, "loss_rank_avg": 0.14232441782951355, "step": 1640, "valid_targets_mean": 1276.2, "valid_targets_min": 602 }, { "epoch": 4.041769041769042, "grad_norm": 0.8192596996969622, "learning_rate": 1.1668057218102436e-05, "loss": 0.1286, "loss_nan_ranks": 0, "loss_rank_avg": 0.11941641569137573, "step": 1645, "valid_targets_mean": 1408.4, "valid_targets_min": 597 }, { "epoch": 4.054054054054054, "grad_norm": 0.8924526222951878, "learning_rate": 1.1538276096650175e-05, "loss": 0.1298, "loss_nan_ranks": 0, "loss_rank_avg": 0.1319366693496704, "step": 1650, "valid_targets_mean": 1181.8, "valid_targets_min": 510 }, { "epoch": 4.066339066339066, "grad_norm": 0.7699089718854191, "learning_rate": 1.1408927525521118e-05, "loss": 0.1333, "loss_nan_ranks": 0, "loss_rank_avg": 0.1287621706724167, "step": 1655, "valid_targets_mean": 1414.1, "valid_targets_min": 768 }, { "epoch": 4.078624078624078, "grad_norm": 0.8099063799012394, "learning_rate": 1.1280018116815438e-05, "loss": 0.1308, "loss_nan_ranks": 0, "loss_rank_avg": 0.1263992041349411, "step": 1660, "valid_targets_mean": 1322.7, "valid_targets_min": 675 }, { "epoch": 4.090909090909091, "grad_norm": 0.8792757959344022, "learning_rate": 1.115155446018404e-05, "loss": 0.1297, "loss_nan_ranks": 0, "loss_rank_avg": 0.12545448541641235, "step": 1665, "valid_targets_mean": 1129.1, "valid_targets_min": 618 }, { "epoch": 4.103194103194103, "grad_norm": 0.8012256945891334, "learning_rate": 1.1023543122491626e-05, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.13978534936904907, "step": 1670, "valid_targets_mean": 1432.0, "valid_targets_min": 619 }, { "epoch": 4.115479115479116, "grad_norm": 0.8588845221042121, "learning_rate": 1.089599064748108e-05, "loss": 0.1319, "loss_nan_ranks": 0, "loss_rank_avg": 0.12195970118045807, "step": 1675, "valid_targets_mean": 1170.1, "valid_targets_min": 829 }, { "epoch": 4.127764127764128, "grad_norm": 0.8611293324266706, "learning_rate": 1.0768903555438927e-05, "loss": 0.1316, "loss_nan_ranks": 0, "loss_rank_avg": 0.1330062747001648, "step": 1680, "valid_targets_mean": 1203.4, "valid_targets_min": 866 }, { "epoch": 4.14004914004914, "grad_norm": 0.8547247627858316, "learning_rate": 1.0642288342862007e-05, "loss": 0.1279, "loss_nan_ranks": 0, "loss_rank_avg": 0.1295037716627121, "step": 1685, "valid_targets_mean": 1327.2, "valid_targets_min": 821 }, { "epoch": 4.152334152334152, "grad_norm": 0.9284978728629667, "learning_rate": 1.051615148212544e-05, "loss": 0.1302, "loss_nan_ranks": 0, "loss_rank_avg": 0.13765308260917664, "step": 1690, "valid_targets_mean": 1221.8, "valid_targets_min": 673 }, { "epoch": 4.164619164619165, "grad_norm": 0.8420408633139839, "learning_rate": 1.0390499421151706e-05, "loss": 0.1295, "loss_nan_ranks": 0, "loss_rank_avg": 0.12419085204601288, "step": 1695, "valid_targets_mean": 1425.6, "valid_targets_min": 838 }, { "epoch": 4.176904176904177, "grad_norm": 0.9003128577554333, "learning_rate": 1.0265338583081088e-05, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.1306770145893097, "step": 1700, "valid_targets_mean": 1178.5, "valid_targets_min": 644 }, { "epoch": 4.1891891891891895, "grad_norm": 0.9195424473786398, "learning_rate": 1.0140675365943284e-05, "loss": 0.1316, "loss_nan_ranks": 0, "loss_rank_avg": 0.13825950026512146, "step": 1705, "valid_targets_mean": 1205.4, "valid_targets_min": 740 }, { "epoch": 4.201474201474202, "grad_norm": 0.8994495082648482, "learning_rate": 1.0016516142330404e-05, "loss": 0.1336, "loss_nan_ranks": 0, "loss_rank_avg": 0.13527360558509827, "step": 1710, "valid_targets_mean": 1221.3, "valid_targets_min": 817 }, { "epoch": 4.2137592137592135, "grad_norm": 0.8912252331597237, "learning_rate": 9.89286725907117e-06, "loss": 0.1296, "loss_nan_ranks": 0, "loss_rank_avg": 0.13443750143051147, "step": 1715, "valid_targets_mean": 1249.4, "valid_targets_min": 764 }, { "epoch": 4.226044226044226, "grad_norm": 0.8920482099817841, "learning_rate": 9.769735036906475e-06, "loss": 0.1333, "loss_nan_ranks": 0, "loss_rank_avg": 0.1290460228919983, "step": 1720, "valid_targets_mean": 1142.9, "valid_targets_min": 686 }, { "epoch": 4.238329238329238, "grad_norm": 0.8527908969918075, "learning_rate": 9.647125770166321e-06, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.13044829666614532, "step": 1725, "valid_targets_mean": 1256.8, "valid_targets_min": 582 }, { "epoch": 4.250614250614251, "grad_norm": 0.8841584686314972, "learning_rate": 9.525045726448001e-06, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.13348722457885742, "step": 1730, "valid_targets_mean": 1273.6, "valid_targets_min": 708 }, { "epoch": 4.262899262899263, "grad_norm": 0.8702023826857563, "learning_rate": 9.40350114629577e-06, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.13443559408187866, "step": 1735, "valid_targets_mean": 1183.1, "valid_targets_min": 702 }, { "epoch": 4.275184275184275, "grad_norm": 0.8992471857795535, "learning_rate": 9.282498242881784e-06, "loss": 0.1322, "loss_nan_ranks": 0, "loss_rank_avg": 0.13517756760120392, "step": 1740, "valid_targets_mean": 1307.1, "valid_targets_min": 687 }, { "epoch": 4.287469287469287, "grad_norm": 0.796244329414364, "learning_rate": 9.162043201688517e-06, "loss": 0.1311, "loss_nan_ranks": 0, "loss_rank_avg": 0.12337645888328552, "step": 1745, "valid_targets_mean": 1191.1, "valid_targets_min": 695 }, { "epoch": 4.2997542997543, "grad_norm": 0.8370509126157433, "learning_rate": 9.042142180192596e-06, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.13218200206756592, "step": 1750, "valid_targets_mean": 1195.6, "valid_targets_min": 750 }, { "epoch": 4.312039312039312, "grad_norm": 0.8895263747387979, "learning_rate": 8.92280130754998e-06, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.1353050172328949, "step": 1755, "valid_targets_mean": 1278.0, "valid_targets_min": 683 }, { "epoch": 4.324324324324325, "grad_norm": 0.8271582266915379, "learning_rate": 8.804026684282694e-06, "loss": 0.1339, "loss_nan_ranks": 0, "loss_rank_avg": 0.13450637459754944, "step": 1760, "valid_targets_mean": 1315.7, "valid_targets_min": 723 }, { "epoch": 4.336609336609337, "grad_norm": 0.9520857741575197, "learning_rate": 8.685824381966975e-06, "loss": 0.1317, "loss_nan_ranks": 0, "loss_rank_avg": 0.13987067341804504, "step": 1765, "valid_targets_mean": 1201.6, "valid_targets_min": 661 }, { "epoch": 4.348894348894349, "grad_norm": 0.8757634606289378, "learning_rate": 8.568200442922865e-06, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.13092288374900818, "step": 1770, "valid_targets_mean": 1367.1, "valid_targets_min": 624 }, { "epoch": 4.361179361179361, "grad_norm": 0.8821249974469216, "learning_rate": 8.451160879905398e-06, "loss": 0.1331, "loss_nan_ranks": 0, "loss_rank_avg": 0.1396908462047577, "step": 1775, "valid_targets_mean": 1268.4, "valid_targets_min": 699 }, { "epoch": 4.3734643734643734, "grad_norm": 0.8236753936558183, "learning_rate": 8.33471167579717e-06, "loss": 0.1344, "loss_nan_ranks": 0, "loss_rank_avg": 0.13866353034973145, "step": 1780, "valid_targets_mean": 1363.2, "valid_targets_min": 925 }, { "epoch": 4.385749385749386, "grad_norm": 0.8390859558509741, "learning_rate": 8.218858783302566e-06, "loss": 0.1374, "loss_nan_ranks": 0, "loss_rank_avg": 0.13545829057693481, "step": 1785, "valid_targets_mean": 1287.6, "valid_targets_min": 619 }, { "epoch": 4.398034398034398, "grad_norm": 0.8518188407674924, "learning_rate": 8.103608124643412e-06, "loss": 0.1276, "loss_nan_ranks": 0, "loss_rank_avg": 0.1234915554523468, "step": 1790, "valid_targets_mean": 1293.2, "valid_targets_min": 745 }, { "epoch": 4.41031941031941, "grad_norm": 0.890765851149973, "learning_rate": 7.988965591256284e-06, "loss": 0.1386, "loss_nan_ranks": 0, "loss_rank_avg": 0.1416628658771515, "step": 1795, "valid_targets_mean": 1274.9, "valid_targets_min": 677 }, { "epoch": 4.422604422604422, "grad_norm": 0.8536233960569621, "learning_rate": 7.874937043491331e-06, "loss": 0.1358, "loss_nan_ranks": 0, "loss_rank_avg": 0.13207730650901794, "step": 1800, "valid_targets_mean": 1314.8, "valid_targets_min": 654 }, { "epoch": 4.434889434889435, "grad_norm": 0.8547910171850943, "learning_rate": 7.761528310312679e-06, "loss": 0.1339, "loss_nan_ranks": 0, "loss_rank_avg": 0.1310330182313919, "step": 1805, "valid_targets_mean": 1319.5, "valid_targets_min": 658 }, { "epoch": 4.447174447174447, "grad_norm": 0.8440973307304958, "learning_rate": 7.648745189000511e-06, "loss": 0.1276, "loss_nan_ranks": 0, "loss_rank_avg": 0.12474372982978821, "step": 1810, "valid_targets_mean": 1266.9, "valid_targets_min": 607 }, { "epoch": 4.45945945945946, "grad_norm": 0.8526523335996494, "learning_rate": 7.536593444854663e-06, "loss": 0.132, "loss_nan_ranks": 0, "loss_rank_avg": 0.13603094220161438, "step": 1815, "valid_targets_mean": 1392.1, "valid_targets_min": 679 }, { "epoch": 4.471744471744472, "grad_norm": 0.9451445141228779, "learning_rate": 7.4250788108999686e-06, "loss": 0.1332, "loss_nan_ranks": 0, "loss_rank_avg": 0.13309922814369202, "step": 1820, "valid_targets_mean": 1134.2, "valid_targets_min": 640 }, { "epoch": 4.484029484029484, "grad_norm": 0.8373347844464977, "learning_rate": 7.314206987593162e-06, "loss": 0.1388, "loss_nan_ranks": 0, "loss_rank_avg": 0.13399043679237366, "step": 1825, "valid_targets_mean": 1223.4, "valid_targets_min": 776 }, { "epoch": 4.496314496314496, "grad_norm": 0.8625925922345389, "learning_rate": 7.203983642531462e-06, "loss": 0.1352, "loss_nan_ranks": 0, "loss_rank_avg": 0.13259084522724152, "step": 1830, "valid_targets_mean": 1311.8, "valid_targets_min": 619 }, { "epoch": 4.5085995085995085, "grad_norm": 0.8870716782947434, "learning_rate": 7.094414410162913e-06, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.1382933109998703, "step": 1835, "valid_targets_mean": 1195.8, "valid_targets_min": 689 }, { "epoch": 4.520884520884521, "grad_norm": 0.7998309016979608, "learning_rate": 6.985504891498291e-06, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.11957763135433197, "step": 1840, "valid_targets_mean": 1288.3, "valid_targets_min": 661 }, { "epoch": 4.533169533169533, "grad_norm": 0.874780743207264, "learning_rate": 6.8772606538248285e-06, "loss": 0.1335, "loss_nan_ranks": 0, "loss_rank_avg": 0.1352095603942871, "step": 1845, "valid_targets_mean": 1310.2, "valid_targets_min": 680 }, { "epoch": 4.545454545454545, "grad_norm": 0.862924674798308, "learning_rate": 6.769687230421638e-06, "loss": 0.1332, "loss_nan_ranks": 0, "loss_rank_avg": 0.1378445029258728, "step": 1850, "valid_targets_mean": 1357.0, "valid_targets_min": 637 }, { "epoch": 4.557739557739557, "grad_norm": 0.8663590326432032, "learning_rate": 6.662790120276803e-06, "loss": 0.1354, "loss_nan_ranks": 0, "loss_rank_avg": 0.13520276546478271, "step": 1855, "valid_targets_mean": 1397.5, "valid_targets_min": 802 }, { "epoch": 4.57002457002457, "grad_norm": 0.9327490817540963, "learning_rate": 6.556574787806344e-06, "loss": 0.1325, "loss_nan_ranks": 0, "loss_rank_avg": 0.13693825900554657, "step": 1860, "valid_targets_mean": 1106.2, "valid_targets_min": 578 }, { "epoch": 4.582309582309582, "grad_norm": 0.9638863910492748, "learning_rate": 6.451046662574831e-06, "loss": 0.1362, "loss_nan_ranks": 0, "loss_rank_avg": 0.13662275671958923, "step": 1865, "valid_targets_mean": 1150.8, "valid_targets_min": 640 }, { "epoch": 4.594594594594595, "grad_norm": 0.8426325810722405, "learning_rate": 6.346211139017877e-06, "loss": 0.135, "loss_nan_ranks": 0, "loss_rank_avg": 0.1304231733083725, "step": 1870, "valid_targets_mean": 1320.3, "valid_targets_min": 684 }, { "epoch": 4.606879606879607, "grad_norm": 0.9787706797182959, "learning_rate": 6.242073576166337e-06, "loss": 0.1313, "loss_nan_ranks": 0, "loss_rank_avg": 0.13047711551189423, "step": 1875, "valid_targets_mean": 1202.9, "valid_targets_min": 700 }, { "epoch": 4.61916461916462, "grad_norm": 0.9005324833030341, "learning_rate": 6.138639297372404e-06, "loss": 0.1273, "loss_nan_ranks": 0, "loss_rank_avg": 0.13522884249687195, "step": 1880, "valid_targets_mean": 1393.9, "valid_targets_min": 873 }, { "epoch": 4.631449631449631, "grad_norm": 0.9236230373157407, "learning_rate": 6.035913590037479e-06, "loss": 0.1304, "loss_nan_ranks": 0, "loss_rank_avg": 0.13806456327438354, "step": 1885, "valid_targets_mean": 1168.8, "valid_targets_min": 726 }, { "epoch": 4.643734643734644, "grad_norm": 1.0647383277495284, "learning_rate": 5.933901705341851e-06, "loss": 0.134, "loss_nan_ranks": 0, "loss_rank_avg": 0.13539758324623108, "step": 1890, "valid_targets_mean": 1166.5, "valid_targets_min": 582 }, { "epoch": 4.656019656019656, "grad_norm": 0.855176271796815, "learning_rate": 5.832608857976321e-06, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.14015159010887146, "step": 1895, "valid_targets_mean": 1385.6, "valid_targets_min": 604 }, { "epoch": 4.6683046683046685, "grad_norm": 0.9385615083346516, "learning_rate": 5.732040225875584e-06, "loss": 0.1369, "loss_nan_ranks": 0, "loss_rank_avg": 0.1414608359336853, "step": 1900, "valid_targets_mean": 1284.1, "valid_targets_min": 740 }, { "epoch": 4.680589680589681, "grad_norm": 0.8787370830329286, "learning_rate": 5.632200949953579e-06, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.12882032990455627, "step": 1905, "valid_targets_mean": 1343.2, "valid_targets_min": 508 }, { "epoch": 4.6928746928746925, "grad_norm": 0.8641680753533743, "learning_rate": 5.533096133840677e-06, "loss": 0.1295, "loss_nan_ranks": 0, "loss_rank_avg": 0.12614941596984863, "step": 1910, "valid_targets_mean": 1258.2, "valid_targets_min": 624 }, { "epoch": 4.705159705159705, "grad_norm": 0.802865831972532, "learning_rate": 5.434730843622778e-06, "loss": 0.1269, "loss_nan_ranks": 0, "loss_rank_avg": 0.1227787509560585, "step": 1915, "valid_targets_mean": 1437.7, "valid_targets_min": 941 }, { "epoch": 4.717444717444717, "grad_norm": 0.8310677761380986, "learning_rate": 5.337110107582377e-06, "loss": 0.1301, "loss_nan_ranks": 0, "loss_rank_avg": 0.12943677604198456, "step": 1920, "valid_targets_mean": 1451.6, "valid_targets_min": 933 }, { "epoch": 4.72972972972973, "grad_norm": 0.8358326381216636, "learning_rate": 5.2402389159414755e-06, "loss": 0.1334, "loss_nan_ranks": 0, "loss_rank_avg": 0.12806978821754456, "step": 1925, "valid_targets_mean": 1312.1, "valid_targets_min": 631 }, { "epoch": 4.742014742014742, "grad_norm": 0.8665797867751196, "learning_rate": 5.144122220606542e-06, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.1268056482076645, "step": 1930, "valid_targets_mean": 1296.8, "valid_targets_min": 836 }, { "epoch": 4.754299754299755, "grad_norm": 0.8718443726733912, "learning_rate": 5.048764934915349e-06, "loss": 0.1326, "loss_nan_ranks": 0, "loss_rank_avg": 0.12933708727359772, "step": 1935, "valid_targets_mean": 1270.9, "valid_targets_min": 690 }, { "epoch": 4.766584766584766, "grad_norm": 0.8487591221702341, "learning_rate": 4.954171933385805e-06, "loss": 0.1296, "loss_nan_ranks": 0, "loss_rank_avg": 0.12197130918502808, "step": 1940, "valid_targets_mean": 1190.5, "valid_targets_min": 664 }, { "epoch": 4.778869778869779, "grad_norm": 0.84375197913285, "learning_rate": 4.8603480514667836e-06, "loss": 0.1369, "loss_nan_ranks": 0, "loss_rank_avg": 0.1338123381137848, "step": 1945, "valid_targets_mean": 1458.1, "valid_targets_min": 1046 }, { "epoch": 4.791154791154791, "grad_norm": 0.9416639364152577, "learning_rate": 4.767298085290963e-06, "loss": 0.1397, "loss_nan_ranks": 0, "loss_rank_avg": 0.13794106245040894, "step": 1950, "valid_targets_mean": 1145.6, "valid_targets_min": 814 }, { "epoch": 4.803439803439804, "grad_norm": 1.04032915765231, "learning_rate": 4.675026791429624e-06, "loss": 0.131, "loss_nan_ranks": 0, "loss_rank_avg": 0.1345062255859375, "step": 1955, "valid_targets_mean": 1348.6, "valid_targets_min": 618 }, { "epoch": 4.815724815724816, "grad_norm": 0.8449040208170585, "learning_rate": 4.583538886649525e-06, "loss": 0.1273, "loss_nan_ranks": 0, "loss_rank_avg": 0.1189974918961525, "step": 1960, "valid_targets_mean": 1187.4, "valid_targets_min": 769 }, { "epoch": 4.828009828009828, "grad_norm": 0.8678888365592436, "learning_rate": 4.492839047671764e-06, "loss": 0.1371, "loss_nan_ranks": 0, "loss_rank_avg": 0.13721004128456116, "step": 1965, "valid_targets_mean": 1184.3, "valid_targets_min": 716 }, { "epoch": 4.84029484029484, "grad_norm": 0.8554646724635764, "learning_rate": 4.4029319109327465e-06, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.12759876251220703, "step": 1970, "valid_targets_mean": 1261.1, "valid_targets_min": 569 }, { "epoch": 4.8525798525798525, "grad_norm": 0.8085855019791796, "learning_rate": 4.313822072347136e-06, "loss": 0.1279, "loss_nan_ranks": 0, "loss_rank_avg": 0.12948501110076904, "step": 1975, "valid_targets_mean": 1355.0, "valid_targets_min": 802 }, { "epoch": 4.864864864864865, "grad_norm": 0.8874100205326839, "learning_rate": 4.22551408707296e-06, "loss": 0.1252, "loss_nan_ranks": 0, "loss_rank_avg": 0.12678705155849457, "step": 1980, "valid_targets_mean": 1195.2, "valid_targets_min": 608 }, { "epoch": 4.877149877149877, "grad_norm": 0.8319449998626455, "learning_rate": 4.138012469278714e-06, "loss": 0.1285, "loss_nan_ranks": 0, "loss_rank_avg": 0.12549124658107758, "step": 1985, "valid_targets_mean": 1413.9, "valid_targets_min": 754 }, { "epoch": 4.88943488943489, "grad_norm": 0.8716998013685486, "learning_rate": 4.051321691912649e-06, "loss": 0.1314, "loss_nan_ranks": 0, "loss_rank_avg": 0.12598586082458496, "step": 1990, "valid_targets_mean": 1264.1, "valid_targets_min": 837 }, { "epoch": 4.901719901719901, "grad_norm": 0.8898202785026332, "learning_rate": 3.9654461864740935e-06, "loss": 0.1289, "loss_nan_ranks": 0, "loss_rank_avg": 0.12699808180332184, "step": 1995, "valid_targets_mean": 1339.1, "valid_targets_min": 808 }, { "epoch": 4.914004914004914, "grad_norm": 0.8810415756398233, "learning_rate": 3.880390342786915e-06, "loss": 0.1288, "loss_nan_ranks": 0, "loss_rank_avg": 0.1320217102766037, "step": 2000, "valid_targets_mean": 1336.9, "valid_targets_min": 683 }, { "epoch": 4.926289926289926, "grad_norm": 0.8849692575005523, "learning_rate": 3.7961585087751516e-06, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.1198081374168396, "step": 2005, "valid_targets_mean": 1173.9, "valid_targets_min": 655 }, { "epoch": 4.938574938574939, "grad_norm": 0.8999635972244436, "learning_rate": 3.71275499024071e-06, "loss": 0.1309, "loss_nan_ranks": 0, "loss_rank_avg": 0.12783324718475342, "step": 2010, "valid_targets_mean": 1133.1, "valid_targets_min": 700 }, { "epoch": 4.950859950859951, "grad_norm": 0.867591599040516, "learning_rate": 3.6301840506433083e-06, "loss": 0.1287, "loss_nan_ranks": 0, "loss_rank_avg": 0.12289173156023026, "step": 2015, "valid_targets_mean": 1201.3, "valid_targets_min": 672 }, { "epoch": 4.963144963144963, "grad_norm": 1.1069039602237263, "learning_rate": 3.5484499108824853e-06, "loss": 0.1326, "loss_nan_ranks": 0, "loss_rank_avg": 0.13468243181705475, "step": 2020, "valid_targets_mean": 1119.6, "valid_targets_min": 685 }, { "epoch": 4.975429975429975, "grad_norm": 0.8588147361301989, "learning_rate": 3.4675567490818727e-06, "loss": 0.139, "loss_nan_ranks": 0, "loss_rank_avg": 0.13931423425674438, "step": 2025, "valid_targets_mean": 1295.9, "valid_targets_min": 600 }, { "epoch": 4.987714987714988, "grad_norm": 0.9052294954681119, "learning_rate": 3.3875087003756036e-06, "loss": 0.1306, "loss_nan_ranks": 0, "loss_rank_avg": 0.12855863571166992, "step": 2030, "valid_targets_mean": 1279.2, "valid_targets_min": 714 }, { "epoch": 5.0, "grad_norm": 0.8268644277482449, "learning_rate": 3.30830985669691e-06, "loss": 0.1275, "loss_nan_ranks": 0, "loss_rank_avg": 0.12387026846408844, "step": 2035, "valid_targets_mean": 1328.5, "valid_targets_min": 603 }, { "epoch": 5.012285012285012, "grad_norm": 0.7999113943897552, "learning_rate": 3.22996426656899e-06, "loss": 0.1227, "loss_nan_ranks": 0, "loss_rank_avg": 0.11524771898984909, "step": 2040, "valid_targets_mean": 1326.2, "valid_targets_min": 818 }, { "epoch": 5.024570024570025, "grad_norm": 0.8985607563199448, "learning_rate": 3.1524759348980096e-06, "loss": 0.1215, "loss_nan_ranks": 0, "loss_rank_avg": 0.12038896977901459, "step": 2045, "valid_targets_mean": 1191.4, "valid_targets_min": 668 }, { "epoch": 5.036855036855036, "grad_norm": 0.8643167001377622, "learning_rate": 3.0758488227684212e-06, "loss": 0.1203, "loss_nan_ranks": 0, "loss_rank_avg": 0.12632206082344055, "step": 2050, "valid_targets_mean": 1276.1, "valid_targets_min": 546 }, { "epoch": 5.049140049140049, "grad_norm": 0.9365236976935931, "learning_rate": 3.0000868472404423e-06, "loss": 0.1242, "loss_nan_ranks": 0, "loss_rank_avg": 0.1172647699713707, "step": 2055, "valid_targets_mean": 1160.2, "valid_targets_min": 666 }, { "epoch": 5.061425061425061, "grad_norm": 0.9196384353165374, "learning_rate": 2.9251938811498436e-06, "loss": 0.1203, "loss_nan_ranks": 0, "loss_rank_avg": 0.11617661267518997, "step": 2060, "valid_targets_mean": 1141.0, "valid_targets_min": 571 }, { "epoch": 5.073710073710074, "grad_norm": 0.8727744261465432, "learning_rate": 2.8511737529099704e-06, "loss": 0.1197, "loss_nan_ranks": 0, "loss_rank_avg": 0.11832496523857117, "step": 2065, "valid_targets_mean": 1291.8, "valid_targets_min": 741 }, { "epoch": 5.085995085995086, "grad_norm": 0.9478190878710969, "learning_rate": 2.7780302463160235e-06, "loss": 0.1236, "loss_nan_ranks": 0, "loss_rank_avg": 0.12878839671611786, "step": 2070, "valid_targets_mean": 1140.1, "valid_targets_min": 754 }, { "epoch": 5.098280098280099, "grad_norm": 0.8266940619604733, "learning_rate": 2.705767100351673e-06, "loss": 0.1236, "loss_nan_ranks": 0, "loss_rank_avg": 0.11219193786382675, "step": 2075, "valid_targets_mean": 1320.9, "valid_targets_min": 564 }, { "epoch": 5.11056511056511, "grad_norm": 0.9024231945394202, "learning_rate": 2.634388008997899e-06, "loss": 0.127, "loss_nan_ranks": 0, "loss_rank_avg": 0.12351719290018082, "step": 2080, "valid_targets_mean": 1220.6, "valid_targets_min": 802 }, { "epoch": 5.122850122850123, "grad_norm": 0.8549275302001442, "learning_rate": 2.5638966210441597e-06, "loss": 0.1172, "loss_nan_ranks": 0, "loss_rank_avg": 0.11528341472148895, "step": 2085, "valid_targets_mean": 1270.9, "valid_targets_min": 680 }, { "epoch": 5.135135135135135, "grad_norm": 1.0114375126497932, "learning_rate": 2.4942965399018926e-06, "loss": 0.122, "loss_nan_ranks": 0, "loss_rank_avg": 0.12501320242881775, "step": 2090, "valid_targets_mean": 1199.1, "valid_targets_min": 477 }, { "epoch": 5.1474201474201475, "grad_norm": 0.8425339847473776, "learning_rate": 2.425591323420289e-06, "loss": 0.1214, "loss_nan_ranks": 0, "loss_rank_avg": 0.12430179864168167, "step": 2095, "valid_targets_mean": 1389.4, "valid_targets_min": 725 }, { "epoch": 5.15970515970516, "grad_norm": 0.9764933250131361, "learning_rate": 2.357784483704444e-06, "loss": 0.1205, "loss_nan_ranks": 0, "loss_rank_avg": 0.1201491504907608, "step": 2100, "valid_targets_mean": 1180.0, "valid_targets_min": 618 }, { "epoch": 5.171990171990172, "grad_norm": 0.9012198614613685, "learning_rate": 2.2908794869358044e-06, "loss": 0.1199, "loss_nan_ranks": 0, "loss_rank_avg": 0.11872012913227081, "step": 2105, "valid_targets_mean": 1228.8, "valid_targets_min": 669 }, { "epoch": 5.184275184275184, "grad_norm": 0.8761086525856171, "learning_rate": 2.2248797531949952e-06, "loss": 0.1219, "loss_nan_ranks": 0, "loss_rank_avg": 0.11814196407794952, "step": 2110, "valid_targets_mean": 1259.1, "valid_targets_min": 600 }, { "epoch": 5.196560196560196, "grad_norm": 0.8625032263605917, "learning_rate": 2.1597886562869917e-06, "loss": 0.1228, "loss_nan_ranks": 0, "loss_rank_avg": 0.12705105543136597, "step": 2115, "valid_targets_mean": 1289.2, "valid_targets_min": 609 }, { "epoch": 5.208845208845209, "grad_norm": 0.8323607979530334, "learning_rate": 2.095609523568638e-06, "loss": 0.118, "loss_nan_ranks": 0, "loss_rank_avg": 0.11345008760690689, "step": 2120, "valid_targets_mean": 1408.8, "valid_targets_min": 800 }, { "epoch": 5.221130221130221, "grad_norm": 0.9066171525552188, "learning_rate": 2.0323456357785855e-06, "loss": 0.1204, "loss_nan_ranks": 0, "loss_rank_avg": 0.11503900587558746, "step": 2125, "valid_targets_mean": 1233.6, "valid_targets_min": 736 }, { "epoch": 5.233415233415234, "grad_norm": 0.8470818657488131, "learning_rate": 1.970000226869553e-06, "loss": 0.1193, "loss_nan_ranks": 0, "loss_rank_avg": 0.11597542464733124, "step": 2130, "valid_targets_mean": 1239.8, "valid_targets_min": 698 }, { "epoch": 5.245700245700245, "grad_norm": 0.960572215465082, "learning_rate": 1.90857648384305e-06, "loss": 0.118, "loss_nan_ranks": 0, "loss_rank_avg": 0.11610577255487442, "step": 2135, "valid_targets_mean": 1139.8, "valid_targets_min": 849 }, { "epoch": 5.257985257985258, "grad_norm": 0.8836353809793225, "learning_rate": 1.848077546586431e-06, "loss": 0.1163, "loss_nan_ranks": 0, "loss_rank_avg": 0.119760662317276, "step": 2140, "valid_targets_mean": 1274.1, "valid_targets_min": 585 }, { "epoch": 5.27027027027027, "grad_norm": 0.934917710885557, "learning_rate": 1.7885065077123976e-06, "loss": 0.1224, "loss_nan_ranks": 0, "loss_rank_avg": 0.1165575161576271, "step": 2145, "valid_targets_mean": 1192.0, "valid_targets_min": 700 }, { "epoch": 5.282555282555283, "grad_norm": 0.9435945221488572, "learning_rate": 1.7298664124009245e-06, "loss": 0.1238, "loss_nan_ranks": 0, "loss_rank_avg": 0.12441343069076538, "step": 2150, "valid_targets_mean": 1200.3, "valid_targets_min": 774 }, { "epoch": 5.294840294840295, "grad_norm": 0.9104365691078795, "learning_rate": 1.672160258243567e-06, "loss": 0.1176, "loss_nan_ranks": 0, "loss_rank_avg": 0.11665159463882446, "step": 2155, "valid_targets_mean": 1109.1, "valid_targets_min": 577 }, { "epoch": 5.3071253071253075, "grad_norm": 0.9096445128425704, "learning_rate": 1.615390995090258e-06, "loss": 0.1181, "loss_nan_ranks": 0, "loss_rank_avg": 0.1253010630607605, "step": 2160, "valid_targets_mean": 1146.1, "valid_targets_min": 716 }, { "epoch": 5.319410319410319, "grad_norm": 0.9157686991554701, "learning_rate": 1.559561524898492e-06, "loss": 0.1214, "loss_nan_ranks": 0, "loss_rank_avg": 0.12084513902664185, "step": 2165, "valid_targets_mean": 1176.6, "valid_targets_min": 697 }, { "epoch": 5.3316953316953315, "grad_norm": 0.8993452301524155, "learning_rate": 1.5046747015849893e-06, "loss": 0.1168, "loss_nan_ranks": 0, "loss_rank_avg": 0.12099088728427887, "step": 2170, "valid_targets_mean": 1287.6, "valid_targets_min": 943 }, { "epoch": 5.343980343980344, "grad_norm": 0.9188461360035166, "learning_rate": 1.4507333308798255e-06, "loss": 0.1233, "loss_nan_ranks": 0, "loss_rank_avg": 0.11140099167823792, "step": 2175, "valid_targets_mean": 1155.9, "valid_targets_min": 680 }, { "epoch": 5.356265356265356, "grad_norm": 0.8332971885732899, "learning_rate": 1.3977401701829752e-06, "loss": 0.1129, "loss_nan_ranks": 0, "loss_rank_avg": 0.10656285285949707, "step": 2180, "valid_targets_mean": 1380.5, "valid_targets_min": 673 }, { "epoch": 5.368550368550369, "grad_norm": 0.8921983319069042, "learning_rate": 1.345697928423384e-06, "loss": 0.119, "loss_nan_ranks": 0, "loss_rank_avg": 0.1141204684972763, "step": 2185, "valid_targets_mean": 1309.9, "valid_targets_min": 841 }, { "epoch": 5.38083538083538, "grad_norm": 0.934941810302748, "learning_rate": 1.2946092659204767e-06, "loss": 0.1217, "loss_nan_ranks": 0, "loss_rank_avg": 0.11862413585186005, "step": 2190, "valid_targets_mean": 1051.9, "valid_targets_min": 626 }, { "epoch": 5.393120393120393, "grad_norm": 0.9380461194253754, "learning_rate": 1.244476794248175e-06, "loss": 0.121, "loss_nan_ranks": 0, "loss_rank_avg": 0.12333647906780243, "step": 2195, "valid_targets_mean": 1232.8, "valid_targets_min": 690 }, { "epoch": 5.405405405405405, "grad_norm": 0.9552431951880422, "learning_rate": 1.1953030761014017e-06, "loss": 0.1172, "loss_nan_ranks": 0, "loss_rank_avg": 0.12513390183448792, "step": 2200, "valid_targets_mean": 1074.1, "valid_targets_min": 587 }, { "epoch": 5.417690417690418, "grad_norm": 0.9014567009232736, "learning_rate": 1.147090625165055e-06, "loss": 0.1176, "loss_nan_ranks": 0, "loss_rank_avg": 0.11377055943012238, "step": 2205, "valid_targets_mean": 1243.6, "valid_targets_min": 650 }, { "epoch": 5.42997542997543, "grad_norm": 0.8599695105481259, "learning_rate": 1.0998419059855503e-06, "loss": 0.1223, "loss_nan_ranks": 0, "loss_rank_avg": 0.10883887857198715, "step": 2210, "valid_targets_mean": 1235.0, "valid_targets_min": 693 }, { "epoch": 5.442260442260443, "grad_norm": 0.9571634722287222, "learning_rate": 1.053559333844798e-06, "loss": 0.1194, "loss_nan_ranks": 0, "loss_rank_avg": 0.12232570350170135, "step": 2215, "valid_targets_mean": 1088.8, "valid_targets_min": 619 }, { "epoch": 5.454545454545454, "grad_norm": 0.8940592339142096, "learning_rate": 1.0082452746367721e-06, "loss": 0.1164, "loss_nan_ranks": 0, "loss_rank_avg": 0.12069477140903473, "step": 2220, "valid_targets_mean": 1340.8, "valid_targets_min": 695 }, { "epoch": 5.466830466830467, "grad_norm": 0.8180480402297732, "learning_rate": 9.639020447465475e-07, "loss": 0.1214, "loss_nan_ranks": 0, "loss_rank_avg": 0.12307047843933105, "step": 2225, "valid_targets_mean": 1483.2, "valid_targets_min": 864 }, { "epoch": 5.479115479115479, "grad_norm": 0.8733335204397944, "learning_rate": 9.205319109318922e-07, "loss": 0.1163, "loss_nan_ranks": 0, "loss_rank_avg": 0.11095479130744934, "step": 2230, "valid_targets_mean": 1155.1, "valid_targets_min": 692 }, { "epoch": 5.4914004914004915, "grad_norm": 0.9078213183092334, "learning_rate": 8.781370902074049e-07, "loss": 0.1185, "loss_nan_ranks": 0, "loss_rank_avg": 0.11644881963729858, "step": 2235, "valid_targets_mean": 1464.8, "valid_targets_min": 789 }, { "epoch": 5.503685503685504, "grad_norm": 0.8376491911217916, "learning_rate": 8.367197497311719e-07, "loss": 0.1221, "loss_nan_ranks": 0, "loss_rank_avg": 0.11460597068071365, "step": 2240, "valid_targets_mean": 1391.9, "valid_targets_min": 881 }, { "epoch": 5.515970515970516, "grad_norm": 0.9312884060452975, "learning_rate": 7.962820066939958e-07, "loss": 0.1236, "loss_nan_ranks": 0, "loss_rank_avg": 0.12043467909097672, "step": 2245, "valid_targets_mean": 1218.1, "valid_targets_min": 651 }, { "epoch": 5.528255528255528, "grad_norm": 0.9108572118360622, "learning_rate": 7.568259282111645e-07, "loss": 0.1208, "loss_nan_ranks": 0, "loss_rank_avg": 0.12171508371829987, "step": 2250, "valid_targets_mean": 1225.9, "valid_targets_min": 525 }, { "epoch": 5.54054054054054, "grad_norm": 1.043375173851359, "learning_rate": 7.183535312167755e-07, "loss": 0.1248, "loss_nan_ranks": 0, "loss_rank_avg": 0.12365029007196426, "step": 2255, "valid_targets_mean": 1268.5, "valid_targets_min": 711 }, { "epoch": 5.552825552825553, "grad_norm": 0.8221303890361632, "learning_rate": 6.808667823606474e-07, "loss": 0.1177, "loss_nan_ranks": 0, "loss_rank_avg": 0.10972858965396881, "step": 2260, "valid_targets_mean": 1217.7, "valid_targets_min": 633 }, { "epoch": 5.565110565110565, "grad_norm": 0.9943052251443346, "learning_rate": 6.443675979077779e-07, "loss": 0.1187, "loss_nan_ranks": 0, "loss_rank_avg": 0.11821258068084717, "step": 2265, "valid_targets_mean": 1140.2, "valid_targets_min": 648 }, { "epoch": 5.577395577395578, "grad_norm": 0.8837595753139642, "learning_rate": 6.088578436403847e-07, "loss": 0.118, "loss_nan_ranks": 0, "loss_rank_avg": 0.11932357400655746, "step": 2270, "valid_targets_mean": 1177.3, "valid_targets_min": 773 }, { "epoch": 5.58968058968059, "grad_norm": 0.9037106518704484, "learning_rate": 5.743393347625436e-07, "loss": 0.1183, "loss_nan_ranks": 0, "loss_rank_avg": 0.12482412159442902, "step": 2275, "valid_targets_mean": 1232.4, "valid_targets_min": 682 }, { "epoch": 5.601965601965602, "grad_norm": 0.909686971601023, "learning_rate": 5.408138358073833e-07, "loss": 0.1194, "loss_nan_ranks": 0, "loss_rank_avg": 0.11696803569793701, "step": 2280, "valid_targets_mean": 1211.9, "valid_targets_min": 817 }, { "epoch": 5.614250614250614, "grad_norm": 0.8679916324190773, "learning_rate": 5.082830605468969e-07, "loss": 0.1224, "loss_nan_ranks": 0, "loss_rank_avg": 0.11813192814588547, "step": 2285, "valid_targets_mean": 1354.4, "valid_targets_min": 693 }, { "epoch": 5.6265356265356266, "grad_norm": 0.8884471818216881, "learning_rate": 4.767486719043235e-07, "loss": 0.1237, "loss_nan_ranks": 0, "loss_rank_avg": 0.12548132240772247, "step": 2290, "valid_targets_mean": 1283.0, "valid_targets_min": 618 }, { "epoch": 5.638820638820639, "grad_norm": 0.8715795708444471, "learning_rate": 4.4621228186915833e-07, "loss": 0.1189, "loss_nan_ranks": 0, "loss_rank_avg": 0.11673951148986816, "step": 2295, "valid_targets_mean": 1328.6, "valid_targets_min": 663 }, { "epoch": 5.651105651105651, "grad_norm": 0.865429287358642, "learning_rate": 4.166754514147275e-07, "loss": 0.1192, "loss_nan_ranks": 0, "loss_rank_avg": 0.1132473275065422, "step": 2300, "valid_targets_mean": 1261.5, "valid_targets_min": 694 }, { "epoch": 5.663390663390663, "grad_norm": 0.8741499140536886, "learning_rate": 3.881396904184231e-07, "loss": 0.1231, "loss_nan_ranks": 0, "loss_rank_avg": 0.13480767607688904, "step": 2305, "valid_targets_mean": 1423.6, "valid_targets_min": 857 }, { "epoch": 5.675675675675675, "grad_norm": 0.8345784138645265, "learning_rate": 3.6060645758449584e-07, "loss": 0.1159, "loss_nan_ranks": 0, "loss_rank_avg": 0.10352207720279694, "step": 2310, "valid_targets_mean": 1274.6, "valid_targets_min": 748 }, { "epoch": 5.687960687960688, "grad_norm": 1.0316462146052467, "learning_rate": 3.34077160369497e-07, "loss": 0.1215, "loss_nan_ranks": 0, "loss_rank_avg": 0.12712368369102478, "step": 2315, "valid_targets_mean": 1247.8, "valid_targets_min": 648 }, { "epoch": 5.7002457002457, "grad_norm": 0.8815652322621401, "learning_rate": 3.08553154910336e-07, "loss": 0.1217, "loss_nan_ranks": 0, "loss_rank_avg": 0.11496353149414062, "step": 2320, "valid_targets_mean": 1219.0, "valid_targets_min": 745 }, { "epoch": 5.712530712530713, "grad_norm": 0.9889734864928303, "learning_rate": 2.840357459549492e-07, "loss": 0.1198, "loss_nan_ranks": 0, "loss_rank_avg": 0.12958207726478577, "step": 2325, "valid_targets_mean": 1281.6, "valid_targets_min": 673 }, { "epoch": 5.724815724815725, "grad_norm": 0.8735025249752323, "learning_rate": 2.6052618679560884e-07, "loss": 0.1207, "loss_nan_ranks": 0, "loss_rank_avg": 0.1203438937664032, "step": 2330, "valid_targets_mean": 1358.6, "valid_targets_min": 586 }, { "epoch": 5.737100737100737, "grad_norm": 0.9487732323352747, "learning_rate": 2.380256792048541e-07, "loss": 0.1154, "loss_nan_ranks": 0, "loss_rank_avg": 0.10913722962141037, "step": 2335, "valid_targets_mean": 1167.6, "valid_targets_min": 690 }, { "epoch": 5.749385749385749, "grad_norm": 0.9354429013108673, "learning_rate": 2.1653537337405383e-07, "loss": 0.1175, "loss_nan_ranks": 0, "loss_rank_avg": 0.12233065068721771, "step": 2340, "valid_targets_mean": 1233.7, "valid_targets_min": 683 }, { "epoch": 5.761670761670762, "grad_norm": 0.8361440623034612, "learning_rate": 1.9605636785462234e-07, "loss": 0.1167, "loss_nan_ranks": 0, "loss_rank_avg": 0.11600156873464584, "step": 2345, "valid_targets_mean": 1423.9, "valid_targets_min": 647 }, { "epoch": 5.773955773955774, "grad_norm": 0.88426141655337, "learning_rate": 1.7658970950185095e-07, "loss": 0.117, "loss_nan_ranks": 0, "loss_rank_avg": 0.11672552675008774, "step": 2350, "valid_targets_mean": 1327.4, "valid_targets_min": 627 }, { "epoch": 5.7862407862407865, "grad_norm": 0.8958608074003424, "learning_rate": 1.5813639342140197e-07, "loss": 0.1179, "loss_nan_ranks": 0, "loss_rank_avg": 0.121670201420784, "step": 2355, "valid_targets_mean": 1360.6, "valid_targets_min": 559 }, { "epoch": 5.798525798525798, "grad_norm": 0.8690995889535993, "learning_rate": 1.4069736291843605e-07, "loss": 0.1201, "loss_nan_ranks": 0, "loss_rank_avg": 0.12032966315746307, "step": 2360, "valid_targets_mean": 1345.8, "valid_targets_min": 769 }, { "epoch": 5.8108108108108105, "grad_norm": 0.9609941874663688, "learning_rate": 1.242735094493952e-07, "loss": 0.1249, "loss_nan_ranks": 0, "loss_rank_avg": 0.1279018074274063, "step": 2365, "valid_targets_mean": 1229.7, "valid_targets_min": 709 }, { "epoch": 5.823095823095823, "grad_norm": 0.8488632044982599, "learning_rate": 1.0886567257643033e-07, "loss": 0.1229, "loss_nan_ranks": 0, "loss_rank_avg": 0.13311204314231873, "step": 2370, "valid_targets_mean": 1436.2, "valid_targets_min": 754 }, { "epoch": 5.835380835380835, "grad_norm": 0.8912292020833572, "learning_rate": 9.447463992448891e-08, "loss": 0.1203, "loss_nan_ranks": 0, "loss_rank_avg": 0.12233321368694305, "step": 2375, "valid_targets_mean": 1253.7, "valid_targets_min": 728 }, { "epoch": 5.847665847665848, "grad_norm": 0.866161605046653, "learning_rate": 8.110114714104277e-08, "loss": 0.1181, "loss_nan_ranks": 0, "loss_rank_avg": 0.11839167773723602, "step": 2380, "valid_targets_mean": 1312.7, "valid_targets_min": 798 }, { "epoch": 5.85995085995086, "grad_norm": 0.8639388177292349, "learning_rate": 6.874587785849152e-08, "loss": 0.1139, "loss_nan_ranks": 0, "loss_rank_avg": 0.10952752083539963, "step": 2385, "valid_targets_mean": 1177.9, "valid_targets_min": 563 }, { "epoch": 5.872235872235873, "grad_norm": 0.8346070029983881, "learning_rate": 5.7409463659219286e-08, "loss": 0.1241, "loss_nan_ranks": 0, "loss_rank_avg": 0.1254696249961853, "step": 2390, "valid_targets_mean": 1511.4, "valid_targets_min": 639 }, { "epoch": 5.884520884520884, "grad_norm": 0.8504954108670092, "learning_rate": 4.709248404329625e-08, "loss": 0.1163, "loss_nan_ranks": 0, "loss_rank_avg": 0.1132640540599823, "step": 2395, "valid_targets_mean": 1198.4, "valid_targets_min": 783 }, { "epoch": 5.896805896805897, "grad_norm": 0.9088038628349666, "learning_rate": 3.7795466398868885e-08, "loss": 0.1191, "loss_nan_ranks": 0, "loss_rank_avg": 0.11657664179801941, "step": 2400, "valid_targets_mean": 1197.9, "valid_targets_min": 633 }, { "epoch": 5.909090909090909, "grad_norm": 0.8865491567876178, "learning_rate": 2.9518885975192702e-08, "loss": 0.121, "loss_nan_ranks": 0, "loss_rank_avg": 0.12183408439159393, "step": 2405, "valid_targets_mean": 1268.6, "valid_targets_min": 679 }, { "epoch": 5.921375921375922, "grad_norm": 0.9382041318188953, "learning_rate": 2.226316585833832e-08, "loss": 0.1221, "loss_nan_ranks": 0, "loss_rank_avg": 0.13483551144599915, "step": 2410, "valid_targets_mean": 1244.8, "valid_targets_min": 538 }, { "epoch": 5.933660933660933, "grad_norm": 0.9374744604838307, "learning_rate": 1.6028676949570997e-08, "loss": 0.1261, "loss_nan_ranks": 0, "loss_rank_avg": 0.12365995347499847, "step": 2415, "valid_targets_mean": 1196.9, "valid_targets_min": 770 }, { "epoch": 5.945945945945946, "grad_norm": 0.894291909380334, "learning_rate": 1.0815737946383575e-08, "loss": 0.1169, "loss_nan_ranks": 0, "loss_rank_avg": 0.11816893517971039, "step": 2420, "valid_targets_mean": 1345.9, "valid_targets_min": 965 }, { "epoch": 5.958230958230958, "grad_norm": 0.8845005806783053, "learning_rate": 6.624615326207284e-09, "loss": 0.117, "loss_nan_ranks": 0, "loss_rank_avg": 0.1128786951303482, "step": 2425, "valid_targets_mean": 1206.6, "valid_targets_min": 575 }, { "epoch": 5.9705159705159705, "grad_norm": 0.8107444415043257, "learning_rate": 3.4555233327893124e-09, "loss": 0.1275, "loss_nan_ranks": 0, "loss_rank_avg": 0.11094975471496582, "step": 2430, "valid_targets_mean": 1371.6, "valid_targets_min": 724 }, { "epoch": 5.982800982800983, "grad_norm": 0.8488528893584344, "learning_rate": 1.3086239652415621e-09, "loss": 0.1178, "loss_nan_ranks": 0, "loss_rank_avg": 0.10983407497406006, "step": 2435, "valid_targets_mean": 1295.4, "valid_targets_min": 751 }, { "epoch": 5.995085995085995, "grad_norm": 0.9189796749562797, "learning_rate": 1.840269697628294e-10, "loss": 0.1182, "loss_nan_ranks": 0, "loss_rank_avg": 0.11939200758934021, "step": 2440, "valid_targets_mean": 1261.1, "valid_targets_min": 687 }, { "epoch": 6.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.11800891160964966, "step": 2442, "total_flos": 247694803206144.0, "train_loss": 0.1872950934367918, "train_runtime": 7715.4233, "train_samples_per_second": 5.057, "train_steps_per_second": 0.317, "valid_targets_mean": 1261.1, "valid_targets_min": 857 } ], "logging_steps": 5, "max_steps": 2442, "num_input_tokens_seen": 0, "num_train_epochs": 6, "save_steps": 100, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 247694803206144.0, "train_batch_size": 1, "trial_name": null, "trial_params": null }