| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 6664, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.005252100840336135, |
| "grad_norm": 12.87344450799192, |
| "learning_rate": 2.39880059970015e-07, |
| "loss": 0.7749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7653565406799316, |
| "step": 5, |
| "valid_targets_mean": 2484.8, |
| "valid_targets_min": 784 |
| }, |
| { |
| "epoch": 0.01050420168067227, |
| "grad_norm": 12.707723147793125, |
| "learning_rate": 5.397301349325338e-07, |
| "loss": 0.7606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7621961236000061, |
| "step": 10, |
| "valid_targets_mean": 2830.7, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 0.015756302521008403, |
| "grad_norm": 11.204400117593265, |
| "learning_rate": 8.395802098950526e-07, |
| "loss": 0.7482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7473458051681519, |
| "step": 15, |
| "valid_targets_mean": 3091.0, |
| "valid_targets_min": 1146 |
| }, |
| { |
| "epoch": 0.02100840336134454, |
| "grad_norm": 9.688069489628813, |
| "learning_rate": 1.1394302848575713e-06, |
| "loss": 0.7466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7422138452529907, |
| "step": 20, |
| "valid_targets_mean": 2413.2, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 0.026260504201680673, |
| "grad_norm": 7.62742888265603, |
| "learning_rate": 1.43928035982009e-06, |
| "loss": 0.7287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7463569045066833, |
| "step": 25, |
| "valid_targets_mean": 2688.5, |
| "valid_targets_min": 1011 |
| }, |
| { |
| "epoch": 0.031512605042016806, |
| "grad_norm": 5.508936794357446, |
| "learning_rate": 1.7391304347826088e-06, |
| "loss": 0.6518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6350823640823364, |
| "step": 30, |
| "valid_targets_mean": 2500.6, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 0.03676470588235294, |
| "grad_norm": 4.810314643948938, |
| "learning_rate": 2.0389805097451275e-06, |
| "loss": 0.6558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6311067938804626, |
| "step": 35, |
| "valid_targets_mean": 2686.3, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 0.04201680672268908, |
| "grad_norm": 4.8557060388176545, |
| "learning_rate": 2.3388305847076464e-06, |
| "loss": 0.6284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6066815257072449, |
| "step": 40, |
| "valid_targets_mean": 2177.2, |
| "valid_targets_min": 1080 |
| }, |
| { |
| "epoch": 0.04726890756302521, |
| "grad_norm": 2.9119019293559685, |
| "learning_rate": 2.6386806596701653e-06, |
| "loss": 0.6094, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6400288343429565, |
| "step": 45, |
| "valid_targets_mean": 2633.9, |
| "valid_targets_min": 963 |
| }, |
| { |
| "epoch": 0.052521008403361345, |
| "grad_norm": 2.5325988257181504, |
| "learning_rate": 2.9385307346326843e-06, |
| "loss": 0.5741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5878869891166687, |
| "step": 50, |
| "valid_targets_mean": 2203.5, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 0.05777310924369748, |
| "grad_norm": 1.6332369639610234, |
| "learning_rate": 3.2383808095952024e-06, |
| "loss": 0.5072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.49458950757980347, |
| "step": 55, |
| "valid_targets_mean": 3035.3, |
| "valid_targets_min": 830 |
| }, |
| { |
| "epoch": 0.06302521008403361, |
| "grad_norm": 1.2034100946296309, |
| "learning_rate": 3.5382308845577213e-06, |
| "loss": 0.5137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4873230755329132, |
| "step": 60, |
| "valid_targets_mean": 2940.2, |
| "valid_targets_min": 1009 |
| }, |
| { |
| "epoch": 0.06827731092436974, |
| "grad_norm": 1.1067968813199072, |
| "learning_rate": 3.83808095952024e-06, |
| "loss": 0.511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4636586606502533, |
| "step": 65, |
| "valid_targets_mean": 2532.8, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 0.07352941176470588, |
| "grad_norm": 1.2850520360535964, |
| "learning_rate": 4.137931034482759e-06, |
| "loss": 0.4961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4967666566371918, |
| "step": 70, |
| "valid_targets_mean": 1951.5, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 0.07878151260504201, |
| "grad_norm": 0.8971762854941586, |
| "learning_rate": 4.437781109445278e-06, |
| "loss": 0.4949, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43605613708496094, |
| "step": 75, |
| "valid_targets_mean": 2723.1, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 0.08403361344537816, |
| "grad_norm": 0.9430146035301179, |
| "learning_rate": 4.737631184407796e-06, |
| "loss": 0.4615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4186355173587799, |
| "step": 80, |
| "valid_targets_mean": 2138.4, |
| "valid_targets_min": 619 |
| }, |
| { |
| "epoch": 0.08928571428571429, |
| "grad_norm": 0.9397684354473573, |
| "learning_rate": 5.037481259370315e-06, |
| "loss": 0.4629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.447378933429718, |
| "step": 85, |
| "valid_targets_mean": 2195.4, |
| "valid_targets_min": 985 |
| }, |
| { |
| "epoch": 0.09453781512605042, |
| "grad_norm": 0.9254373058058498, |
| "learning_rate": 5.337331334332834e-06, |
| "loss": 0.4579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44608554244041443, |
| "step": 90, |
| "valid_targets_mean": 2305.1, |
| "valid_targets_min": 1115 |
| }, |
| { |
| "epoch": 0.09978991596638656, |
| "grad_norm": 0.8895449710201235, |
| "learning_rate": 5.6371814092953526e-06, |
| "loss": 0.4429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4577831029891968, |
| "step": 95, |
| "valid_targets_mean": 2365.8, |
| "valid_targets_min": 1000 |
| }, |
| { |
| "epoch": 0.10504201680672269, |
| "grad_norm": 0.8582249839693272, |
| "learning_rate": 5.937031484257871e-06, |
| "loss": 0.4524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43060487508773804, |
| "step": 100, |
| "valid_targets_mean": 2525.8, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 0.11029411764705882, |
| "grad_norm": 0.8328052594807136, |
| "learning_rate": 6.2368815592203904e-06, |
| "loss": 0.4351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43569284677505493, |
| "step": 105, |
| "valid_targets_mean": 2433.1, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 0.11554621848739496, |
| "grad_norm": 0.8004894157898372, |
| "learning_rate": 6.536731634182909e-06, |
| "loss": 0.435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4115639328956604, |
| "step": 110, |
| "valid_targets_mean": 2809.9, |
| "valid_targets_min": 1462 |
| }, |
| { |
| "epoch": 0.1207983193277311, |
| "grad_norm": 0.8370123985640117, |
| "learning_rate": 6.8365817091454274e-06, |
| "loss": 0.4329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40281569957733154, |
| "step": 115, |
| "valid_targets_mean": 2199.2, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 0.12605042016806722, |
| "grad_norm": 0.8695717739921266, |
| "learning_rate": 7.136431784107947e-06, |
| "loss": 0.4223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4021134674549103, |
| "step": 120, |
| "valid_targets_mean": 2273.1, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 0.13130252100840337, |
| "grad_norm": 0.8006986968807501, |
| "learning_rate": 7.436281859070465e-06, |
| "loss": 0.4335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4061618447303772, |
| "step": 125, |
| "valid_targets_mean": 2860.1, |
| "valid_targets_min": 1215 |
| }, |
| { |
| "epoch": 0.13655462184873948, |
| "grad_norm": 0.8969789811481348, |
| "learning_rate": 7.736131934032984e-06, |
| "loss": 0.4152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.47167330980300903, |
| "step": 130, |
| "valid_targets_mean": 2499.8, |
| "valid_targets_min": 1218 |
| }, |
| { |
| "epoch": 0.14180672268907563, |
| "grad_norm": 0.8068868280254967, |
| "learning_rate": 8.035982008995503e-06, |
| "loss": 0.4163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4264189898967743, |
| "step": 135, |
| "valid_targets_mean": 2426.6, |
| "valid_targets_min": 985 |
| }, |
| { |
| "epoch": 0.14705882352941177, |
| "grad_norm": 0.9031868308784958, |
| "learning_rate": 8.335832083958023e-06, |
| "loss": 0.4126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4020998775959015, |
| "step": 140, |
| "valid_targets_mean": 2240.5, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 0.15231092436974789, |
| "grad_norm": 0.7811330017492059, |
| "learning_rate": 8.63568215892054e-06, |
| "loss": 0.3964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4105680286884308, |
| "step": 145, |
| "valid_targets_mean": 2559.5, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 0.15756302521008403, |
| "grad_norm": 0.8087924248265574, |
| "learning_rate": 8.93553223388306e-06, |
| "loss": 0.4058, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4330301880836487, |
| "step": 150, |
| "valid_targets_mean": 2632.9, |
| "valid_targets_min": 1231 |
| }, |
| { |
| "epoch": 0.16281512605042017, |
| "grad_norm": 0.7719589146187298, |
| "learning_rate": 9.235382308845579e-06, |
| "loss": 0.3981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3908872604370117, |
| "step": 155, |
| "valid_targets_mean": 2874.4, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 0.16806722689075632, |
| "grad_norm": 0.8718120536448756, |
| "learning_rate": 9.535232383808097e-06, |
| "loss": 0.3981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41889429092407227, |
| "step": 160, |
| "valid_targets_mean": 2393.1, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 0.17331932773109243, |
| "grad_norm": 0.8830904007290984, |
| "learning_rate": 9.835082458770614e-06, |
| "loss": 0.4037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38836172223091125, |
| "step": 165, |
| "valid_targets_mean": 2164.8, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 0.17857142857142858, |
| "grad_norm": 0.8311418026284046, |
| "learning_rate": 1.0134932533733135e-05, |
| "loss": 0.3887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3843948543071747, |
| "step": 170, |
| "valid_targets_mean": 2470.9, |
| "valid_targets_min": 1080 |
| }, |
| { |
| "epoch": 0.18382352941176472, |
| "grad_norm": 0.8211185772584042, |
| "learning_rate": 1.0434782608695653e-05, |
| "loss": 0.4169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4080219268798828, |
| "step": 175, |
| "valid_targets_mean": 2487.4, |
| "valid_targets_min": 688 |
| }, |
| { |
| "epoch": 0.18907563025210083, |
| "grad_norm": 0.8630859100580258, |
| "learning_rate": 1.0734632683658172e-05, |
| "loss": 0.3844, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.42095762491226196, |
| "step": 180, |
| "valid_targets_mean": 2252.2, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 0.19432773109243698, |
| "grad_norm": 0.7978994945119684, |
| "learning_rate": 1.103448275862069e-05, |
| "loss": 0.3844, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41790223121643066, |
| "step": 185, |
| "valid_targets_mean": 2912.1, |
| "valid_targets_min": 940 |
| }, |
| { |
| "epoch": 0.19957983193277312, |
| "grad_norm": 0.8619777697515183, |
| "learning_rate": 1.1334332833583211e-05, |
| "loss": 0.3922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4195566773414612, |
| "step": 190, |
| "valid_targets_mean": 2451.5, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 0.20483193277310924, |
| "grad_norm": 0.8075469823787889, |
| "learning_rate": 1.1634182908545729e-05, |
| "loss": 0.381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3835638463497162, |
| "step": 195, |
| "valid_targets_mean": 2334.6, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 0.21008403361344538, |
| "grad_norm": 0.7886022090561562, |
| "learning_rate": 1.1934032983508246e-05, |
| "loss": 0.3732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41375166177749634, |
| "step": 200, |
| "valid_targets_mean": 2972.5, |
| "valid_targets_min": 1031 |
| }, |
| { |
| "epoch": 0.21533613445378152, |
| "grad_norm": 0.8061255296748036, |
| "learning_rate": 1.2233883058470766e-05, |
| "loss": 0.3888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4238708019256592, |
| "step": 205, |
| "valid_targets_mean": 2525.8, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 0.22058823529411764, |
| "grad_norm": 0.8001397668970225, |
| "learning_rate": 1.2533733133433283e-05, |
| "loss": 0.3628, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3657309412956238, |
| "step": 210, |
| "valid_targets_mean": 2680.4, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 0.22584033613445378, |
| "grad_norm": 0.7848361664620995, |
| "learning_rate": 1.2833583208395803e-05, |
| "loss": 0.3762, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37307411432266235, |
| "step": 215, |
| "valid_targets_mean": 2759.8, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 0.23109243697478993, |
| "grad_norm": 0.9451943941703829, |
| "learning_rate": 1.313343328335832e-05, |
| "loss": 0.3721, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35972413420677185, |
| "step": 220, |
| "valid_targets_mean": 1986.0, |
| "valid_targets_min": 1143 |
| }, |
| { |
| "epoch": 0.23634453781512604, |
| "grad_norm": 1.0257525942300505, |
| "learning_rate": 1.3433283358320841e-05, |
| "loss": 0.3903, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37196558713912964, |
| "step": 225, |
| "valid_targets_mean": 2237.6, |
| "valid_targets_min": 1023 |
| }, |
| { |
| "epoch": 0.2415966386554622, |
| "grad_norm": 0.8450544047029999, |
| "learning_rate": 1.3733133433283359e-05, |
| "loss": 0.3774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.400920033454895, |
| "step": 230, |
| "valid_targets_mean": 2558.1, |
| "valid_targets_min": 843 |
| }, |
| { |
| "epoch": 0.24684873949579833, |
| "grad_norm": 0.8081787234697447, |
| "learning_rate": 1.4032983508245878e-05, |
| "loss": 0.3585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35195618867874146, |
| "step": 235, |
| "valid_targets_mean": 2621.5, |
| "valid_targets_min": 749 |
| }, |
| { |
| "epoch": 0.25210084033613445, |
| "grad_norm": 0.8046828946061387, |
| "learning_rate": 1.4332833583208396e-05, |
| "loss": 0.3612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.340299516916275, |
| "step": 240, |
| "valid_targets_mean": 2374.2, |
| "valid_targets_min": 1079 |
| }, |
| { |
| "epoch": 0.25735294117647056, |
| "grad_norm": 0.6971318909820771, |
| "learning_rate": 1.4632683658170917e-05, |
| "loss": 0.357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3586806356906891, |
| "step": 245, |
| "valid_targets_mean": 3350.4, |
| "valid_targets_min": 707 |
| }, |
| { |
| "epoch": 0.26260504201680673, |
| "grad_norm": 0.8055301071475804, |
| "learning_rate": 1.4932533733133435e-05, |
| "loss": 0.3433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3433215320110321, |
| "step": 250, |
| "valid_targets_mean": 2368.8, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 0.26785714285714285, |
| "grad_norm": 0.8154286910342443, |
| "learning_rate": 1.5232383808095954e-05, |
| "loss": 0.358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33199673891067505, |
| "step": 255, |
| "valid_targets_mean": 2458.3, |
| "valid_targets_min": 867 |
| }, |
| { |
| "epoch": 0.27310924369747897, |
| "grad_norm": 0.8416573919590596, |
| "learning_rate": 1.5532233883058472e-05, |
| "loss": 0.3717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3616263270378113, |
| "step": 260, |
| "valid_targets_mean": 2318.0, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 0.27836134453781514, |
| "grad_norm": 0.7678040770406672, |
| "learning_rate": 1.5832083958020993e-05, |
| "loss": 0.3621, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32790547609329224, |
| "step": 265, |
| "valid_targets_mean": 2317.4, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 0.28361344537815125, |
| "grad_norm": 0.8164391899177017, |
| "learning_rate": 1.613193403298351e-05, |
| "loss": 0.3392, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2930743098258972, |
| "step": 270, |
| "valid_targets_mean": 2118.6, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 0.28886554621848737, |
| "grad_norm": 0.8248688372806788, |
| "learning_rate": 1.6431784107946028e-05, |
| "loss": 0.3646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3935636579990387, |
| "step": 275, |
| "valid_targets_mean": 2466.6, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 0.29411764705882354, |
| "grad_norm": 0.8270276632057298, |
| "learning_rate": 1.6731634182908546e-05, |
| "loss": 0.3683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36888253688812256, |
| "step": 280, |
| "valid_targets_mean": 2239.0, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 0.29936974789915966, |
| "grad_norm": 0.8394101421073619, |
| "learning_rate": 1.7031484257871064e-05, |
| "loss": 0.3563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3346269130706787, |
| "step": 285, |
| "valid_targets_mean": 2003.6, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 0.30462184873949577, |
| "grad_norm": 0.7147367181058835, |
| "learning_rate": 1.7331334332833585e-05, |
| "loss": 0.3588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3740352988243103, |
| "step": 290, |
| "valid_targets_mean": 3159.9, |
| "valid_targets_min": 1551 |
| }, |
| { |
| "epoch": 0.30987394957983194, |
| "grad_norm": 0.8491621210785679, |
| "learning_rate": 1.7631184407796102e-05, |
| "loss": 0.3563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.357749342918396, |
| "step": 295, |
| "valid_targets_mean": 2103.2, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 0.31512605042016806, |
| "grad_norm": 0.8318921687266874, |
| "learning_rate": 1.7931034482758623e-05, |
| "loss": 0.3319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3408452868461609, |
| "step": 300, |
| "valid_targets_mean": 2045.0, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 0.32037815126050423, |
| "grad_norm": 0.8396347924881318, |
| "learning_rate": 1.823088455772114e-05, |
| "loss": 0.3421, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3563663959503174, |
| "step": 305, |
| "valid_targets_mean": 2256.4, |
| "valid_targets_min": 854 |
| }, |
| { |
| "epoch": 0.32563025210084034, |
| "grad_norm": 0.9205468135189474, |
| "learning_rate": 1.853073463268366e-05, |
| "loss": 0.3732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.39193105697631836, |
| "step": 310, |
| "valid_targets_mean": 2059.1, |
| "valid_targets_min": 1011 |
| }, |
| { |
| "epoch": 0.33088235294117646, |
| "grad_norm": 0.9135710271321404, |
| "learning_rate": 1.8830584707646176e-05, |
| "loss": 0.3372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3061055541038513, |
| "step": 315, |
| "valid_targets_mean": 1836.5, |
| "valid_targets_min": 891 |
| }, |
| { |
| "epoch": 0.33613445378151263, |
| "grad_norm": 0.913185572728451, |
| "learning_rate": 1.9130434782608697e-05, |
| "loss": 0.3472, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3164549171924591, |
| "step": 320, |
| "valid_targets_mean": 2192.6, |
| "valid_targets_min": 594 |
| }, |
| { |
| "epoch": 0.34138655462184875, |
| "grad_norm": 0.7411966725143038, |
| "learning_rate": 1.9430284857571215e-05, |
| "loss": 0.3551, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34439602494239807, |
| "step": 325, |
| "valid_targets_mean": 2740.4, |
| "valid_targets_min": 926 |
| }, |
| { |
| "epoch": 0.34663865546218486, |
| "grad_norm": 0.7141106760577947, |
| "learning_rate": 1.9730134932533736e-05, |
| "loss": 0.3467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3687133193016052, |
| "step": 330, |
| "valid_targets_mean": 2977.1, |
| "valid_targets_min": 885 |
| }, |
| { |
| "epoch": 0.35189075630252103, |
| "grad_norm": 0.8006543236123854, |
| "learning_rate": 2.0029985007496254e-05, |
| "loss": 0.3435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3490038514137268, |
| "step": 335, |
| "valid_targets_mean": 2345.1, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 0.35714285714285715, |
| "grad_norm": 0.7847814844972669, |
| "learning_rate": 2.0329835082458775e-05, |
| "loss": 0.3439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3197982609272003, |
| "step": 340, |
| "valid_targets_mean": 2583.3, |
| "valid_targets_min": 758 |
| }, |
| { |
| "epoch": 0.36239495798319327, |
| "grad_norm": 0.9492857105812816, |
| "learning_rate": 2.0629685157421292e-05, |
| "loss": 0.3519, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3854501247406006, |
| "step": 345, |
| "valid_targets_mean": 2491.8, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 0.36764705882352944, |
| "grad_norm": 0.9063284452571975, |
| "learning_rate": 2.092953523238381e-05, |
| "loss": 0.3585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3553091883659363, |
| "step": 350, |
| "valid_targets_mean": 1893.2, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 0.37289915966386555, |
| "grad_norm": 0.7830522409215324, |
| "learning_rate": 2.1229385307346328e-05, |
| "loss": 0.3371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35570859909057617, |
| "step": 355, |
| "valid_targets_mean": 2596.5, |
| "valid_targets_min": 571 |
| }, |
| { |
| "epoch": 0.37815126050420167, |
| "grad_norm": 0.9034654728534351, |
| "learning_rate": 2.152923538230885e-05, |
| "loss": 0.3633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3349594175815582, |
| "step": 360, |
| "valid_targets_mean": 1895.6, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 0.38340336134453784, |
| "grad_norm": 0.7718514232416079, |
| "learning_rate": 2.1829085457271363e-05, |
| "loss": 0.3499, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3692238926887512, |
| "step": 365, |
| "valid_targets_mean": 3021.2, |
| "valid_targets_min": 743 |
| }, |
| { |
| "epoch": 0.38865546218487396, |
| "grad_norm": 0.7100879122429138, |
| "learning_rate": 2.2128935532233884e-05, |
| "loss": 0.3618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38098081946372986, |
| "step": 370, |
| "valid_targets_mean": 3113.8, |
| "valid_targets_min": 1343 |
| }, |
| { |
| "epoch": 0.3939075630252101, |
| "grad_norm": 0.9674664797223852, |
| "learning_rate": 2.2428785607196405e-05, |
| "loss": 0.3563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.335666298866272, |
| "step": 375, |
| "valid_targets_mean": 1930.9, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 0.39915966386554624, |
| "grad_norm": 0.9243345478210326, |
| "learning_rate": 2.2728635682158923e-05, |
| "loss": 0.3336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33842527866363525, |
| "step": 380, |
| "valid_targets_mean": 2132.2, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 0.40441176470588236, |
| "grad_norm": 0.8789172880338919, |
| "learning_rate": 2.302848575712144e-05, |
| "loss": 0.3538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3681184947490692, |
| "step": 385, |
| "valid_targets_mean": 2242.4, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 0.4096638655462185, |
| "grad_norm": 0.8586032021607275, |
| "learning_rate": 2.3328335832083958e-05, |
| "loss": 0.3611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40162259340286255, |
| "step": 390, |
| "valid_targets_mean": 2104.2, |
| "valid_targets_min": 1341 |
| }, |
| { |
| "epoch": 0.41491596638655465, |
| "grad_norm": 0.7759128620985057, |
| "learning_rate": 2.362818590704648e-05, |
| "loss": 0.3534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30948907136917114, |
| "step": 395, |
| "valid_targets_mean": 2376.9, |
| "valid_targets_min": 1305 |
| }, |
| { |
| "epoch": 0.42016806722689076, |
| "grad_norm": 0.8511116280560821, |
| "learning_rate": 2.3928035982009e-05, |
| "loss": 0.3428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.335288405418396, |
| "step": 400, |
| "valid_targets_mean": 2221.9, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 0.4254201680672269, |
| "grad_norm": 0.8282588416488064, |
| "learning_rate": 2.4227886056971515e-05, |
| "loss": 0.3246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2992272973060608, |
| "step": 405, |
| "valid_targets_mean": 2456.8, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 0.43067226890756305, |
| "grad_norm": 0.8894895733438389, |
| "learning_rate": 2.4527736131934036e-05, |
| "loss": 0.3417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3676615357398987, |
| "step": 410, |
| "valid_targets_mean": 2224.9, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 0.43592436974789917, |
| "grad_norm": 0.6776249586308555, |
| "learning_rate": 2.4827586206896553e-05, |
| "loss": 0.3381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3416297435760498, |
| "step": 415, |
| "valid_targets_mean": 3067.1, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 0.4411764705882353, |
| "grad_norm": 0.775573641251283, |
| "learning_rate": 2.5127436281859074e-05, |
| "loss": 0.3254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33019617199897766, |
| "step": 420, |
| "valid_targets_mean": 2569.1, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 0.44642857142857145, |
| "grad_norm": 0.8373072328217271, |
| "learning_rate": 2.542728635682159e-05, |
| "loss": 0.3402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33131086826324463, |
| "step": 425, |
| "valid_targets_mean": 2256.8, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 0.45168067226890757, |
| "grad_norm": 0.8453545100732337, |
| "learning_rate": 2.572713643178411e-05, |
| "loss": 0.3243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3512518107891083, |
| "step": 430, |
| "valid_targets_mean": 2501.5, |
| "valid_targets_min": 544 |
| }, |
| { |
| "epoch": 0.4569327731092437, |
| "grad_norm": 0.8253450678943121, |
| "learning_rate": 2.602698650674663e-05, |
| "loss": 0.3365, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3878710865974426, |
| "step": 435, |
| "valid_targets_mean": 2262.6, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 0.46218487394957986, |
| "grad_norm": 0.6830047934435176, |
| "learning_rate": 2.632683658170915e-05, |
| "loss": 0.3246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32986515760421753, |
| "step": 440, |
| "valid_targets_mean": 2881.2, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 0.46743697478991597, |
| "grad_norm": 0.7176824990335685, |
| "learning_rate": 2.6626686656671666e-05, |
| "loss": 0.3396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3406386971473694, |
| "step": 445, |
| "valid_targets_mean": 2875.5, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 0.4726890756302521, |
| "grad_norm": 0.8474215992592125, |
| "learning_rate": 2.6926536731634184e-05, |
| "loss": 0.3537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3648040294647217, |
| "step": 450, |
| "valid_targets_mean": 2027.9, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 0.47794117647058826, |
| "grad_norm": 1.095403929365044, |
| "learning_rate": 2.7226386806596705e-05, |
| "loss": 0.3518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33743467926979065, |
| "step": 455, |
| "valid_targets_mean": 2896.9, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 0.4831932773109244, |
| "grad_norm": 0.7470324162963815, |
| "learning_rate": 2.752623688155922e-05, |
| "loss": 0.3492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.322024405002594, |
| "step": 460, |
| "valid_targets_mean": 2677.2, |
| "valid_targets_min": 1139 |
| }, |
| { |
| "epoch": 0.4884453781512605, |
| "grad_norm": 0.7287288163080067, |
| "learning_rate": 2.782608695652174e-05, |
| "loss": 0.3337, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3294079601764679, |
| "step": 465, |
| "valid_targets_mean": 2836.6, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 0.49369747899159666, |
| "grad_norm": 0.7571889256497794, |
| "learning_rate": 2.812593703148426e-05, |
| "loss": 0.3408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3153488337993622, |
| "step": 470, |
| "valid_targets_mean": 2510.1, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 0.4989495798319328, |
| "grad_norm": 0.7390238171828771, |
| "learning_rate": 2.8425787106446782e-05, |
| "loss": 0.3346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3535560965538025, |
| "step": 475, |
| "valid_targets_mean": 2723.5, |
| "valid_targets_min": 1336 |
| }, |
| { |
| "epoch": 0.5042016806722689, |
| "grad_norm": 0.7519915733907849, |
| "learning_rate": 2.8725637181409296e-05, |
| "loss": 0.3336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35906684398651123, |
| "step": 480, |
| "valid_targets_mean": 2768.1, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 0.509453781512605, |
| "grad_norm": 0.8835497372225222, |
| "learning_rate": 2.9025487256371818e-05, |
| "loss": 0.3071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30021750926971436, |
| "step": 485, |
| "valid_targets_mean": 1918.7, |
| "valid_targets_min": 595 |
| }, |
| { |
| "epoch": 0.5147058823529411, |
| "grad_norm": 0.7720200309244449, |
| "learning_rate": 2.9325337331334335e-05, |
| "loss": 0.3371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2973299026489258, |
| "step": 490, |
| "valid_targets_mean": 2384.1, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 0.5199579831932774, |
| "grad_norm": 0.7920180853215862, |
| "learning_rate": 2.9625187406296856e-05, |
| "loss": 0.3357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31775835156440735, |
| "step": 495, |
| "valid_targets_mean": 2716.2, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 0.5252100840336135, |
| "grad_norm": 0.8442161626685477, |
| "learning_rate": 2.992503748125937e-05, |
| "loss": 0.3404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.304614782333374, |
| "step": 500, |
| "valid_targets_mean": 1944.6, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 0.5304621848739496, |
| "grad_norm": 0.8063704786094186, |
| "learning_rate": 3.022488755622189e-05, |
| "loss": 0.324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3063597083091736, |
| "step": 505, |
| "valid_targets_mean": 2314.1, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 0.5357142857142857, |
| "grad_norm": 0.8885170741957255, |
| "learning_rate": 3.052473763118441e-05, |
| "loss": 0.3186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.301100492477417, |
| "step": 510, |
| "valid_targets_mean": 1699.1, |
| "valid_targets_min": 649 |
| }, |
| { |
| "epoch": 0.5409663865546218, |
| "grad_norm": 0.7707180348154409, |
| "learning_rate": 3.0824587706146934e-05, |
| "loss": 0.3444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33862438797950745, |
| "step": 515, |
| "valid_targets_mean": 2648.4, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 0.5462184873949579, |
| "grad_norm": 0.7331236147987067, |
| "learning_rate": 3.112443778110945e-05, |
| "loss": 0.3572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3474993109703064, |
| "step": 520, |
| "valid_targets_mean": 2870.6, |
| "valid_targets_min": 843 |
| }, |
| { |
| "epoch": 0.5514705882352942, |
| "grad_norm": 0.9814672284053637, |
| "learning_rate": 3.142428785607197e-05, |
| "loss": 0.3307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.334958016872406, |
| "step": 525, |
| "valid_targets_mean": 2415.3, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 0.5567226890756303, |
| "grad_norm": 0.7379782030619627, |
| "learning_rate": 3.172413793103448e-05, |
| "loss": 0.3268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29642948508262634, |
| "step": 530, |
| "valid_targets_mean": 2672.1, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 0.5619747899159664, |
| "grad_norm": 0.7091140893245311, |
| "learning_rate": 3.2023988005997004e-05, |
| "loss": 0.3153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28314292430877686, |
| "step": 535, |
| "valid_targets_mean": 2483.3, |
| "valid_targets_min": 845 |
| }, |
| { |
| "epoch": 0.5672268907563025, |
| "grad_norm": 0.7575431351825522, |
| "learning_rate": 3.2323838080959525e-05, |
| "loss": 0.324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33548930287361145, |
| "step": 540, |
| "valid_targets_mean": 2529.8, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 0.5724789915966386, |
| "grad_norm": 0.7600622983828266, |
| "learning_rate": 3.262368815592204e-05, |
| "loss": 0.3395, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3454827666282654, |
| "step": 545, |
| "valid_targets_mean": 2808.9, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 0.5777310924369747, |
| "grad_norm": 0.8183170811821894, |
| "learning_rate": 3.292353823088456e-05, |
| "loss": 0.3224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35002923011779785, |
| "step": 550, |
| "valid_targets_mean": 2794.5, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 0.582983193277311, |
| "grad_norm": 0.8057355550873148, |
| "learning_rate": 3.3223388305847075e-05, |
| "loss": 0.3333, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3431859612464905, |
| "step": 555, |
| "valid_targets_mean": 2285.7, |
| "valid_targets_min": 557 |
| }, |
| { |
| "epoch": 0.5882352941176471, |
| "grad_norm": 0.6311718548224762, |
| "learning_rate": 3.3523238380809596e-05, |
| "loss": 0.3372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3158794641494751, |
| "step": 560, |
| "valid_targets_mean": 3329.5, |
| "valid_targets_min": 1114 |
| }, |
| { |
| "epoch": 0.5934873949579832, |
| "grad_norm": 0.7483509818624398, |
| "learning_rate": 3.382308845577212e-05, |
| "loss": 0.3101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.312336266040802, |
| "step": 565, |
| "valid_targets_mean": 2451.1, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 0.5987394957983193, |
| "grad_norm": 0.8180747042153188, |
| "learning_rate": 3.412293853073464e-05, |
| "loss": 0.3288, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32389289140701294, |
| "step": 570, |
| "valid_targets_mean": 2601.9, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 0.6039915966386554, |
| "grad_norm": 0.7501508192177901, |
| "learning_rate": 3.442278860569715e-05, |
| "loss": 0.3178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3347775936126709, |
| "step": 575, |
| "valid_targets_mean": 2365.9, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 0.6092436974789915, |
| "grad_norm": 0.8986962858297536, |
| "learning_rate": 3.4722638680659673e-05, |
| "loss": 0.3175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2883639931678772, |
| "step": 580, |
| "valid_targets_mean": 2002.2, |
| "valid_targets_min": 1167 |
| }, |
| { |
| "epoch": 0.6144957983193278, |
| "grad_norm": 0.7802444960510159, |
| "learning_rate": 3.5022488755622194e-05, |
| "loss": 0.3346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32042810320854187, |
| "step": 585, |
| "valid_targets_mean": 2517.3, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 0.6197478991596639, |
| "grad_norm": 0.8123611572368629, |
| "learning_rate": 3.5322338830584716e-05, |
| "loss": 0.3421, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3365861773490906, |
| "step": 590, |
| "valid_targets_mean": 2191.0, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 0.625, |
| "grad_norm": 0.7007108414732764, |
| "learning_rate": 3.562218890554723e-05, |
| "loss": 0.3405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3454342484474182, |
| "step": 595, |
| "valid_targets_mean": 2924.4, |
| "valid_targets_min": 1165 |
| }, |
| { |
| "epoch": 0.6302521008403361, |
| "grad_norm": 0.730987978325978, |
| "learning_rate": 3.592203898050975e-05, |
| "loss": 0.3132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29325562715530396, |
| "step": 600, |
| "valid_targets_mean": 2913.4, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 0.6355042016806722, |
| "grad_norm": 0.7733724038568615, |
| "learning_rate": 3.6221889055472265e-05, |
| "loss": 0.3195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3013491928577423, |
| "step": 605, |
| "valid_targets_mean": 2295.1, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 0.6407563025210085, |
| "grad_norm": 0.8343650173831091, |
| "learning_rate": 3.6521739130434786e-05, |
| "loss": 0.3194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29321059584617615, |
| "step": 610, |
| "valid_targets_mean": 1838.8, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 0.6460084033613446, |
| "grad_norm": 0.8241043537661473, |
| "learning_rate": 3.68215892053973e-05, |
| "loss": 0.3207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32989972829818726, |
| "step": 615, |
| "valid_targets_mean": 2260.1, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 0.6512605042016807, |
| "grad_norm": 0.8204056966498567, |
| "learning_rate": 3.712143928035982e-05, |
| "loss": 0.3318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32474619150161743, |
| "step": 620, |
| "valid_targets_mean": 2229.6, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 0.6565126050420168, |
| "grad_norm": 0.7119267457996982, |
| "learning_rate": 3.742128935532234e-05, |
| "loss": 0.3374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3413497507572174, |
| "step": 625, |
| "valid_targets_mean": 2606.0, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 0.6617647058823529, |
| "grad_norm": 0.8282736254561877, |
| "learning_rate": 3.772113943028486e-05, |
| "loss": 0.3145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30755430459976196, |
| "step": 630, |
| "valid_targets_mean": 1902.6, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 0.667016806722689, |
| "grad_norm": 0.7523816591845006, |
| "learning_rate": 3.802098950524738e-05, |
| "loss": 0.3373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34018948674201965, |
| "step": 635, |
| "valid_targets_mean": 2412.2, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 0.6722689075630253, |
| "grad_norm": 0.762541870874189, |
| "learning_rate": 3.83208395802099e-05, |
| "loss": 0.3223, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3180159330368042, |
| "step": 640, |
| "valid_targets_mean": 2287.2, |
| "valid_targets_min": 994 |
| }, |
| { |
| "epoch": 0.6775210084033614, |
| "grad_norm": 1.0029207465299363, |
| "learning_rate": 3.862068965517242e-05, |
| "loss": 0.3572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33629217743873596, |
| "step": 645, |
| "valid_targets_mean": 2997.9, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 0.6827731092436975, |
| "grad_norm": 0.7213964566380182, |
| "learning_rate": 3.8920539730134934e-05, |
| "loss": 0.3128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2845936417579651, |
| "step": 650, |
| "valid_targets_mean": 2431.8, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 0.6880252100840336, |
| "grad_norm": 0.8519735795162455, |
| "learning_rate": 3.9220389805097455e-05, |
| "loss": 0.3433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3487856984138489, |
| "step": 655, |
| "valid_targets_mean": 2218.6, |
| "valid_targets_min": 954 |
| }, |
| { |
| "epoch": 0.6932773109243697, |
| "grad_norm": 0.7046220956008892, |
| "learning_rate": 3.9520239880059976e-05, |
| "loss": 0.3199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3212737441062927, |
| "step": 660, |
| "valid_targets_mean": 2970.2, |
| "valid_targets_min": 1285 |
| }, |
| { |
| "epoch": 0.6985294117647058, |
| "grad_norm": 0.7336185220602566, |
| "learning_rate": 3.982008995502249e-05, |
| "loss": 0.3157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3486784100532532, |
| "step": 665, |
| "valid_targets_mean": 2758.5, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 0.7037815126050421, |
| "grad_norm": 0.8287435711662308, |
| "learning_rate": 3.9999989022799437e-05, |
| "loss": 0.3279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3096350431442261, |
| "step": 670, |
| "valid_targets_mean": 1968.1, |
| "valid_targets_min": 890 |
| }, |
| { |
| "epoch": 0.7090336134453782, |
| "grad_norm": 0.8202847564434639, |
| "learning_rate": 3.9999865529431466e-05, |
| "loss": 0.3302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3207584023475647, |
| "step": 675, |
| "valid_targets_mean": 2397.3, |
| "valid_targets_min": 792 |
| }, |
| { |
| "epoch": 0.7142857142857143, |
| "grad_norm": 0.6219543558575774, |
| "learning_rate": 3.9999604822044886e-05, |
| "loss": 0.3056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2984098196029663, |
| "step": 680, |
| "valid_targets_mean": 3388.2, |
| "valid_targets_min": 1117 |
| }, |
| { |
| "epoch": 0.7195378151260504, |
| "grad_norm": 0.7173660798726208, |
| "learning_rate": 3.999920690242835e-05, |
| "loss": 0.304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29944783449172974, |
| "step": 685, |
| "valid_targets_mean": 2623.8, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 0.7247899159663865, |
| "grad_norm": 0.6960902757404932, |
| "learning_rate": 3.999867177331189e-05, |
| "loss": 0.3217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3305845856666565, |
| "step": 690, |
| "valid_targets_mean": 3031.8, |
| "valid_targets_min": 1091 |
| }, |
| { |
| "epoch": 0.7300420168067226, |
| "grad_norm": 0.9054223785892286, |
| "learning_rate": 3.9997999438366895e-05, |
| "loss": 0.3396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33356064558029175, |
| "step": 695, |
| "valid_targets_mean": 2308.3, |
| "valid_targets_min": 989 |
| }, |
| { |
| "epoch": 0.7352941176470589, |
| "grad_norm": 0.7885273248848218, |
| "learning_rate": 3.9997189902206065e-05, |
| "loss": 0.3376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35361307859420776, |
| "step": 700, |
| "valid_targets_mean": 2145.7, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 0.740546218487395, |
| "grad_norm": 0.7007173394110273, |
| "learning_rate": 3.999624317038344e-05, |
| "loss": 0.3054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3023601770401001, |
| "step": 705, |
| "valid_targets_mean": 3050.5, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 0.7457983193277311, |
| "grad_norm": 0.6606567930836675, |
| "learning_rate": 3.9995159249394303e-05, |
| "loss": 0.3167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34521594643592834, |
| "step": 710, |
| "valid_targets_mean": 2787.5, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 0.7510504201680672, |
| "grad_norm": 0.7674014202376552, |
| "learning_rate": 3.999393814667517e-05, |
| "loss": 0.3251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3120829164981842, |
| "step": 715, |
| "valid_targets_mean": 2107.4, |
| "valid_targets_min": 771 |
| }, |
| { |
| "epoch": 0.7563025210084033, |
| "grad_norm": 0.778065171637885, |
| "learning_rate": 3.9992579870603695e-05, |
| "loss": 0.3154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3578265905380249, |
| "step": 720, |
| "valid_targets_mean": 2320.1, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 0.7615546218487395, |
| "grad_norm": 0.6597642723911712, |
| "learning_rate": 3.999108443049869e-05, |
| "loss": 0.3072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3022955656051636, |
| "step": 725, |
| "valid_targets_mean": 2848.9, |
| "valid_targets_min": 1035 |
| }, |
| { |
| "epoch": 0.7668067226890757, |
| "grad_norm": 0.7875093632298531, |
| "learning_rate": 3.998945183661997e-05, |
| "loss": 0.3373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2969299256801605, |
| "step": 730, |
| "valid_targets_mean": 2284.4, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 0.7720588235294118, |
| "grad_norm": 0.718806100635945, |
| "learning_rate": 3.9987682100168376e-05, |
| "loss": 0.314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30758941173553467, |
| "step": 735, |
| "valid_targets_mean": 3248.9, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 0.7773109243697479, |
| "grad_norm": 0.6716380195670248, |
| "learning_rate": 3.99857752332856e-05, |
| "loss": 0.3062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29802027344703674, |
| "step": 740, |
| "valid_targets_mean": 2760.8, |
| "valid_targets_min": 917 |
| }, |
| { |
| "epoch": 0.782563025210084, |
| "grad_norm": 0.7048509390731609, |
| "learning_rate": 3.998373124905418e-05, |
| "loss": 0.3266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.346552312374115, |
| "step": 745, |
| "valid_targets_mean": 2789.3, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 0.7878151260504201, |
| "grad_norm": 0.6889434405961281, |
| "learning_rate": 3.9981550161497375e-05, |
| "loss": 0.3285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30958837270736694, |
| "step": 750, |
| "valid_targets_mean": 2730.2, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 0.7930672268907563, |
| "grad_norm": 0.830218274291599, |
| "learning_rate": 3.9979231985579074e-05, |
| "loss": 0.3098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29535311460494995, |
| "step": 755, |
| "valid_targets_mean": 2651.5, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 0.7983193277310925, |
| "grad_norm": 0.869991526672995, |
| "learning_rate": 3.99767767372037e-05, |
| "loss": 0.3155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2807968854904175, |
| "step": 760, |
| "valid_targets_mean": 1711.4, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 0.8035714285714286, |
| "grad_norm": 0.7081493643105407, |
| "learning_rate": 3.997418443321609e-05, |
| "loss": 0.3097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32702767848968506, |
| "step": 765, |
| "valid_targets_mean": 2585.1, |
| "valid_targets_min": 572 |
| }, |
| { |
| "epoch": 0.8088235294117647, |
| "grad_norm": 0.8332144275405594, |
| "learning_rate": 3.997145509140138e-05, |
| "loss": 0.3095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31555208563804626, |
| "step": 770, |
| "valid_targets_mean": 2041.9, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 0.8140756302521008, |
| "grad_norm": 0.6009347239627268, |
| "learning_rate": 3.9968588730484896e-05, |
| "loss": 0.3284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34607839584350586, |
| "step": 775, |
| "valid_targets_mean": 3614.8, |
| "valid_targets_min": 1437 |
| }, |
| { |
| "epoch": 0.819327731092437, |
| "grad_norm": 0.7137919217562437, |
| "learning_rate": 3.9965585370132013e-05, |
| "loss": 0.314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30686646699905396, |
| "step": 780, |
| "valid_targets_mean": 2493.3, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 0.8245798319327731, |
| "grad_norm": 0.921127052828424, |
| "learning_rate": 3.996244503094804e-05, |
| "loss": 0.3143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29819056391716003, |
| "step": 785, |
| "valid_targets_mean": 1954.9, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 0.8298319327731093, |
| "grad_norm": 0.7650761079657684, |
| "learning_rate": 3.995916773447804e-05, |
| "loss": 0.3196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2871814966201782, |
| "step": 790, |
| "valid_targets_mean": 2216.4, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 0.8350840336134454, |
| "grad_norm": 0.7916639791964368, |
| "learning_rate": 3.995575350320671e-05, |
| "loss": 0.3237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3441137373447418, |
| "step": 795, |
| "valid_targets_mean": 2616.8, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 0.8403361344537815, |
| "grad_norm": 0.6287517180487977, |
| "learning_rate": 3.995220236055824e-05, |
| "loss": 0.3135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31627726554870605, |
| "step": 800, |
| "valid_targets_mean": 3041.9, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 0.8455882352941176, |
| "grad_norm": 0.6231303563829806, |
| "learning_rate": 3.99485143308961e-05, |
| "loss": 0.3099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3036961853504181, |
| "step": 805, |
| "valid_targets_mean": 3131.9, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 0.8508403361344538, |
| "grad_norm": 0.7183070177297722, |
| "learning_rate": 3.994468943952296e-05, |
| "loss": 0.3272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32938453555107117, |
| "step": 810, |
| "valid_targets_mean": 2472.3, |
| "valid_targets_min": 867 |
| }, |
| { |
| "epoch": 0.8560924369747899, |
| "grad_norm": 0.7681753001830797, |
| "learning_rate": 3.994072771268041e-05, |
| "loss": 0.3195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3146156072616577, |
| "step": 815, |
| "valid_targets_mean": 2485.6, |
| "valid_targets_min": 903 |
| }, |
| { |
| "epoch": 0.8613445378151261, |
| "grad_norm": 0.6508689610348719, |
| "learning_rate": 3.993662917754885e-05, |
| "loss": 0.3127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32557421922683716, |
| "step": 820, |
| "valid_targets_mean": 2845.4, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 0.8665966386554622, |
| "grad_norm": 0.7108824995997928, |
| "learning_rate": 3.993239386224732e-05, |
| "loss": 0.3082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27090033888816833, |
| "step": 825, |
| "valid_targets_mean": 2473.5, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 0.8718487394957983, |
| "grad_norm": 0.7733012632993366, |
| "learning_rate": 3.992802179583322e-05, |
| "loss": 0.3199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32703638076782227, |
| "step": 830, |
| "valid_targets_mean": 2476.1, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 0.8771008403361344, |
| "grad_norm": 0.725543154459089, |
| "learning_rate": 3.9923513008302204e-05, |
| "loss": 0.3169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34420400857925415, |
| "step": 835, |
| "valid_targets_mean": 2456.4, |
| "valid_targets_min": 1279 |
| }, |
| { |
| "epoch": 0.8823529411764706, |
| "grad_norm": 0.6577502601354023, |
| "learning_rate": 3.991886753058792e-05, |
| "loss": 0.3014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27701324224472046, |
| "step": 840, |
| "valid_targets_mean": 2375.6, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 0.8876050420168067, |
| "grad_norm": 0.6971018819451299, |
| "learning_rate": 3.991408539456182e-05, |
| "loss": 0.3292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29996004700660706, |
| "step": 845, |
| "valid_targets_mean": 2597.3, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 0.8928571428571429, |
| "grad_norm": 0.6864026260317219, |
| "learning_rate": 3.990916663303293e-05, |
| "loss": 0.3211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3099818229675293, |
| "step": 850, |
| "valid_targets_mean": 2555.9, |
| "valid_targets_min": 1232 |
| }, |
| { |
| "epoch": 0.898109243697479, |
| "grad_norm": 0.6612404353720289, |
| "learning_rate": 3.990411127974762e-05, |
| "loss": 0.2985, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32130175828933716, |
| "step": 855, |
| "valid_targets_mean": 3308.6, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 0.9033613445378151, |
| "grad_norm": 0.8109760616029387, |
| "learning_rate": 3.989891936938939e-05, |
| "loss": 0.297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30671462416648865, |
| "step": 860, |
| "valid_targets_mean": 1730.1, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 0.9086134453781513, |
| "grad_norm": 0.7674061973927943, |
| "learning_rate": 3.9893590937578634e-05, |
| "loss": 0.3084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35476604104042053, |
| "step": 865, |
| "valid_targets_mean": 1927.0, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 0.9138655462184874, |
| "grad_norm": 0.8917074057700859, |
| "learning_rate": 3.9888126020872375e-05, |
| "loss": 0.3193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3417109251022339, |
| "step": 870, |
| "valid_targets_mean": 2367.9, |
| "valid_targets_min": 956 |
| }, |
| { |
| "epoch": 0.9191176470588235, |
| "grad_norm": 0.7447344177878483, |
| "learning_rate": 3.988252465676401e-05, |
| "loss": 0.332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3013457655906677, |
| "step": 875, |
| "valid_targets_mean": 2151.2, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 0.9243697478991597, |
| "grad_norm": 0.6389313482178219, |
| "learning_rate": 3.98767868836831e-05, |
| "loss": 0.2987, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3207515478134155, |
| "step": 880, |
| "valid_targets_mean": 3044.4, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 0.9296218487394958, |
| "grad_norm": 0.7460485228221652, |
| "learning_rate": 3.987091274099504e-05, |
| "loss": 0.3008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.298840194940567, |
| "step": 885, |
| "valid_targets_mean": 2523.6, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 0.9348739495798319, |
| "grad_norm": 0.7123957413614789, |
| "learning_rate": 3.986490226900084e-05, |
| "loss": 0.2958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3151017725467682, |
| "step": 890, |
| "valid_targets_mean": 2639.6, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 0.9401260504201681, |
| "grad_norm": 0.8425889968517829, |
| "learning_rate": 3.985875550893684e-05, |
| "loss": 0.3007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3078573942184448, |
| "step": 895, |
| "valid_targets_mean": 2052.1, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 0.9453781512605042, |
| "grad_norm": 0.6910638587235646, |
| "learning_rate": 3.9852472502974386e-05, |
| "loss": 0.2981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3093729019165039, |
| "step": 900, |
| "valid_targets_mean": 2373.8, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 0.9506302521008403, |
| "grad_norm": 0.67274771832946, |
| "learning_rate": 3.984605329421961e-05, |
| "loss": 0.3064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3389376997947693, |
| "step": 905, |
| "valid_targets_mean": 2981.9, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 0.9558823529411765, |
| "grad_norm": 0.7287563442852749, |
| "learning_rate": 3.983949792671307e-05, |
| "loss": 0.2871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29178452491760254, |
| "step": 910, |
| "valid_targets_mean": 2206.9, |
| "valid_targets_min": 953 |
| }, |
| { |
| "epoch": 0.9611344537815126, |
| "grad_norm": 0.6697336132699603, |
| "learning_rate": 3.9832806445429486e-05, |
| "loss": 0.3059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2787833511829376, |
| "step": 915, |
| "valid_targets_mean": 2421.2, |
| "valid_targets_min": 1033 |
| }, |
| { |
| "epoch": 0.9663865546218487, |
| "grad_norm": 0.7721239770788888, |
| "learning_rate": 3.982597889627742e-05, |
| "loss": 0.3084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3243314027786255, |
| "step": 920, |
| "valid_targets_mean": 2458.9, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 0.9716386554621849, |
| "grad_norm": 0.6890378426610851, |
| "learning_rate": 3.981901532609896e-05, |
| "loss": 0.313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3086700439453125, |
| "step": 925, |
| "valid_targets_mean": 2401.8, |
| "valid_targets_min": 926 |
| }, |
| { |
| "epoch": 0.976890756302521, |
| "grad_norm": 0.7281226712845131, |
| "learning_rate": 3.9811915782669406e-05, |
| "loss": 0.3124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27539515495300293, |
| "step": 930, |
| "valid_targets_mean": 2145.1, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 0.9821428571428571, |
| "grad_norm": 0.7223280692952256, |
| "learning_rate": 3.980468031469691e-05, |
| "loss": 0.3144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2952006459236145, |
| "step": 935, |
| "valid_targets_mean": 2334.9, |
| "valid_targets_min": 1055 |
| }, |
| { |
| "epoch": 0.9873949579831933, |
| "grad_norm": 0.7460709191349191, |
| "learning_rate": 3.9797308971822206e-05, |
| "loss": 0.3175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3261488676071167, |
| "step": 940, |
| "valid_targets_mean": 2191.4, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 0.9926470588235294, |
| "grad_norm": 0.6186791687377395, |
| "learning_rate": 3.978980180461821e-05, |
| "loss": 0.3292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33339810371398926, |
| "step": 945, |
| "valid_targets_mean": 3133.6, |
| "valid_targets_min": 816 |
| }, |
| { |
| "epoch": 0.9978991596638656, |
| "grad_norm": 0.8177731068661213, |
| "learning_rate": 3.9782158864589696e-05, |
| "loss": 0.3013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27547362446784973, |
| "step": 950, |
| "valid_targets_mean": 1856.8, |
| "valid_targets_min": 736 |
| }, |
| { |
| "epoch": 1.0031512605042017, |
| "grad_norm": 0.7256412516546766, |
| "learning_rate": 3.977438020417293e-05, |
| "loss": 0.2844, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.305136114358902, |
| "step": 955, |
| "valid_targets_mean": 2359.5, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 1.0084033613445378, |
| "grad_norm": 0.7379697373188653, |
| "learning_rate": 3.9766465876735354e-05, |
| "loss": 0.2853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2883484661579132, |
| "step": 960, |
| "valid_targets_mean": 2517.8, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 1.013655462184874, |
| "grad_norm": 0.7450004669339628, |
| "learning_rate": 3.9758415936575155e-05, |
| "loss": 0.2694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2624656856060028, |
| "step": 965, |
| "valid_targets_mean": 2335.6, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 1.01890756302521, |
| "grad_norm": 0.8213378024423946, |
| "learning_rate": 3.975023043892094e-05, |
| "loss": 0.2998, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3582037091255188, |
| "step": 970, |
| "valid_targets_mean": 2665.7, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 1.0241596638655461, |
| "grad_norm": 1.1203862991152767, |
| "learning_rate": 3.974190943993133e-05, |
| "loss": 0.2855, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2818828821182251, |
| "step": 975, |
| "valid_targets_mean": 1555.1, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 1.0294117647058822, |
| "grad_norm": 0.5968672236493667, |
| "learning_rate": 3.973345299669461e-05, |
| "loss": 0.2909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24849054217338562, |
| "step": 980, |
| "valid_targets_mean": 3073.6, |
| "valid_targets_min": 745 |
| }, |
| { |
| "epoch": 1.0346638655462186, |
| "grad_norm": 0.6412679780590781, |
| "learning_rate": 3.972486116722828e-05, |
| "loss": 0.2966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.270571231842041, |
| "step": 985, |
| "valid_targets_mean": 2620.9, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 1.0399159663865547, |
| "grad_norm": 0.658674789610642, |
| "learning_rate": 3.971613401047872e-05, |
| "loss": 0.2928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28596004843711853, |
| "step": 990, |
| "valid_targets_mean": 2736.1, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 1.0451680672268908, |
| "grad_norm": 0.708522171289682, |
| "learning_rate": 3.970727158632075e-05, |
| "loss": 0.2791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25710612535476685, |
| "step": 995, |
| "valid_targets_mean": 2025.1, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 1.050420168067227, |
| "grad_norm": 0.8163565196188108, |
| "learning_rate": 3.969827395555721e-05, |
| "loss": 0.2842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3168991506099701, |
| "step": 1000, |
| "valid_targets_mean": 2106.7, |
| "valid_targets_min": 901 |
| }, |
| { |
| "epoch": 1.055672268907563, |
| "grad_norm": 0.7814582268431446, |
| "learning_rate": 3.968914117991857e-05, |
| "loss": 0.2953, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.269026517868042, |
| "step": 1005, |
| "valid_targets_mean": 2927.3, |
| "valid_targets_min": 936 |
| }, |
| { |
| "epoch": 1.0609243697478992, |
| "grad_norm": 0.7483470353521008, |
| "learning_rate": 3.967987332206249e-05, |
| "loss": 0.2864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2755717635154724, |
| "step": 1010, |
| "valid_targets_mean": 2053.3, |
| "valid_targets_min": 857 |
| }, |
| { |
| "epoch": 1.0661764705882353, |
| "grad_norm": 0.6950043296063686, |
| "learning_rate": 3.967047044557341e-05, |
| "loss": 0.2927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2624019682407379, |
| "step": 1015, |
| "valid_targets_mean": 2560.6, |
| "valid_targets_min": 918 |
| }, |
| { |
| "epoch": 1.0714285714285714, |
| "grad_norm": 0.7326135503168667, |
| "learning_rate": 3.966093261496208e-05, |
| "loss": 0.2827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2939094305038452, |
| "step": 1020, |
| "valid_targets_mean": 2364.4, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 1.0766806722689075, |
| "grad_norm": 0.7595424312977608, |
| "learning_rate": 3.9651259895665146e-05, |
| "loss": 0.303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32039862871170044, |
| "step": 1025, |
| "valid_targets_mean": 2230.6, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 1.0819327731092436, |
| "grad_norm": 0.745092373926396, |
| "learning_rate": 3.9641452354044687e-05, |
| "loss": 0.2933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30866172909736633, |
| "step": 1030, |
| "valid_targets_mean": 2336.8, |
| "valid_targets_min": 1140 |
| }, |
| { |
| "epoch": 1.0871848739495797, |
| "grad_norm": 0.7617543273247012, |
| "learning_rate": 3.9631510057387765e-05, |
| "loss": 0.2765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2596009075641632, |
| "step": 1035, |
| "valid_targets_mean": 2062.8, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 1.092436974789916, |
| "grad_norm": 0.8286121150834354, |
| "learning_rate": 3.962143307390596e-05, |
| "loss": 0.2798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2832181453704834, |
| "step": 1040, |
| "valid_targets_mean": 2286.1, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 1.0976890756302522, |
| "grad_norm": 0.8421971274176083, |
| "learning_rate": 3.961122147273491e-05, |
| "loss": 0.28, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31647855043411255, |
| "step": 1045, |
| "valid_targets_mean": 2367.7, |
| "valid_targets_min": 1091 |
| }, |
| { |
| "epoch": 1.1029411764705883, |
| "grad_norm": 0.7098338434234529, |
| "learning_rate": 3.9600875323933826e-05, |
| "loss": 0.2787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30434438586235046, |
| "step": 1050, |
| "valid_targets_mean": 2628.7, |
| "valid_targets_min": 1227 |
| }, |
| { |
| "epoch": 1.1081932773109244, |
| "grad_norm": 0.6866219477953722, |
| "learning_rate": 3.959039469848502e-05, |
| "loss": 0.2878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29877203702926636, |
| "step": 1055, |
| "valid_targets_mean": 2690.5, |
| "valid_targets_min": 666 |
| }, |
| { |
| "epoch": 1.1134453781512605, |
| "grad_norm": 0.6372603497209481, |
| "learning_rate": 3.9579779668293416e-05, |
| "loss": 0.3004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28999483585357666, |
| "step": 1060, |
| "valid_targets_mean": 2948.1, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 1.1186974789915967, |
| "grad_norm": 0.6799822940846726, |
| "learning_rate": 3.956903030618605e-05, |
| "loss": 0.2797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27467814087867737, |
| "step": 1065, |
| "valid_targets_mean": 2615.4, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 1.1239495798319328, |
| "grad_norm": 0.7809972116466566, |
| "learning_rate": 3.955814668591156e-05, |
| "loss": 0.2837, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27500802278518677, |
| "step": 1070, |
| "valid_targets_mean": 2294.4, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 1.129201680672269, |
| "grad_norm": 0.7524552269972444, |
| "learning_rate": 3.9547128882139735e-05, |
| "loss": 0.274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2802833616733551, |
| "step": 1075, |
| "valid_targets_mean": 2288.1, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 1.134453781512605, |
| "grad_norm": 0.6658052832741743, |
| "learning_rate": 3.9535976970460925e-05, |
| "loss": 0.3048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3079906702041626, |
| "step": 1080, |
| "valid_targets_mean": 3495.8, |
| "valid_targets_min": 1241 |
| }, |
| { |
| "epoch": 1.1397058823529411, |
| "grad_norm": 0.7347104088170611, |
| "learning_rate": 3.9524691027385585e-05, |
| "loss": 0.2912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31090694665908813, |
| "step": 1085, |
| "valid_targets_mean": 2511.8, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 1.1449579831932772, |
| "grad_norm": 0.6724112220847397, |
| "learning_rate": 3.95132711303437e-05, |
| "loss": 0.2997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30762532353401184, |
| "step": 1090, |
| "valid_targets_mean": 2850.2, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 1.1502100840336134, |
| "grad_norm": 0.8334744080367508, |
| "learning_rate": 3.9501717357684315e-05, |
| "loss": 0.2775, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28743976354599, |
| "step": 1095, |
| "valid_targets_mean": 2099.1, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 1.1554621848739495, |
| "grad_norm": 0.7032590588711007, |
| "learning_rate": 3.9490029788674934e-05, |
| "loss": 0.2917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2826242446899414, |
| "step": 1100, |
| "valid_targets_mean": 2369.9, |
| "valid_targets_min": 1013 |
| }, |
| { |
| "epoch": 1.1607142857142858, |
| "grad_norm": 1.221702121249645, |
| "learning_rate": 3.9478208503501e-05, |
| "loss": 0.288, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2712562680244446, |
| "step": 1105, |
| "valid_targets_mean": 2393.2, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 1.165966386554622, |
| "grad_norm": 0.7494443041520203, |
| "learning_rate": 3.946625358326538e-05, |
| "loss": 0.266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2519804835319519, |
| "step": 1110, |
| "valid_targets_mean": 1945.5, |
| "valid_targets_min": 637 |
| }, |
| { |
| "epoch": 1.171218487394958, |
| "grad_norm": 0.5997164956764384, |
| "learning_rate": 3.945416510998775e-05, |
| "loss": 0.2959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2693081498146057, |
| "step": 1115, |
| "valid_targets_mean": 3155.6, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 1.1764705882352942, |
| "grad_norm": 0.6293715830721176, |
| "learning_rate": 3.944194316660406e-05, |
| "loss": 0.2876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2860058546066284, |
| "step": 1120, |
| "valid_targets_mean": 2777.3, |
| "valid_targets_min": 955 |
| }, |
| { |
| "epoch": 1.1817226890756303, |
| "grad_norm": 0.7097668355853033, |
| "learning_rate": 3.942958783696598e-05, |
| "loss": 0.2818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2959762215614319, |
| "step": 1125, |
| "valid_targets_mean": 2465.1, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 1.1869747899159664, |
| "grad_norm": 0.6825216992106221, |
| "learning_rate": 3.94170992058403e-05, |
| "loss": 0.2773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27206242084503174, |
| "step": 1130, |
| "valid_targets_mean": 2581.8, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 1.1922268907563025, |
| "grad_norm": 0.6192081356673204, |
| "learning_rate": 3.9404477358908354e-05, |
| "loss": 0.264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25278788805007935, |
| "step": 1135, |
| "valid_targets_mean": 2664.7, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 1.1974789915966386, |
| "grad_norm": 0.811292426338912, |
| "learning_rate": 3.9391722382765445e-05, |
| "loss": 0.2948, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29716646671295166, |
| "step": 1140, |
| "valid_targets_mean": 1980.2, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 1.2027310924369747, |
| "grad_norm": 0.7668088242832095, |
| "learning_rate": 3.937883436492025e-05, |
| "loss": 0.2877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27448099851608276, |
| "step": 1145, |
| "valid_targets_mean": 1986.5, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 1.2079831932773109, |
| "grad_norm": 0.7413211114263699, |
| "learning_rate": 3.9365813393794186e-05, |
| "loss": 0.2983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2899211049079895, |
| "step": 1150, |
| "valid_targets_mean": 2858.4, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 1.213235294117647, |
| "grad_norm": 0.7546705832538436, |
| "learning_rate": 3.9352659558720836e-05, |
| "loss": 0.2826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2793716490268707, |
| "step": 1155, |
| "valid_targets_mean": 2138.5, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 1.2184873949579833, |
| "grad_norm": 0.782588277733481, |
| "learning_rate": 3.933937294994535e-05, |
| "loss": 0.2912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2977146804332733, |
| "step": 1160, |
| "valid_targets_mean": 2275.8, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 1.2237394957983194, |
| "grad_norm": 0.8153448615714938, |
| "learning_rate": 3.932595365862379e-05, |
| "loss": 0.2974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3228553533554077, |
| "step": 1165, |
| "valid_targets_mean": 2634.8, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 1.2289915966386555, |
| "grad_norm": 0.792990263276749, |
| "learning_rate": 3.9312401776822504e-05, |
| "loss": 0.2789, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26295557618141174, |
| "step": 1170, |
| "valid_targets_mean": 1794.0, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 1.2342436974789917, |
| "grad_norm": 0.6797271279062665, |
| "learning_rate": 3.9298717397517546e-05, |
| "loss": 0.2678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27940213680267334, |
| "step": 1175, |
| "valid_targets_mean": 2708.9, |
| "valid_targets_min": 1078 |
| }, |
| { |
| "epoch": 1.2394957983193278, |
| "grad_norm": 0.6849285603022243, |
| "learning_rate": 3.928490061459396e-05, |
| "loss": 0.2776, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2747243046760559, |
| "step": 1180, |
| "valid_targets_mean": 2251.1, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 1.2447478991596639, |
| "grad_norm": 0.7245761997254816, |
| "learning_rate": 3.927095152284521e-05, |
| "loss": 0.2924, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3488772511482239, |
| "step": 1185, |
| "valid_targets_mean": 3074.4, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 1.25, |
| "grad_norm": 0.7010066220238207, |
| "learning_rate": 3.925687021797249e-05, |
| "loss": 0.2834, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29797542095184326, |
| "step": 1190, |
| "valid_targets_mean": 2721.6, |
| "valid_targets_min": 867 |
| }, |
| { |
| "epoch": 1.2552521008403361, |
| "grad_norm": 1.0179359955088225, |
| "learning_rate": 3.924265679658407e-05, |
| "loss": 0.285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27947139739990234, |
| "step": 1195, |
| "valid_targets_mean": 1642.1, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 1.2605042016806722, |
| "grad_norm": 0.7149247912396931, |
| "learning_rate": 3.922831135619462e-05, |
| "loss": 0.2831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2821911573410034, |
| "step": 1200, |
| "valid_targets_mean": 2422.2, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 1.2657563025210083, |
| "grad_norm": 0.7243464387956448, |
| "learning_rate": 3.9213833995224605e-05, |
| "loss": 0.2818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2676169276237488, |
| "step": 1205, |
| "valid_targets_mean": 2188.3, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 1.2710084033613445, |
| "grad_norm": 0.7370679575877426, |
| "learning_rate": 3.919922481299952e-05, |
| "loss": 0.3017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32717978954315186, |
| "step": 1210, |
| "valid_targets_mean": 2311.9, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 1.2762605042016806, |
| "grad_norm": 0.6894289625236196, |
| "learning_rate": 3.918448390974928e-05, |
| "loss": 0.2759, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26075074076652527, |
| "step": 1215, |
| "valid_targets_mean": 2090.9, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 1.2815126050420167, |
| "grad_norm": 0.8026290889025559, |
| "learning_rate": 3.9169611386607476e-05, |
| "loss": 0.2928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30541282892227173, |
| "step": 1220, |
| "valid_targets_mean": 2121.8, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 1.2867647058823528, |
| "grad_norm": 0.7771870350210088, |
| "learning_rate": 3.9154607345610746e-05, |
| "loss": 0.273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2856689691543579, |
| "step": 1225, |
| "valid_targets_mean": 2416.0, |
| "valid_targets_min": 1196 |
| }, |
| { |
| "epoch": 1.2920168067226891, |
| "grad_norm": 0.673563167861582, |
| "learning_rate": 3.913947188969801e-05, |
| "loss": 0.3009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2647175192832947, |
| "step": 1230, |
| "valid_targets_mean": 2471.2, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 1.2972689075630253, |
| "grad_norm": 0.6531080612213936, |
| "learning_rate": 3.912420512270981e-05, |
| "loss": 0.2766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22836507856845856, |
| "step": 1235, |
| "valid_targets_mean": 2253.1, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 1.3025210084033614, |
| "grad_norm": 0.7035585449641938, |
| "learning_rate": 3.910880714938757e-05, |
| "loss": 0.2851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3099633455276489, |
| "step": 1240, |
| "valid_targets_mean": 2499.9, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 1.3077731092436975, |
| "grad_norm": 0.5567277712502462, |
| "learning_rate": 3.909327807537288e-05, |
| "loss": 0.2897, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28143376111984253, |
| "step": 1245, |
| "valid_targets_mean": 3603.4, |
| "valid_targets_min": 1081 |
| }, |
| { |
| "epoch": 1.3130252100840336, |
| "grad_norm": 0.7110770433202822, |
| "learning_rate": 3.90776180072068e-05, |
| "loss": 0.2744, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2797868251800537, |
| "step": 1250, |
| "valid_targets_mean": 2393.1, |
| "valid_targets_min": 804 |
| }, |
| { |
| "epoch": 1.3182773109243697, |
| "grad_norm": 0.5586358952592809, |
| "learning_rate": 3.906182705232909e-05, |
| "loss": 0.2778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2782168388366699, |
| "step": 1255, |
| "valid_targets_mean": 4218.8, |
| "valid_targets_min": 891 |
| }, |
| { |
| "epoch": 1.3235294117647058, |
| "grad_norm": 0.7634189610982803, |
| "learning_rate": 3.904590531907751e-05, |
| "loss": 0.286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30689549446105957, |
| "step": 1260, |
| "valid_targets_mean": 2308.6, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 1.328781512605042, |
| "grad_norm": 0.660398552740273, |
| "learning_rate": 3.9029852916687034e-05, |
| "loss": 0.2895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29954206943511963, |
| "step": 1265, |
| "valid_targets_mean": 2645.9, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 1.334033613445378, |
| "grad_norm": 0.674497976039509, |
| "learning_rate": 3.9013669955289136e-05, |
| "loss": 0.2945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2616213858127594, |
| "step": 1270, |
| "valid_targets_mean": 2590.4, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 1.3392857142857144, |
| "grad_norm": 0.6745461538720665, |
| "learning_rate": 3.899735654591101e-05, |
| "loss": 0.2724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2934377193450928, |
| "step": 1275, |
| "valid_targets_mean": 2654.6, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 1.3445378151260505, |
| "grad_norm": 0.6298474437654481, |
| "learning_rate": 3.898091280047486e-05, |
| "loss": 0.2907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26556211709976196, |
| "step": 1280, |
| "valid_targets_mean": 3061.3, |
| "valid_targets_min": 905 |
| }, |
| { |
| "epoch": 1.3497899159663866, |
| "grad_norm": 0.6789724693265738, |
| "learning_rate": 3.896433883179703e-05, |
| "loss": 0.2797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24146893620491028, |
| "step": 1285, |
| "valid_targets_mean": 2094.8, |
| "valid_targets_min": 1109 |
| }, |
| { |
| "epoch": 1.3550420168067228, |
| "grad_norm": 0.7300952923000248, |
| "learning_rate": 3.894763475358736e-05, |
| "loss": 0.2687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2770267724990845, |
| "step": 1290, |
| "valid_targets_mean": 2336.6, |
| "valid_targets_min": 706 |
| }, |
| { |
| "epoch": 1.3602941176470589, |
| "grad_norm": 0.8086297463249519, |
| "learning_rate": 3.8930800680448275e-05, |
| "loss": 0.2713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26473838090896606, |
| "step": 1295, |
| "valid_targets_mean": 1924.0, |
| "valid_targets_min": 1099 |
| }, |
| { |
| "epoch": 1.365546218487395, |
| "grad_norm": 0.6977529571217691, |
| "learning_rate": 3.891383672787411e-05, |
| "loss": 0.2761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2646206021308899, |
| "step": 1300, |
| "valid_targets_mean": 2431.1, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 1.370798319327731, |
| "grad_norm": 0.7033155019588632, |
| "learning_rate": 3.889674301225025e-05, |
| "loss": 0.2746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27550557255744934, |
| "step": 1305, |
| "valid_targets_mean": 2446.4, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 1.3760504201680672, |
| "grad_norm": 0.7011256224002429, |
| "learning_rate": 3.8879519650852356e-05, |
| "loss": 0.2798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29224735498428345, |
| "step": 1310, |
| "valid_targets_mean": 2337.5, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 1.3813025210084033, |
| "grad_norm": 0.7551918929706497, |
| "learning_rate": 3.886216676184555e-05, |
| "loss": 0.2786, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25635597109794617, |
| "step": 1315, |
| "valid_targets_mean": 1767.4, |
| "valid_targets_min": 903 |
| }, |
| { |
| "epoch": 1.3865546218487395, |
| "grad_norm": 0.841773127497859, |
| "learning_rate": 3.8844684464283614e-05, |
| "loss": 0.2729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28463175892829895, |
| "step": 1320, |
| "valid_targets_mean": 2054.4, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 1.3918067226890756, |
| "grad_norm": 0.714138459758691, |
| "learning_rate": 3.882707287810817e-05, |
| "loss": 0.2829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3063795566558838, |
| "step": 1325, |
| "valid_targets_mean": 2356.1, |
| "valid_targets_min": 980 |
| }, |
| { |
| "epoch": 1.3970588235294117, |
| "grad_norm": 0.7951782867715268, |
| "learning_rate": 3.880933212414786e-05, |
| "loss": 0.2791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31758105754852295, |
| "step": 1330, |
| "valid_targets_mean": 2118.9, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 1.4023109243697478, |
| "grad_norm": 0.6803907534201502, |
| "learning_rate": 3.87914623241175e-05, |
| "loss": 0.2774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2610444724559784, |
| "step": 1335, |
| "valid_targets_mean": 2595.9, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 1.407563025210084, |
| "grad_norm": 0.7146731724902138, |
| "learning_rate": 3.877346360061728e-05, |
| "loss": 0.2903, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2991168200969696, |
| "step": 1340, |
| "valid_targets_mean": 2701.4, |
| "valid_targets_min": 931 |
| }, |
| { |
| "epoch": 1.41281512605042, |
| "grad_norm": 0.7591356155611764, |
| "learning_rate": 3.8755336077131894e-05, |
| "loss": 0.2835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2531967759132385, |
| "step": 1345, |
| "valid_targets_mean": 1822.8, |
| "valid_targets_min": 673 |
| }, |
| { |
| "epoch": 1.4180672268907564, |
| "grad_norm": 0.6930387851247973, |
| "learning_rate": 3.873707987802967e-05, |
| "loss": 0.2775, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2844356298446655, |
| "step": 1350, |
| "valid_targets_mean": 2694.1, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 1.4233193277310925, |
| "grad_norm": 0.6030534452348743, |
| "learning_rate": 3.871869512856179e-05, |
| "loss": 0.2738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2641228139400482, |
| "step": 1355, |
| "valid_targets_mean": 3138.3, |
| "valid_targets_min": 916 |
| }, |
| { |
| "epoch": 1.4285714285714286, |
| "grad_norm": 0.5730393066215059, |
| "learning_rate": 3.870018195486138e-05, |
| "loss": 0.2695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24910803139209747, |
| "step": 1360, |
| "valid_targets_mean": 3588.1, |
| "valid_targets_min": 1099 |
| }, |
| { |
| "epoch": 1.4338235294117647, |
| "grad_norm": 0.7755395352301468, |
| "learning_rate": 3.868154048394262e-05, |
| "loss": 0.276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2994786202907562, |
| "step": 1365, |
| "valid_targets_mean": 2700.9, |
| "valid_targets_min": 1110 |
| }, |
| { |
| "epoch": 1.4390756302521008, |
| "grad_norm": 0.7005171055078728, |
| "learning_rate": 3.8662770843699944e-05, |
| "loss": 0.2938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3116563558578491, |
| "step": 1370, |
| "valid_targets_mean": 2591.6, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 1.444327731092437, |
| "grad_norm": 0.7295296113213054, |
| "learning_rate": 3.8643873162907086e-05, |
| "loss": 0.2858, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2686575651168823, |
| "step": 1375, |
| "valid_targets_mean": 2169.4, |
| "valid_targets_min": 690 |
| }, |
| { |
| "epoch": 1.449579831932773, |
| "grad_norm": 0.728303365746196, |
| "learning_rate": 3.862484757121627e-05, |
| "loss": 0.3071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.343506395816803, |
| "step": 1380, |
| "valid_targets_mean": 2436.4, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 1.4548319327731092, |
| "grad_norm": 0.7264219557451437, |
| "learning_rate": 3.860569419915727e-05, |
| "loss": 0.2952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27744126319885254, |
| "step": 1385, |
| "valid_targets_mean": 2069.1, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 1.4600840336134453, |
| "grad_norm": 0.7451210015033147, |
| "learning_rate": 3.858641317813653e-05, |
| "loss": 0.2592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.264180064201355, |
| "step": 1390, |
| "valid_targets_mean": 2131.1, |
| "valid_targets_min": 530 |
| }, |
| { |
| "epoch": 1.4653361344537816, |
| "grad_norm": 0.7180216886659947, |
| "learning_rate": 3.8567004640436234e-05, |
| "loss": 0.2864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28325045108795166, |
| "step": 1395, |
| "valid_targets_mean": 2150.3, |
| "valid_targets_min": 1239 |
| }, |
| { |
| "epoch": 1.4705882352941178, |
| "grad_norm": 0.6005140811506897, |
| "learning_rate": 3.8547468719213476e-05, |
| "loss": 0.291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2805612087249756, |
| "step": 1400, |
| "valid_targets_mean": 2986.0, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 1.4758403361344539, |
| "grad_norm": 0.6701734829120335, |
| "learning_rate": 3.852780554849925e-05, |
| "loss": 0.2713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2722683250904083, |
| "step": 1405, |
| "valid_targets_mean": 2545.0, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 1.48109243697479, |
| "grad_norm": 0.7156588483612103, |
| "learning_rate": 3.850801526319761e-05, |
| "loss": 0.2917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3095453381538391, |
| "step": 1410, |
| "valid_targets_mean": 2583.2, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 1.486344537815126, |
| "grad_norm": 0.6515593357765462, |
| "learning_rate": 3.84880979990847e-05, |
| "loss": 0.278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2939472198486328, |
| "step": 1415, |
| "valid_targets_mean": 2874.5, |
| "valid_targets_min": 1405 |
| }, |
| { |
| "epoch": 1.4915966386554622, |
| "grad_norm": 0.6808237094478136, |
| "learning_rate": 3.846805389280782e-05, |
| "loss": 0.2836, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29528388381004333, |
| "step": 1420, |
| "valid_targets_mean": 2692.4, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 1.4968487394957983, |
| "grad_norm": 0.6429218218943833, |
| "learning_rate": 3.844788308188452e-05, |
| "loss": 0.2749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24127134680747986, |
| "step": 1425, |
| "valid_targets_mean": 2371.2, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 1.5021008403361344, |
| "grad_norm": 0.7293161414772861, |
| "learning_rate": 3.8427585704701634e-05, |
| "loss": 0.289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32644128799438477, |
| "step": 1430, |
| "valid_targets_mean": 2395.9, |
| "valid_targets_min": 885 |
| }, |
| { |
| "epoch": 1.5073529411764706, |
| "grad_norm": 0.6776284586447868, |
| "learning_rate": 3.840716190051433e-05, |
| "loss": 0.2978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2834451198577881, |
| "step": 1435, |
| "valid_targets_mean": 2865.2, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 1.5126050420168067, |
| "grad_norm": 0.7065935410256674, |
| "learning_rate": 3.8386611809445155e-05, |
| "loss": 0.2874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2767036557197571, |
| "step": 1440, |
| "valid_targets_mean": 2116.9, |
| "valid_targets_min": 1347 |
| }, |
| { |
| "epoch": 1.5178571428571428, |
| "grad_norm": 0.6875344935274045, |
| "learning_rate": 3.8365935572483095e-05, |
| "loss": 0.2797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25539255142211914, |
| "step": 1445, |
| "valid_targets_mean": 2034.7, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 1.523109243697479, |
| "grad_norm": 0.6114420882513082, |
| "learning_rate": 3.834513333148258e-05, |
| "loss": 0.2925, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3040091097354889, |
| "step": 1450, |
| "valid_targets_mean": 3394.8, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 1.528361344537815, |
| "grad_norm": 0.7351299306831928, |
| "learning_rate": 3.832420522916252e-05, |
| "loss": 0.2726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29218441247940063, |
| "step": 1455, |
| "valid_targets_mean": 2289.6, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 1.5336134453781511, |
| "grad_norm": 0.6742529951804918, |
| "learning_rate": 3.830315140910534e-05, |
| "loss": 0.2824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27924418449401855, |
| "step": 1460, |
| "valid_targets_mean": 2554.1, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 1.5388655462184873, |
| "grad_norm": 0.642103371520459, |
| "learning_rate": 3.8281972015755965e-05, |
| "loss": 0.2912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28389638662338257, |
| "step": 1465, |
| "valid_targets_mean": 2878.4, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 1.5441176470588234, |
| "grad_norm": 0.6652065712153472, |
| "learning_rate": 3.826066719442086e-05, |
| "loss": 0.3033, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28304386138916016, |
| "step": 1470, |
| "valid_targets_mean": 3034.9, |
| "valid_targets_min": 1390 |
| }, |
| { |
| "epoch": 1.5493697478991597, |
| "grad_norm": 0.6732297614547262, |
| "learning_rate": 3.823923709126701e-05, |
| "loss": 0.2739, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27302515506744385, |
| "step": 1475, |
| "valid_targets_mean": 2630.1, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 1.5546218487394958, |
| "grad_norm": 0.7977790582505264, |
| "learning_rate": 3.821768185332095e-05, |
| "loss": 0.2752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23856990039348602, |
| "step": 1480, |
| "valid_targets_mean": 1874.7, |
| "valid_targets_min": 895 |
| }, |
| { |
| "epoch": 1.559873949579832, |
| "grad_norm": 0.6416684613994287, |
| "learning_rate": 3.81960016284677e-05, |
| "loss": 0.2789, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2834779918193817, |
| "step": 1485, |
| "valid_targets_mean": 2730.8, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 1.565126050420168, |
| "grad_norm": 0.7215663679705727, |
| "learning_rate": 3.817419656544979e-05, |
| "loss": 0.2713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28470200300216675, |
| "step": 1490, |
| "valid_targets_mean": 2297.9, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 1.5703781512605042, |
| "grad_norm": 0.7210848118654766, |
| "learning_rate": 3.815226681386626e-05, |
| "loss": 0.3029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30118465423583984, |
| "step": 1495, |
| "valid_targets_mean": 2422.6, |
| "valid_targets_min": 672 |
| }, |
| { |
| "epoch": 1.5756302521008403, |
| "grad_norm": 0.7318400772244765, |
| "learning_rate": 3.8130212524171576e-05, |
| "loss": 0.2871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3544023036956787, |
| "step": 1500, |
| "valid_targets_mean": 2730.2, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 1.5808823529411766, |
| "grad_norm": 0.764194530000509, |
| "learning_rate": 3.810803384767465e-05, |
| "loss": 0.2668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22156544029712677, |
| "step": 1505, |
| "valid_targets_mean": 1869.6, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 1.5861344537815127, |
| "grad_norm": 0.7198936509540297, |
| "learning_rate": 3.808573093653777e-05, |
| "loss": 0.2803, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29135745763778687, |
| "step": 1510, |
| "valid_targets_mean": 2092.8, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 1.5913865546218489, |
| "grad_norm": 0.664810251317532, |
| "learning_rate": 3.806330394377556e-05, |
| "loss": 0.2671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2656877934932709, |
| "step": 1515, |
| "valid_targets_mean": 2300.4, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 1.596638655462185, |
| "grad_norm": 0.7873381808170635, |
| "learning_rate": 3.8040753023253956e-05, |
| "loss": 0.2784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2537113130092621, |
| "step": 1520, |
| "valid_targets_mean": 2188.1, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 1.601890756302521, |
| "grad_norm": 0.8013762972275075, |
| "learning_rate": 3.801807832968912e-05, |
| "loss": 0.2911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28357455134391785, |
| "step": 1525, |
| "valid_targets_mean": 1841.9, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 1.6071428571428572, |
| "grad_norm": 0.6363572479336133, |
| "learning_rate": 3.799528001864637e-05, |
| "loss": 0.2632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28672128915786743, |
| "step": 1530, |
| "valid_targets_mean": 2678.1, |
| "valid_targets_min": 804 |
| }, |
| { |
| "epoch": 1.6123949579831933, |
| "grad_norm": 0.626675259486661, |
| "learning_rate": 3.797235824653918e-05, |
| "loss": 0.2834, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2521238327026367, |
| "step": 1535, |
| "valid_targets_mean": 2923.1, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 1.6176470588235294, |
| "grad_norm": 0.7719429167065398, |
| "learning_rate": 3.7949313170628006e-05, |
| "loss": 0.2855, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26524102687835693, |
| "step": 1540, |
| "valid_targets_mean": 2188.1, |
| "valid_targets_min": 889 |
| }, |
| { |
| "epoch": 1.6228991596638656, |
| "grad_norm": 0.6140414130735539, |
| "learning_rate": 3.79261449490193e-05, |
| "loss": 0.2824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28398892283439636, |
| "step": 1545, |
| "valid_targets_mean": 2975.3, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 1.6281512605042017, |
| "grad_norm": 0.6333512043620656, |
| "learning_rate": 3.7902853740664356e-05, |
| "loss": 0.2777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25651031732559204, |
| "step": 1550, |
| "valid_targets_mean": 2676.1, |
| "valid_targets_min": 885 |
| }, |
| { |
| "epoch": 1.6334033613445378, |
| "grad_norm": 0.7945225853691145, |
| "learning_rate": 3.7879439705358286e-05, |
| "loss": 0.2886, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28769397735595703, |
| "step": 1555, |
| "valid_targets_mean": 2333.7, |
| "valid_targets_min": 1012 |
| }, |
| { |
| "epoch": 1.638655462184874, |
| "grad_norm": 0.6613578680004154, |
| "learning_rate": 3.785590300373884e-05, |
| "loss": 0.2963, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2788962423801422, |
| "step": 1560, |
| "valid_targets_mean": 2716.4, |
| "valid_targets_min": 1120 |
| }, |
| { |
| "epoch": 1.64390756302521, |
| "grad_norm": 0.6200210594873011, |
| "learning_rate": 3.7832243797285385e-05, |
| "loss": 0.2742, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30993425846099854, |
| "step": 1565, |
| "valid_targets_mean": 3246.9, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 1.6491596638655461, |
| "grad_norm": 0.6841959383278441, |
| "learning_rate": 3.780846224831775e-05, |
| "loss": 0.2795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29545074701309204, |
| "step": 1570, |
| "valid_targets_mean": 2656.0, |
| "valid_targets_min": 1143 |
| }, |
| { |
| "epoch": 1.6544117647058822, |
| "grad_norm": 0.646661736839655, |
| "learning_rate": 3.7784558519995135e-05, |
| "loss": 0.2807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2950468063354492, |
| "step": 1575, |
| "valid_targets_mean": 2778.9, |
| "valid_targets_min": 830 |
| }, |
| { |
| "epoch": 1.6596638655462184, |
| "grad_norm": 0.5963871526060771, |
| "learning_rate": 3.776053277631496e-05, |
| "loss": 0.2784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27574625611305237, |
| "step": 1580, |
| "valid_targets_mean": 2941.4, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 1.6649159663865545, |
| "grad_norm": 0.6789032459708729, |
| "learning_rate": 3.7736385182111785e-05, |
| "loss": 0.2766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28872212767601013, |
| "step": 1585, |
| "valid_targets_mean": 2428.8, |
| "valid_targets_min": 1240 |
| }, |
| { |
| "epoch": 1.6701680672268906, |
| "grad_norm": 0.8766320854428324, |
| "learning_rate": 3.771211590305614e-05, |
| "loss": 0.2937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27332085371017456, |
| "step": 1590, |
| "valid_targets_mean": 2621.5, |
| "valid_targets_min": 1095 |
| }, |
| { |
| "epoch": 1.675420168067227, |
| "grad_norm": 0.6841578200409935, |
| "learning_rate": 3.768772510565342e-05, |
| "loss": 0.2698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2623317241668701, |
| "step": 1595, |
| "valid_targets_mean": 2145.7, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 1.680672268907563, |
| "grad_norm": 0.7486173630607642, |
| "learning_rate": 3.76632129572427e-05, |
| "loss": 0.2732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.306223064661026, |
| "step": 1600, |
| "valid_targets_mean": 2413.9, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 1.6859243697478992, |
| "grad_norm": 0.6168280825117122, |
| "learning_rate": 3.763857962599565e-05, |
| "loss": 0.2747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26991304755210876, |
| "step": 1605, |
| "valid_targets_mean": 2552.2, |
| "valid_targets_min": 1097 |
| }, |
| { |
| "epoch": 1.6911764705882353, |
| "grad_norm": 0.6766304351456689, |
| "learning_rate": 3.761382528091531e-05, |
| "loss": 0.2759, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28340253233909607, |
| "step": 1610, |
| "valid_targets_mean": 2665.7, |
| "valid_targets_min": 1184 |
| }, |
| { |
| "epoch": 1.6964285714285714, |
| "grad_norm": 0.7062299801799153, |
| "learning_rate": 3.7588950091834986e-05, |
| "loss": 0.2863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27810871601104736, |
| "step": 1615, |
| "valid_targets_mean": 2484.9, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 1.7016806722689075, |
| "grad_norm": 0.6152392266872755, |
| "learning_rate": 3.756395422941706e-05, |
| "loss": 0.2823, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3008061647415161, |
| "step": 1620, |
| "valid_targets_mean": 3126.2, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 1.7069327731092439, |
| "grad_norm": 0.5905779852643404, |
| "learning_rate": 3.753883786515181e-05, |
| "loss": 0.2714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26379841566085815, |
| "step": 1625, |
| "valid_targets_mean": 3115.7, |
| "valid_targets_min": 916 |
| }, |
| { |
| "epoch": 1.71218487394958, |
| "grad_norm": 0.7318199425494478, |
| "learning_rate": 3.751360117135628e-05, |
| "loss": 0.2544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2550744414329529, |
| "step": 1630, |
| "valid_targets_mean": 2223.6, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 1.717436974789916, |
| "grad_norm": 0.663349889323202, |
| "learning_rate": 3.7488244321173025e-05, |
| "loss": 0.2836, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2922671437263489, |
| "step": 1635, |
| "valid_targets_mean": 2466.1, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 1.7226890756302522, |
| "grad_norm": 0.7439072694880867, |
| "learning_rate": 3.746276748856898e-05, |
| "loss": 0.2728, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2746467590332031, |
| "step": 1640, |
| "valid_targets_mean": 2209.7, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 1.7279411764705883, |
| "grad_norm": 0.7242128901414696, |
| "learning_rate": 3.743717084833425e-05, |
| "loss": 0.2713, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2738949656486511, |
| "step": 1645, |
| "valid_targets_mean": 2048.8, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 1.7331932773109244, |
| "grad_norm": 0.5975483868192742, |
| "learning_rate": 3.741145457608093e-05, |
| "loss": 0.2834, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2882964611053467, |
| "step": 1650, |
| "valid_targets_mean": 3101.3, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 1.7384453781512605, |
| "grad_norm": 0.7199800936223271, |
| "learning_rate": 3.738561884824183e-05, |
| "loss": 0.2895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31954213976860046, |
| "step": 1655, |
| "valid_targets_mean": 2576.0, |
| "valid_targets_min": 1213 |
| }, |
| { |
| "epoch": 1.7436974789915967, |
| "grad_norm": 0.643400369166649, |
| "learning_rate": 3.735966384206936e-05, |
| "loss": 0.2691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2960051894187927, |
| "step": 1660, |
| "valid_targets_mean": 3030.7, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 1.7489495798319328, |
| "grad_norm": 0.5952106042261482, |
| "learning_rate": 3.733358973563425e-05, |
| "loss": 0.2851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29441675543785095, |
| "step": 1665, |
| "valid_targets_mean": 3160.8, |
| "valid_targets_min": 1137 |
| }, |
| { |
| "epoch": 1.754201680672269, |
| "grad_norm": 0.6786980642043301, |
| "learning_rate": 3.730739670782435e-05, |
| "loss": 0.2809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2848990559577942, |
| "step": 1670, |
| "valid_targets_mean": 2464.0, |
| "valid_targets_min": 900 |
| }, |
| { |
| "epoch": 1.759453781512605, |
| "grad_norm": 0.6509095658222819, |
| "learning_rate": 3.72810849383434e-05, |
| "loss": 0.2678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26271501183509827, |
| "step": 1675, |
| "valid_targets_mean": 2341.4, |
| "valid_targets_min": 537 |
| }, |
| { |
| "epoch": 1.7647058823529411, |
| "grad_norm": 0.7898671503621937, |
| "learning_rate": 3.725465460770978e-05, |
| "loss": 0.3089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3113194704055786, |
| "step": 1680, |
| "valid_targets_mean": 2466.2, |
| "valid_targets_min": 846 |
| }, |
| { |
| "epoch": 1.7699579831932772, |
| "grad_norm": 0.6739070075903468, |
| "learning_rate": 3.7228105897255324e-05, |
| "loss": 0.2811, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2531262934207916, |
| "step": 1685, |
| "valid_targets_mean": 2049.8, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 1.7752100840336134, |
| "grad_norm": 0.6710697879150522, |
| "learning_rate": 3.7201438989124e-05, |
| "loss": 0.2761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28480058908462524, |
| "step": 1690, |
| "valid_targets_mean": 2619.4, |
| "valid_targets_min": 1076 |
| }, |
| { |
| "epoch": 1.7804621848739495, |
| "grad_norm": 0.662695525206772, |
| "learning_rate": 3.717465406627074e-05, |
| "loss": 0.2726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2571936547756195, |
| "step": 1695, |
| "valid_targets_mean": 2399.6, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 1.7857142857142856, |
| "grad_norm": 0.6320359884584241, |
| "learning_rate": 3.714775131246011e-05, |
| "loss": 0.2818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2644287347793579, |
| "step": 1700, |
| "valid_targets_mean": 2833.1, |
| "valid_targets_min": 1022 |
| }, |
| { |
| "epoch": 1.7909663865546217, |
| "grad_norm": 0.5608837993978538, |
| "learning_rate": 3.71207309122651e-05, |
| "loss": 0.2656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25060662627220154, |
| "step": 1705, |
| "valid_targets_mean": 3011.6, |
| "valid_targets_min": 830 |
| }, |
| { |
| "epoch": 1.7962184873949578, |
| "grad_norm": 0.7749333627981896, |
| "learning_rate": 3.709359305106585e-05, |
| "loss": 0.2835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3079194128513336, |
| "step": 1710, |
| "valid_targets_mean": 2177.3, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 1.8014705882352942, |
| "grad_norm": 0.6704960756054471, |
| "learning_rate": 3.7066337915048354e-05, |
| "loss": 0.2633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24317601323127747, |
| "step": 1715, |
| "valid_targets_mean": 2278.3, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 1.8067226890756303, |
| "grad_norm": 0.726852310035077, |
| "learning_rate": 3.7038965691203205e-05, |
| "loss": 0.2867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2838640809059143, |
| "step": 1720, |
| "valid_targets_mean": 2385.5, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 1.8119747899159664, |
| "grad_norm": 0.7307615924485396, |
| "learning_rate": 3.701147656732431e-05, |
| "loss": 0.2626, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2594029903411865, |
| "step": 1725, |
| "valid_targets_mean": 2254.4, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 1.8172268907563025, |
| "grad_norm": 0.6804119390418033, |
| "learning_rate": 3.6983870732007596e-05, |
| "loss": 0.2897, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30185481905937195, |
| "step": 1730, |
| "valid_targets_mean": 2529.1, |
| "valid_targets_min": 861 |
| }, |
| { |
| "epoch": 1.8224789915966386, |
| "grad_norm": 0.5971578197210542, |
| "learning_rate": 3.695614837464972e-05, |
| "loss": 0.2799, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2714010179042816, |
| "step": 1735, |
| "valid_targets_mean": 2919.9, |
| "valid_targets_min": 934 |
| }, |
| { |
| "epoch": 1.8277310924369747, |
| "grad_norm": 0.7432330036153248, |
| "learning_rate": 3.692830968544675e-05, |
| "loss": 0.2905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2643352150917053, |
| "step": 1740, |
| "valid_targets_mean": 2157.0, |
| "valid_targets_min": 913 |
| }, |
| { |
| "epoch": 1.832983193277311, |
| "grad_norm": 0.9451021623758795, |
| "learning_rate": 3.690035485539291e-05, |
| "loss": 0.2848, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2754422128200531, |
| "step": 1745, |
| "valid_targets_mean": 2272.9, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 1.8382352941176472, |
| "grad_norm": 0.6448983937098554, |
| "learning_rate": 3.6872284076279205e-05, |
| "loss": 0.2735, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27130642533302307, |
| "step": 1750, |
| "valid_targets_mean": 2665.2, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 1.8434873949579833, |
| "grad_norm": 0.6568847222392369, |
| "learning_rate": 3.684409754069215e-05, |
| "loss": 0.2887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28479936718940735, |
| "step": 1755, |
| "valid_targets_mean": 2863.5, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 1.8487394957983194, |
| "grad_norm": 0.9463446748898482, |
| "learning_rate": 3.681579544201244e-05, |
| "loss": 0.265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.267799973487854, |
| "step": 1760, |
| "valid_targets_mean": 2591.4, |
| "valid_targets_min": 891 |
| }, |
| { |
| "epoch": 1.8539915966386555, |
| "grad_norm": 0.6626299146737941, |
| "learning_rate": 3.6787377974413614e-05, |
| "loss": 0.275, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26858189702033997, |
| "step": 1765, |
| "valid_targets_mean": 2298.1, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 1.8592436974789917, |
| "grad_norm": 0.5511447233080423, |
| "learning_rate": 3.6758845332860734e-05, |
| "loss": 0.2641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25503212213516235, |
| "step": 1770, |
| "valid_targets_mean": 3300.6, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 1.8644957983193278, |
| "grad_norm": 0.6864216219048197, |
| "learning_rate": 3.673019771310903e-05, |
| "loss": 0.2724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29600006341934204, |
| "step": 1775, |
| "valid_targets_mean": 2480.2, |
| "valid_targets_min": 607 |
| }, |
| { |
| "epoch": 1.8697478991596639, |
| "grad_norm": 0.6727603790480745, |
| "learning_rate": 3.670143531170258e-05, |
| "loss": 0.2847, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2595556974411011, |
| "step": 1780, |
| "valid_targets_mean": 2553.4, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 1.875, |
| "grad_norm": 0.6449743095704825, |
| "learning_rate": 3.667255832597294e-05, |
| "loss": 0.2719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.287334680557251, |
| "step": 1785, |
| "valid_targets_mean": 2550.0, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 1.8802521008403361, |
| "grad_norm": 0.7356297744717748, |
| "learning_rate": 3.664356695403781e-05, |
| "loss": 0.2709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2541128993034363, |
| "step": 1790, |
| "valid_targets_mean": 1760.9, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 1.8855042016806722, |
| "grad_norm": 0.6441525341607449, |
| "learning_rate": 3.661446139479965e-05, |
| "loss": 0.2722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2607778310775757, |
| "step": 1795, |
| "valid_targets_mean": 2639.6, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 1.8907563025210083, |
| "grad_norm": 0.6764765078850176, |
| "learning_rate": 3.658524184794436e-05, |
| "loss": 0.2808, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2690533399581909, |
| "step": 1800, |
| "valid_targets_mean": 2191.6, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 1.8960084033613445, |
| "grad_norm": 0.6223425261146642, |
| "learning_rate": 3.655590851393984e-05, |
| "loss": 0.266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2553020417690277, |
| "step": 1805, |
| "valid_targets_mean": 2840.2, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 1.9012605042016806, |
| "grad_norm": 0.571683682772899, |
| "learning_rate": 3.652646159403468e-05, |
| "loss": 0.2724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2515188455581665, |
| "step": 1810, |
| "valid_targets_mean": 3140.4, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 1.9065126050420167, |
| "grad_norm": 0.6705352110164979, |
| "learning_rate": 3.649690129025675e-05, |
| "loss": 0.285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28106388449668884, |
| "step": 1815, |
| "valid_targets_mean": 2872.1, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 1.9117647058823528, |
| "grad_norm": 0.6674867092826292, |
| "learning_rate": 3.6467227805411824e-05, |
| "loss": 0.2805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2530893385410309, |
| "step": 1820, |
| "valid_targets_mean": 2187.0, |
| "valid_targets_min": 1228 |
| }, |
| { |
| "epoch": 1.917016806722689, |
| "grad_norm": 0.7791624483418543, |
| "learning_rate": 3.6437441343082174e-05, |
| "loss": 0.2576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25658732652664185, |
| "step": 1825, |
| "valid_targets_mean": 1671.2, |
| "valid_targets_min": 830 |
| }, |
| { |
| "epoch": 1.9222689075630253, |
| "grad_norm": 0.7296738608202369, |
| "learning_rate": 3.6407542107625167e-05, |
| "loss": 0.2785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25650477409362793, |
| "step": 1830, |
| "valid_targets_mean": 2080.8, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 1.9275210084033614, |
| "grad_norm": 0.6401628879972454, |
| "learning_rate": 3.637753030417192e-05, |
| "loss": 0.2882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.271770179271698, |
| "step": 1835, |
| "valid_targets_mean": 2537.3, |
| "valid_targets_min": 1114 |
| }, |
| { |
| "epoch": 1.9327731092436975, |
| "grad_norm": 0.6126369558801827, |
| "learning_rate": 3.6347406138625805e-05, |
| "loss": 0.2925, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2938627600669861, |
| "step": 1840, |
| "valid_targets_mean": 2981.4, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 1.9380252100840336, |
| "grad_norm": 0.7218262814733415, |
| "learning_rate": 3.631716981766111e-05, |
| "loss": 0.2786, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30355095863342285, |
| "step": 1845, |
| "valid_targets_mean": 2301.2, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 1.9432773109243697, |
| "grad_norm": 0.668031618282193, |
| "learning_rate": 3.6286821548721594e-05, |
| "loss": 0.2752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27426058053970337, |
| "step": 1850, |
| "valid_targets_mean": 2243.2, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 1.9485294117647058, |
| "grad_norm": 0.752574443244231, |
| "learning_rate": 3.625636154001904e-05, |
| "loss": 0.2859, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3078942894935608, |
| "step": 1855, |
| "valid_targets_mean": 2398.1, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 1.9537815126050422, |
| "grad_norm": 0.7317868910075894, |
| "learning_rate": 3.622579000053186e-05, |
| "loss": 0.2737, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28089436888694763, |
| "step": 1860, |
| "valid_targets_mean": 2312.2, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 1.9590336134453783, |
| "grad_norm": 0.5809494600449272, |
| "learning_rate": 3.619510714000368e-05, |
| "loss": 0.2872, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28781622648239136, |
| "step": 1865, |
| "valid_targets_mean": 3431.6, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 1.9642857142857144, |
| "grad_norm": 0.6561581539587649, |
| "learning_rate": 3.616431316894181e-05, |
| "loss": 0.2752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2707546651363373, |
| "step": 1870, |
| "valid_targets_mean": 2314.8, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 1.9695378151260505, |
| "grad_norm": 0.6586257109850335, |
| "learning_rate": 3.613340829861592e-05, |
| "loss": 0.2674, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28310245275497437, |
| "step": 1875, |
| "valid_targets_mean": 2942.6, |
| "valid_targets_min": 936 |
| }, |
| { |
| "epoch": 1.9747899159663866, |
| "grad_norm": 0.6401802852139319, |
| "learning_rate": 3.61023927410565e-05, |
| "loss": 0.2666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.290630578994751, |
| "step": 1880, |
| "valid_targets_mean": 2797.1, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 1.9800420168067228, |
| "grad_norm": 0.6218936013613373, |
| "learning_rate": 3.607126670905346e-05, |
| "loss": 0.2807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27291837334632874, |
| "step": 1885, |
| "valid_targets_mean": 2842.4, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 1.9852941176470589, |
| "grad_norm": 0.6591905106890031, |
| "learning_rate": 3.60400304161546e-05, |
| "loss": 0.2745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24094945192337036, |
| "step": 1890, |
| "valid_targets_mean": 2038.6, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 1.990546218487395, |
| "grad_norm": 0.6093929527492841, |
| "learning_rate": 3.600868407666426e-05, |
| "loss": 0.2653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.251456618309021, |
| "step": 1895, |
| "valid_targets_mean": 2710.1, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 1.995798319327731, |
| "grad_norm": 0.7825350266466161, |
| "learning_rate": 3.597722790564172e-05, |
| "loss": 0.2824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.288199245929718, |
| "step": 1900, |
| "valid_targets_mean": 1974.7, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 2.0010504201680672, |
| "grad_norm": 0.5933761068921561, |
| "learning_rate": 3.5945662118899824e-05, |
| "loss": 0.2795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2670100927352905, |
| "step": 1905, |
| "valid_targets_mean": 3187.6, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 2.0063025210084033, |
| "grad_norm": 0.681788431886679, |
| "learning_rate": 3.5913986933003455e-05, |
| "loss": 0.2537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23222820460796356, |
| "step": 1910, |
| "valid_targets_mean": 2392.1, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 2.0115546218487395, |
| "grad_norm": 0.6959432299927795, |
| "learning_rate": 3.5882202565268046e-05, |
| "loss": 0.2578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25007233023643494, |
| "step": 1915, |
| "valid_targets_mean": 2417.9, |
| "valid_targets_min": 775 |
| }, |
| { |
| "epoch": 2.0168067226890756, |
| "grad_norm": 0.7488088088666018, |
| "learning_rate": 3.58503092337581e-05, |
| "loss": 0.2415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26307564973831177, |
| "step": 1920, |
| "valid_targets_mean": 2433.2, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 2.0220588235294117, |
| "grad_norm": 0.8762656352125061, |
| "learning_rate": 3.5818307157285705e-05, |
| "loss": 0.2404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2252756655216217, |
| "step": 1925, |
| "valid_targets_mean": 2069.1, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 2.027310924369748, |
| "grad_norm": 0.7108878947236019, |
| "learning_rate": 3.5786196555409006e-05, |
| "loss": 0.2483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2223615050315857, |
| "step": 1930, |
| "valid_targets_mean": 2248.2, |
| "valid_targets_min": 1239 |
| }, |
| { |
| "epoch": 2.032563025210084, |
| "grad_norm": 0.6819496202558551, |
| "learning_rate": 3.575397764843073e-05, |
| "loss": 0.2386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2185153365135193, |
| "step": 1935, |
| "valid_targets_mean": 2224.1, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 2.03781512605042, |
| "grad_norm": 0.6372992890667374, |
| "learning_rate": 3.572165065739664e-05, |
| "loss": 0.2442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2360488474369049, |
| "step": 1940, |
| "valid_targets_mean": 2788.4, |
| "valid_targets_min": 889 |
| }, |
| { |
| "epoch": 2.043067226890756, |
| "grad_norm": 0.6386451317642459, |
| "learning_rate": 3.5689215804094053e-05, |
| "loss": 0.2322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22324788570404053, |
| "step": 1945, |
| "valid_targets_mean": 2618.2, |
| "valid_targets_min": 994 |
| }, |
| { |
| "epoch": 2.0483193277310923, |
| "grad_norm": 0.7004427658132236, |
| "learning_rate": 3.5656673311050285e-05, |
| "loss": 0.2515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27351114153862, |
| "step": 1950, |
| "valid_targets_mean": 2478.5, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 2.0535714285714284, |
| "grad_norm": 0.7101917295820503, |
| "learning_rate": 3.562402340153115e-05, |
| "loss": 0.2297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2520638406276703, |
| "step": 1955, |
| "valid_targets_mean": 2472.2, |
| "valid_targets_min": 1105 |
| }, |
| { |
| "epoch": 2.0588235294117645, |
| "grad_norm": 0.6511098248209234, |
| "learning_rate": 3.559126629953942e-05, |
| "loss": 0.2551, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2435356080532074, |
| "step": 1960, |
| "valid_targets_mean": 3219.1, |
| "valid_targets_min": 1104 |
| }, |
| { |
| "epoch": 2.064075630252101, |
| "grad_norm": 0.6358952603701429, |
| "learning_rate": 3.5558402229813287e-05, |
| "loss": 0.2449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2297707498073578, |
| "step": 1965, |
| "valid_targets_mean": 2425.1, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 2.069327731092437, |
| "grad_norm": 0.6868889163392828, |
| "learning_rate": 3.552543141782483e-05, |
| "loss": 0.2333, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24342474341392517, |
| "step": 1970, |
| "valid_targets_mean": 2674.5, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 2.0745798319327733, |
| "grad_norm": 0.6503662588808112, |
| "learning_rate": 3.549235408977843e-05, |
| "loss": 0.2432, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23457615077495575, |
| "step": 1975, |
| "valid_targets_mean": 2697.2, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 2.0798319327731094, |
| "grad_norm": 0.822377652612648, |
| "learning_rate": 3.545917047260928e-05, |
| "loss": 0.2556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26807093620300293, |
| "step": 1980, |
| "valid_targets_mean": 1928.6, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 2.0850840336134455, |
| "grad_norm": 0.7145196067189729, |
| "learning_rate": 3.542588079398179e-05, |
| "loss": 0.2426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26111432909965515, |
| "step": 1985, |
| "valid_targets_mean": 2330.2, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 2.0903361344537816, |
| "grad_norm": 0.7523096751763567, |
| "learning_rate": 3.539248528228801e-05, |
| "loss": 0.2426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24235697090625763, |
| "step": 1990, |
| "valid_targets_mean": 2053.5, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 2.0955882352941178, |
| "grad_norm": 0.7632438420213485, |
| "learning_rate": 3.535898416664611e-05, |
| "loss": 0.2326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22527560591697693, |
| "step": 1995, |
| "valid_targets_mean": 2201.0, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 2.100840336134454, |
| "grad_norm": 0.7057387201013904, |
| "learning_rate": 3.5325377676898766e-05, |
| "loss": 0.233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25476691126823425, |
| "step": 2000, |
| "valid_targets_mean": 2419.0, |
| "valid_targets_min": 944 |
| }, |
| { |
| "epoch": 2.10609243697479, |
| "grad_norm": 0.6906581075458723, |
| "learning_rate": 3.529166604361161e-05, |
| "loss": 0.2323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19508974254131317, |
| "step": 2005, |
| "valid_targets_mean": 1831.8, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 2.111344537815126, |
| "grad_norm": 0.7527030761728207, |
| "learning_rate": 3.525784949807162e-05, |
| "loss": 0.2359, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23376065492630005, |
| "step": 2010, |
| "valid_targets_mean": 2055.6, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 2.116596638655462, |
| "grad_norm": 0.6868567018841076, |
| "learning_rate": 3.522392827228557e-05, |
| "loss": 0.2511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2521514296531677, |
| "step": 2015, |
| "valid_targets_mean": 3081.2, |
| "valid_targets_min": 1079 |
| }, |
| { |
| "epoch": 2.1218487394957983, |
| "grad_norm": 0.6159147126631715, |
| "learning_rate": 3.518990259897841e-05, |
| "loss": 0.2301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24102434515953064, |
| "step": 2020, |
| "valid_targets_mean": 3128.9, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 2.1271008403361344, |
| "grad_norm": 0.6607408752549182, |
| "learning_rate": 3.515577271159167e-05, |
| "loss": 0.2451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24916204810142517, |
| "step": 2025, |
| "valid_targets_mean": 2437.9, |
| "valid_targets_min": 895 |
| }, |
| { |
| "epoch": 2.1323529411764706, |
| "grad_norm": 0.6823759669457126, |
| "learning_rate": 3.512153884428188e-05, |
| "loss": 0.2427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24420082569122314, |
| "step": 2030, |
| "valid_targets_mean": 2662.5, |
| "valid_targets_min": 1212 |
| }, |
| { |
| "epoch": 2.1376050420168067, |
| "grad_norm": 0.8063415806620354, |
| "learning_rate": 3.5087201231918944e-05, |
| "loss": 0.2482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.255155086517334, |
| "step": 2035, |
| "valid_targets_mean": 2731.2, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 2.142857142857143, |
| "grad_norm": 0.7415414698356663, |
| "learning_rate": 3.505276011008454e-05, |
| "loss": 0.2435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23635327816009521, |
| "step": 2040, |
| "valid_targets_mean": 2135.6, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 2.148109243697479, |
| "grad_norm": 0.6907057684258697, |
| "learning_rate": 3.501821571507048e-05, |
| "loss": 0.2379, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24406486749649048, |
| "step": 2045, |
| "valid_targets_mean": 2447.7, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 2.153361344537815, |
| "grad_norm": 0.6782470155275483, |
| "learning_rate": 3.498356828387714e-05, |
| "loss": 0.2463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23916223645210266, |
| "step": 2050, |
| "valid_targets_mean": 2313.4, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 2.158613445378151, |
| "grad_norm": 0.5671322606625604, |
| "learning_rate": 3.494881805421176e-05, |
| "loss": 0.2438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19718879461288452, |
| "step": 2055, |
| "valid_targets_mean": 2824.4, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 2.1638655462184873, |
| "grad_norm": 0.9382283657965643, |
| "learning_rate": 3.4913965264486894e-05, |
| "loss": 0.2328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25609293580055237, |
| "step": 2060, |
| "valid_targets_mean": 1910.2, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 2.1691176470588234, |
| "grad_norm": 0.6346830510041134, |
| "learning_rate": 3.48790101538187e-05, |
| "loss": 0.2413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2414173036813736, |
| "step": 2065, |
| "valid_targets_mean": 2811.0, |
| "valid_targets_min": 1046 |
| }, |
| { |
| "epoch": 2.1743697478991595, |
| "grad_norm": 0.7269704066923304, |
| "learning_rate": 3.484395296202537e-05, |
| "loss": 0.2459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24697639048099518, |
| "step": 2070, |
| "valid_targets_mean": 2118.1, |
| "valid_targets_min": 1008 |
| }, |
| { |
| "epoch": 2.1796218487394956, |
| "grad_norm": 0.6343101249317197, |
| "learning_rate": 3.480879392962541e-05, |
| "loss": 0.2452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23526614904403687, |
| "step": 2075, |
| "valid_targets_mean": 2820.8, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 2.184873949579832, |
| "grad_norm": 0.7287435124218465, |
| "learning_rate": 3.477353329783606e-05, |
| "loss": 0.2366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24225783348083496, |
| "step": 2080, |
| "valid_targets_mean": 2625.6, |
| "valid_targets_min": 1045 |
| }, |
| { |
| "epoch": 2.190126050420168, |
| "grad_norm": 0.713355174077326, |
| "learning_rate": 3.4738171308571595e-05, |
| "loss": 0.2524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.254425972700119, |
| "step": 2085, |
| "valid_targets_mean": 2268.8, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 2.1953781512605044, |
| "grad_norm": 0.6705604877150245, |
| "learning_rate": 3.470270820444168e-05, |
| "loss": 0.2453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2541666328907013, |
| "step": 2090, |
| "valid_targets_mean": 2757.6, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 2.2006302521008405, |
| "grad_norm": 0.7233467972990565, |
| "learning_rate": 3.4667144228749697e-05, |
| "loss": 0.2656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25709813833236694, |
| "step": 2095, |
| "valid_targets_mean": 2277.6, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 2.2058823529411766, |
| "grad_norm": 0.7024704278871472, |
| "learning_rate": 3.463147962549109e-05, |
| "loss": 0.2302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.238604336977005, |
| "step": 2100, |
| "valid_targets_mean": 2394.7, |
| "valid_targets_min": 830 |
| }, |
| { |
| "epoch": 2.2111344537815127, |
| "grad_norm": 0.7334542386999148, |
| "learning_rate": 3.459571463935168e-05, |
| "loss": 0.2423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25194650888442993, |
| "step": 2105, |
| "valid_targets_mean": 2613.2, |
| "valid_targets_min": 1580 |
| }, |
| { |
| "epoch": 2.216386554621849, |
| "grad_norm": 0.645760996168686, |
| "learning_rate": 3.455984951570598e-05, |
| "loss": 0.2452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22080859541893005, |
| "step": 2110, |
| "valid_targets_mean": 2687.3, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 2.221638655462185, |
| "grad_norm": 0.6519130528193421, |
| "learning_rate": 3.452388450061556e-05, |
| "loss": 0.2498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2937582731246948, |
| "step": 2115, |
| "valid_targets_mean": 3205.2, |
| "valid_targets_min": 1111 |
| }, |
| { |
| "epoch": 2.226890756302521, |
| "grad_norm": 0.6624235701635455, |
| "learning_rate": 3.448781984082727e-05, |
| "loss": 0.2343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21843945980072021, |
| "step": 2120, |
| "valid_targets_mean": 2508.0, |
| "valid_targets_min": 1057 |
| }, |
| { |
| "epoch": 2.232142857142857, |
| "grad_norm": 0.7029645390202783, |
| "learning_rate": 3.4451655783771625e-05, |
| "loss": 0.2541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2414093017578125, |
| "step": 2125, |
| "valid_targets_mean": 2228.1, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 2.2373949579831933, |
| "grad_norm": 0.7968386644644923, |
| "learning_rate": 3.4415392577561064e-05, |
| "loss": 0.2339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24058222770690918, |
| "step": 2130, |
| "valid_targets_mean": 1892.4, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 2.2426470588235294, |
| "grad_norm": 0.7056496069912468, |
| "learning_rate": 3.4379030470988285e-05, |
| "loss": 0.2477, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24626708030700684, |
| "step": 2135, |
| "valid_targets_mean": 2260.1, |
| "valid_targets_min": 928 |
| }, |
| { |
| "epoch": 2.2478991596638656, |
| "grad_norm": 0.6124790183288958, |
| "learning_rate": 3.4342569713524496e-05, |
| "loss": 0.2476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22665052115917206, |
| "step": 2140, |
| "valid_targets_mean": 3020.3, |
| "valid_targets_min": 1178 |
| }, |
| { |
| "epoch": 2.2531512605042017, |
| "grad_norm": 0.7290143698690328, |
| "learning_rate": 3.4306010555317735e-05, |
| "loss": 0.2386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26667648553848267, |
| "step": 2145, |
| "valid_targets_mean": 2242.3, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 2.258403361344538, |
| "grad_norm": 0.6119475782036818, |
| "learning_rate": 3.4269353247191135e-05, |
| "loss": 0.2374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2166629135608673, |
| "step": 2150, |
| "valid_targets_mean": 2546.4, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 2.263655462184874, |
| "grad_norm": 0.6765056487027129, |
| "learning_rate": 3.423259804064122e-05, |
| "loss": 0.2492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24621796607971191, |
| "step": 2155, |
| "valid_targets_mean": 2518.2, |
| "valid_targets_min": 1296 |
| }, |
| { |
| "epoch": 2.26890756302521, |
| "grad_norm": 0.711905698459275, |
| "learning_rate": 3.419574518783616e-05, |
| "loss": 0.2287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24736756086349487, |
| "step": 2160, |
| "valid_targets_mean": 3044.6, |
| "valid_targets_min": 607 |
| }, |
| { |
| "epoch": 2.274159663865546, |
| "grad_norm": 0.6672052083995789, |
| "learning_rate": 3.4158794941614055e-05, |
| "loss": 0.2546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24737080931663513, |
| "step": 2165, |
| "valid_targets_mean": 3020.8, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 2.2794117647058822, |
| "grad_norm": 0.7567079909016078, |
| "learning_rate": 3.4121747555481216e-05, |
| "loss": 0.2381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2148715853691101, |
| "step": 2170, |
| "valid_targets_mean": 1714.9, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 2.2846638655462184, |
| "grad_norm": 0.7056947251086683, |
| "learning_rate": 3.4084603283610365e-05, |
| "loss": 0.2458, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27144932746887207, |
| "step": 2175, |
| "valid_targets_mean": 2400.7, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 2.2899159663865545, |
| "grad_norm": 0.7646246632019781, |
| "learning_rate": 3.404736238083897e-05, |
| "loss": 0.2429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23836296796798706, |
| "step": 2180, |
| "valid_targets_mean": 2148.2, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 2.2951680672268906, |
| "grad_norm": 0.6677517363916046, |
| "learning_rate": 3.401002510266744e-05, |
| "loss": 0.2433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24747160077095032, |
| "step": 2185, |
| "valid_targets_mean": 2523.8, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 2.3004201680672267, |
| "grad_norm": 0.7787607353169186, |
| "learning_rate": 3.397259170525739e-05, |
| "loss": 0.2398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24741989374160767, |
| "step": 2190, |
| "valid_targets_mean": 2161.8, |
| "valid_targets_min": 1218 |
| }, |
| { |
| "epoch": 2.3056722689075633, |
| "grad_norm": 0.6898906104395905, |
| "learning_rate": 3.393506244542991e-05, |
| "loss": 0.2345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21572214365005493, |
| "step": 2195, |
| "valid_targets_mean": 2425.9, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 2.310924369747899, |
| "grad_norm": 0.7076822593529297, |
| "learning_rate": 3.389743758066374e-05, |
| "loss": 0.2481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2650451064109802, |
| "step": 2200, |
| "valid_targets_mean": 2744.9, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 2.3161764705882355, |
| "grad_norm": 0.7536553955769041, |
| "learning_rate": 3.385971736909357e-05, |
| "loss": 0.257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2877483367919922, |
| "step": 2205, |
| "valid_targets_mean": 2068.6, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 2.3214285714285716, |
| "grad_norm": 0.7234207845549456, |
| "learning_rate": 3.382190206950822e-05, |
| "loss": 0.2504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.243576318025589, |
| "step": 2210, |
| "valid_targets_mean": 2941.5, |
| "valid_targets_min": 967 |
| }, |
| { |
| "epoch": 2.3266806722689077, |
| "grad_norm": 0.7515713668566515, |
| "learning_rate": 3.3783991941348916e-05, |
| "loss": 0.2464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.264710009098053, |
| "step": 2215, |
| "valid_targets_mean": 2004.6, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 2.331932773109244, |
| "grad_norm": 0.6251497478316201, |
| "learning_rate": 3.374598724470745e-05, |
| "loss": 0.2429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24632088840007782, |
| "step": 2220, |
| "valid_targets_mean": 2663.2, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 2.33718487394958, |
| "grad_norm": 0.6823271730426904, |
| "learning_rate": 3.370788824032441e-05, |
| "loss": 0.2411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24375592172145844, |
| "step": 2225, |
| "valid_targets_mean": 2528.2, |
| "valid_targets_min": 1099 |
| }, |
| { |
| "epoch": 2.342436974789916, |
| "grad_norm": 0.650663602449571, |
| "learning_rate": 3.366969518958746e-05, |
| "loss": 0.2552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2503768801689148, |
| "step": 2230, |
| "valid_targets_mean": 2865.1, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 2.347689075630252, |
| "grad_norm": 0.6601800895017542, |
| "learning_rate": 3.363140835452945e-05, |
| "loss": 0.2565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2578763961791992, |
| "step": 2235, |
| "valid_targets_mean": 2738.4, |
| "valid_targets_min": 1007 |
| }, |
| { |
| "epoch": 2.3529411764705883, |
| "grad_norm": 0.692317322973956, |
| "learning_rate": 3.3593027997826654e-05, |
| "loss": 0.2478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2523569166660309, |
| "step": 2240, |
| "valid_targets_mean": 2517.1, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 2.3581932773109244, |
| "grad_norm": 0.7286731675117749, |
| "learning_rate": 3.355455438279702e-05, |
| "loss": 0.228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20360924303531647, |
| "step": 2245, |
| "valid_targets_mean": 1795.9, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 2.3634453781512605, |
| "grad_norm": 0.7006474168718877, |
| "learning_rate": 3.351598777339827e-05, |
| "loss": 0.2312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2347767949104309, |
| "step": 2250, |
| "valid_targets_mean": 2666.3, |
| "valid_targets_min": 1020 |
| }, |
| { |
| "epoch": 2.3686974789915967, |
| "grad_norm": 0.5939844727687064, |
| "learning_rate": 3.3477328434226164e-05, |
| "loss": 0.2413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23968379199504852, |
| "step": 2255, |
| "valid_targets_mean": 3521.1, |
| "valid_targets_min": 1437 |
| }, |
| { |
| "epoch": 2.3739495798319328, |
| "grad_norm": 0.7625687687660169, |
| "learning_rate": 3.343857663051264e-05, |
| "loss": 0.2371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20183886587619781, |
| "step": 2260, |
| "valid_targets_mean": 1734.0, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 2.379201680672269, |
| "grad_norm": 0.7219603926351075, |
| "learning_rate": 3.339973262812403e-05, |
| "loss": 0.2486, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22381290793418884, |
| "step": 2265, |
| "valid_targets_mean": 2065.6, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 2.384453781512605, |
| "grad_norm": 0.6274958459143466, |
| "learning_rate": 3.336079669355921e-05, |
| "loss": 0.2592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26679128408432007, |
| "step": 2270, |
| "valid_targets_mean": 3185.1, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 2.389705882352941, |
| "grad_norm": 0.6780169305716136, |
| "learning_rate": 3.332176909394777e-05, |
| "loss": 0.2304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2543075978755951, |
| "step": 2275, |
| "valid_targets_mean": 2658.4, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 2.3949579831932772, |
| "grad_norm": 0.5895782853276299, |
| "learning_rate": 3.3282650097048206e-05, |
| "loss": 0.2562, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23634852468967438, |
| "step": 2280, |
| "valid_targets_mean": 3037.2, |
| "valid_targets_min": 938 |
| }, |
| { |
| "epoch": 2.4002100840336134, |
| "grad_norm": 0.7590461713759683, |
| "learning_rate": 3.324343997124606e-05, |
| "loss": 0.2388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23115390539169312, |
| "step": 2285, |
| "valid_targets_mean": 2907.3, |
| "valid_targets_min": 1192 |
| }, |
| { |
| "epoch": 2.4054621848739495, |
| "grad_norm": 0.7830457306094891, |
| "learning_rate": 3.3204138985552094e-05, |
| "loss": 0.2334, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27056723833084106, |
| "step": 2290, |
| "valid_targets_mean": 1997.1, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 2.4107142857142856, |
| "grad_norm": 0.6194407127598283, |
| "learning_rate": 3.316474740960041e-05, |
| "loss": 0.2445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19772791862487793, |
| "step": 2295, |
| "valid_targets_mean": 2389.4, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 2.4159663865546217, |
| "grad_norm": 0.6520643182398843, |
| "learning_rate": 3.312526551364667e-05, |
| "loss": 0.2378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22252126038074493, |
| "step": 2300, |
| "valid_targets_mean": 2424.2, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 2.421218487394958, |
| "grad_norm": 0.6888170634914532, |
| "learning_rate": 3.308569356856616e-05, |
| "loss": 0.2456, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24550795555114746, |
| "step": 2305, |
| "valid_targets_mean": 2487.7, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 2.426470588235294, |
| "grad_norm": 0.5982413076324926, |
| "learning_rate": 3.3046031845851993e-05, |
| "loss": 0.2497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25226032733917236, |
| "step": 2310, |
| "valid_targets_mean": 3157.9, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 2.43172268907563, |
| "grad_norm": 0.6571326373833773, |
| "learning_rate": 3.3006280617613214e-05, |
| "loss": 0.227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22074852883815765, |
| "step": 2315, |
| "valid_targets_mean": 2177.3, |
| "valid_targets_min": 651 |
| }, |
| { |
| "epoch": 2.4369747899159666, |
| "grad_norm": 0.6894533182551907, |
| "learning_rate": 3.296644015657295e-05, |
| "loss": 0.2392, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21584966778755188, |
| "step": 2320, |
| "valid_targets_mean": 2304.4, |
| "valid_targets_min": 864 |
| }, |
| { |
| "epoch": 2.4422268907563023, |
| "grad_norm": 0.6972919721870979, |
| "learning_rate": 3.292651073606652e-05, |
| "loss": 0.2328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23415690660476685, |
| "step": 2325, |
| "valid_targets_mean": 2303.6, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 2.447478991596639, |
| "grad_norm": 0.6334274393400314, |
| "learning_rate": 3.288649263003958e-05, |
| "loss": 0.239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23000667989253998, |
| "step": 2330, |
| "valid_targets_mean": 2705.6, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 2.452731092436975, |
| "grad_norm": 0.618380033342548, |
| "learning_rate": 3.284638611304623e-05, |
| "loss": 0.237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2020508050918579, |
| "step": 2335, |
| "valid_targets_mean": 2487.5, |
| "valid_targets_min": 1089 |
| }, |
| { |
| "epoch": 2.457983193277311, |
| "grad_norm": 0.6426580413501916, |
| "learning_rate": 3.280619146024714e-05, |
| "loss": 0.242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23832888901233673, |
| "step": 2340, |
| "valid_targets_mean": 2668.8, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 2.463235294117647, |
| "grad_norm": 0.6496710491874221, |
| "learning_rate": 3.2765908947407665e-05, |
| "loss": 0.2465, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24643950164318085, |
| "step": 2345, |
| "valid_targets_mean": 3095.7, |
| "valid_targets_min": 1618 |
| }, |
| { |
| "epoch": 2.4684873949579833, |
| "grad_norm": 0.6671046199265696, |
| "learning_rate": 3.2725538850895933e-05, |
| "loss": 0.2419, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24697118997573853, |
| "step": 2350, |
| "valid_targets_mean": 3175.2, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 2.4737394957983194, |
| "grad_norm": 0.608779379161093, |
| "learning_rate": 3.268508144768096e-05, |
| "loss": 0.2383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2293773591518402, |
| "step": 2355, |
| "valid_targets_mean": 2969.8, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 2.4789915966386555, |
| "grad_norm": 0.7152715550331328, |
| "learning_rate": 3.264453701533075e-05, |
| "loss": 0.2418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24297022819519043, |
| "step": 2360, |
| "valid_targets_mean": 2333.1, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 2.4842436974789917, |
| "grad_norm": 0.6884766551131825, |
| "learning_rate": 3.260390583201041e-05, |
| "loss": 0.2468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2274142950773239, |
| "step": 2365, |
| "valid_targets_mean": 2203.9, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 2.4894957983193278, |
| "grad_norm": 0.6696446459706793, |
| "learning_rate": 3.2563188176480217e-05, |
| "loss": 0.2394, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2381383329629898, |
| "step": 2370, |
| "valid_targets_mean": 2626.6, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 2.494747899159664, |
| "grad_norm": 0.6401047773492371, |
| "learning_rate": 3.252238432809368e-05, |
| "loss": 0.2466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2555871307849884, |
| "step": 2375, |
| "valid_targets_mean": 2559.3, |
| "valid_targets_min": 244 |
| }, |
| { |
| "epoch": 2.5, |
| "grad_norm": 0.7122232018012691, |
| "learning_rate": 3.2481494566795716e-05, |
| "loss": 0.2501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2375078648328781, |
| "step": 2380, |
| "valid_targets_mean": 2202.1, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 2.505252100840336, |
| "grad_norm": 0.6808348421830116, |
| "learning_rate": 3.244051917312061e-05, |
| "loss": 0.2424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23621997237205505, |
| "step": 2385, |
| "valid_targets_mean": 2670.9, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 2.5105042016806722, |
| "grad_norm": 0.6243398513672342, |
| "learning_rate": 3.239945842819018e-05, |
| "loss": 0.2523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23079396784305573, |
| "step": 2390, |
| "valid_targets_mean": 2769.6, |
| "valid_targets_min": 1140 |
| }, |
| { |
| "epoch": 2.5157563025210083, |
| "grad_norm": 0.6608060434787372, |
| "learning_rate": 3.2358312613711804e-05, |
| "loss": 0.2547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.253095418214798, |
| "step": 2395, |
| "valid_targets_mean": 2660.6, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 2.5210084033613445, |
| "grad_norm": 0.7121224716293856, |
| "learning_rate": 3.231708201197653e-05, |
| "loss": 0.2408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21336033940315247, |
| "step": 2400, |
| "valid_targets_mean": 2111.9, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 2.5262605042016806, |
| "grad_norm": 0.6338382678155583, |
| "learning_rate": 3.227576690585706e-05, |
| "loss": 0.2496, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2580583095550537, |
| "step": 2405, |
| "valid_targets_mean": 3034.8, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 2.5315126050420167, |
| "grad_norm": 0.7538479941411893, |
| "learning_rate": 3.223436757880591e-05, |
| "loss": 0.2508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22333016991615295, |
| "step": 2410, |
| "valid_targets_mean": 1899.9, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 2.536764705882353, |
| "grad_norm": 0.6566761719653834, |
| "learning_rate": 3.219288431485337e-05, |
| "loss": 0.2396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24630621075630188, |
| "step": 2415, |
| "valid_targets_mean": 2439.4, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 2.542016806722689, |
| "grad_norm": 0.6042493534650838, |
| "learning_rate": 3.2151317398605646e-05, |
| "loss": 0.2392, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25575879216194153, |
| "step": 2420, |
| "valid_targets_mean": 3347.0, |
| "valid_targets_min": 1460 |
| }, |
| { |
| "epoch": 2.5472689075630255, |
| "grad_norm": 0.6284939551656498, |
| "learning_rate": 3.2109667115242815e-05, |
| "loss": 0.2523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24401450157165527, |
| "step": 2425, |
| "valid_targets_mean": 2538.7, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 2.552521008403361, |
| "grad_norm": 0.6528228615180638, |
| "learning_rate": 3.206793375051694e-05, |
| "loss": 0.2495, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25775042176246643, |
| "step": 2430, |
| "valid_targets_mean": 2766.4, |
| "valid_targets_min": 844 |
| }, |
| { |
| "epoch": 2.5577731092436977, |
| "grad_norm": 0.6809614766621044, |
| "learning_rate": 3.2026117590750086e-05, |
| "loss": 0.2415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25471678376197815, |
| "step": 2435, |
| "valid_targets_mean": 2465.3, |
| "valid_targets_min": 800 |
| }, |
| { |
| "epoch": 2.5630252100840334, |
| "grad_norm": 0.7551843328572223, |
| "learning_rate": 3.198421892283235e-05, |
| "loss": 0.2356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2478971630334854, |
| "step": 2440, |
| "valid_targets_mean": 2033.8, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 2.56827731092437, |
| "grad_norm": 0.732748269558122, |
| "learning_rate": 3.1942238034219885e-05, |
| "loss": 0.2358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25034216046333313, |
| "step": 2445, |
| "valid_targets_mean": 2231.6, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 2.5735294117647056, |
| "grad_norm": 0.6778858165535954, |
| "learning_rate": 3.190017521293296e-05, |
| "loss": 0.2494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23393598198890686, |
| "step": 2450, |
| "valid_targets_mean": 2473.6, |
| "valid_targets_min": 706 |
| }, |
| { |
| "epoch": 2.578781512605042, |
| "grad_norm": 0.6028467351028476, |
| "learning_rate": 3.185803074755395e-05, |
| "loss": 0.2458, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2509484887123108, |
| "step": 2455, |
| "valid_targets_mean": 2993.6, |
| "valid_targets_min": 1079 |
| }, |
| { |
| "epoch": 2.5840336134453783, |
| "grad_norm": 0.7291609586754345, |
| "learning_rate": 3.1815804927225363e-05, |
| "loss": 0.2342, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2330750823020935, |
| "step": 2460, |
| "valid_targets_mean": 2394.2, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 2.5892857142857144, |
| "grad_norm": 0.7117035098015625, |
| "learning_rate": 3.1773498041647876e-05, |
| "loss": 0.2477, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2390121966600418, |
| "step": 2465, |
| "valid_targets_mean": 2322.9, |
| "valid_targets_min": 972 |
| }, |
| { |
| "epoch": 2.5945378151260505, |
| "grad_norm": 0.7267971531615649, |
| "learning_rate": 3.173111038107834e-05, |
| "loss": 0.2433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24882632493972778, |
| "step": 2470, |
| "valid_targets_mean": 2219.9, |
| "valid_targets_min": 887 |
| }, |
| { |
| "epoch": 2.5997899159663866, |
| "grad_norm": 0.6553214599651517, |
| "learning_rate": 3.168864223632776e-05, |
| "loss": 0.2386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23804202675819397, |
| "step": 2475, |
| "valid_targets_mean": 2536.0, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 2.6050420168067228, |
| "grad_norm": 0.6758403503740037, |
| "learning_rate": 3.1646093898759334e-05, |
| "loss": 0.235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23084652423858643, |
| "step": 2480, |
| "valid_targets_mean": 2361.0, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 2.610294117647059, |
| "grad_norm": 0.7731853525222528, |
| "learning_rate": 3.160346566028645e-05, |
| "loss": 0.2566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27315887808799744, |
| "step": 2485, |
| "valid_targets_mean": 1826.8, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 2.615546218487395, |
| "grad_norm": 0.7568845150659382, |
| "learning_rate": 3.156075781337068e-05, |
| "loss": 0.2446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26611223816871643, |
| "step": 2490, |
| "valid_targets_mean": 2255.1, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 2.620798319327731, |
| "grad_norm": 0.7862703099000441, |
| "learning_rate": 3.1517970651019735e-05, |
| "loss": 0.2466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26096102595329285, |
| "step": 2495, |
| "valid_targets_mean": 2134.9, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 2.6260504201680672, |
| "grad_norm": 0.67585915869592, |
| "learning_rate": 3.1475104466785536e-05, |
| "loss": 0.2462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26358675956726074, |
| "step": 2500, |
| "valid_targets_mean": 2735.0, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 2.6313025210084033, |
| "grad_norm": 0.6329275844175969, |
| "learning_rate": 3.143215955476211e-05, |
| "loss": 0.2491, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24213485419750214, |
| "step": 2505, |
| "valid_targets_mean": 2604.1, |
| "valid_targets_min": 832 |
| }, |
| { |
| "epoch": 2.6365546218487395, |
| "grad_norm": 0.6225761182265704, |
| "learning_rate": 3.138913620958365e-05, |
| "loss": 0.2581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2655182480812073, |
| "step": 2510, |
| "valid_targets_mean": 3134.6, |
| "valid_targets_min": 1472 |
| }, |
| { |
| "epoch": 2.6418067226890756, |
| "grad_norm": 0.6693316147755365, |
| "learning_rate": 3.134603472642244e-05, |
| "loss": 0.2612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2521858513355255, |
| "step": 2515, |
| "valid_targets_mean": 2876.2, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 2.6470588235294117, |
| "grad_norm": 0.7037886165836804, |
| "learning_rate": 3.1302855400986866e-05, |
| "loss": 0.2518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26977285742759705, |
| "step": 2520, |
| "valid_targets_mean": 2489.3, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 2.652310924369748, |
| "grad_norm": 0.7880145756624581, |
| "learning_rate": 3.1259598529519336e-05, |
| "loss": 0.241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24999578297138214, |
| "step": 2525, |
| "valid_targets_mean": 2124.8, |
| "valid_targets_min": 592 |
| }, |
| { |
| "epoch": 2.657563025210084, |
| "grad_norm": 0.6308106007836234, |
| "learning_rate": 3.121626440879432e-05, |
| "loss": 0.2391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2530635595321655, |
| "step": 2530, |
| "valid_targets_mean": 2594.6, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 2.66281512605042, |
| "grad_norm": 0.7372282318557066, |
| "learning_rate": 3.117285333611625e-05, |
| "loss": 0.2264, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2395913451910019, |
| "step": 2535, |
| "valid_targets_mean": 1904.2, |
| "valid_targets_min": 965 |
| }, |
| { |
| "epoch": 2.668067226890756, |
| "grad_norm": 0.667012830669792, |
| "learning_rate": 3.112936560931752e-05, |
| "loss": 0.2315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22841016948223114, |
| "step": 2540, |
| "valid_targets_mean": 2184.2, |
| "valid_targets_min": 942 |
| }, |
| { |
| "epoch": 2.6733193277310923, |
| "grad_norm": 0.6644445077742529, |
| "learning_rate": 3.108580152675642e-05, |
| "loss": 0.2501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23634028434753418, |
| "step": 2545, |
| "valid_targets_mean": 2397.2, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 2.678571428571429, |
| "grad_norm": 0.7787179904265334, |
| "learning_rate": 3.104216138731511e-05, |
| "loss": 0.2383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2434334009885788, |
| "step": 2550, |
| "valid_targets_mean": 2057.8, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 2.6838235294117645, |
| "grad_norm": 0.6846974855879137, |
| "learning_rate": 3.0998445490397546e-05, |
| "loss": 0.2379, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24789969623088837, |
| "step": 2555, |
| "valid_targets_mean": 2343.2, |
| "valid_targets_min": 518 |
| }, |
| { |
| "epoch": 2.689075630252101, |
| "grad_norm": 0.7370020291648643, |
| "learning_rate": 3.095465413592743e-05, |
| "loss": 0.2442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25336140394210815, |
| "step": 2560, |
| "valid_targets_mean": 2095.1, |
| "valid_targets_min": 530 |
| }, |
| { |
| "epoch": 2.6943277310924367, |
| "grad_norm": 0.6326410487326921, |
| "learning_rate": 3.091078762434616e-05, |
| "loss": 0.241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2503868043422699, |
| "step": 2565, |
| "valid_targets_mean": 2962.9, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 2.6995798319327733, |
| "grad_norm": 0.6774135014050404, |
| "learning_rate": 3.086684625661081e-05, |
| "loss": 0.2402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2455071359872818, |
| "step": 2570, |
| "valid_targets_mean": 2381.1, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 2.7048319327731094, |
| "grad_norm": 0.6927859104567512, |
| "learning_rate": 3.082283033419197e-05, |
| "loss": 0.2543, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29159125685691833, |
| "step": 2575, |
| "valid_targets_mean": 2816.8, |
| "valid_targets_min": 1047 |
| }, |
| { |
| "epoch": 2.7100840336134455, |
| "grad_norm": 0.6723232233408306, |
| "learning_rate": 3.077874015907174e-05, |
| "loss": 0.2481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2541651725769043, |
| "step": 2580, |
| "valid_targets_mean": 2508.1, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 2.7153361344537816, |
| "grad_norm": 0.6173987363991384, |
| "learning_rate": 3.073457603374167e-05, |
| "loss": 0.2295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2286214530467987, |
| "step": 2585, |
| "valid_targets_mean": 3016.7, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 2.7205882352941178, |
| "grad_norm": 0.7180860813557801, |
| "learning_rate": 3.069033826120066e-05, |
| "loss": 0.2476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23617371916770935, |
| "step": 2590, |
| "valid_targets_mean": 2155.6, |
| "valid_targets_min": 805 |
| }, |
| { |
| "epoch": 2.725840336134454, |
| "grad_norm": 0.6332083889121407, |
| "learning_rate": 3.064602714495286e-05, |
| "loss": 0.2303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2275339514017105, |
| "step": 2595, |
| "valid_targets_mean": 2649.5, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 2.73109243697479, |
| "grad_norm": 0.5824671695502105, |
| "learning_rate": 3.060164298900565e-05, |
| "loss": 0.2474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21272224187850952, |
| "step": 2600, |
| "valid_targets_mean": 2831.7, |
| "valid_targets_min": 1280 |
| }, |
| { |
| "epoch": 2.736344537815126, |
| "grad_norm": 0.7999352632938964, |
| "learning_rate": 3.055718609786749e-05, |
| "loss": 0.2357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23128217458724976, |
| "step": 2605, |
| "valid_targets_mean": 1753.5, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 2.741596638655462, |
| "grad_norm": 0.6862220018448458, |
| "learning_rate": 3.051265677654585e-05, |
| "loss": 0.2388, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24940389394760132, |
| "step": 2610, |
| "valid_targets_mean": 2828.1, |
| "valid_targets_min": 1251 |
| }, |
| { |
| "epoch": 2.7468487394957983, |
| "grad_norm": 0.7409612251295014, |
| "learning_rate": 3.0468055330545162e-05, |
| "loss": 0.2466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.226776584982872, |
| "step": 2615, |
| "valid_targets_mean": 2611.8, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 2.7521008403361344, |
| "grad_norm": 0.7045597400364605, |
| "learning_rate": 3.0423382065864653e-05, |
| "loss": 0.2308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22663600742816925, |
| "step": 2620, |
| "valid_targets_mean": 1957.2, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 2.7573529411764706, |
| "grad_norm": 0.7198164206409869, |
| "learning_rate": 3.0378637288996304e-05, |
| "loss": 0.2404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23351144790649414, |
| "step": 2625, |
| "valid_targets_mean": 2081.1, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 2.7626050420168067, |
| "grad_norm": 0.5873814818670327, |
| "learning_rate": 3.033382130692269e-05, |
| "loss": 0.243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21516209840774536, |
| "step": 2630, |
| "valid_targets_mean": 2769.6, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 2.767857142857143, |
| "grad_norm": 0.6335582852038116, |
| "learning_rate": 3.0288934427114955e-05, |
| "loss": 0.2364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2048596739768982, |
| "step": 2635, |
| "valid_targets_mean": 2169.6, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 2.773109243697479, |
| "grad_norm": 0.67104459281815, |
| "learning_rate": 3.0243976957530602e-05, |
| "loss": 0.2512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2463095635175705, |
| "step": 2640, |
| "valid_targets_mean": 2423.3, |
| "valid_targets_min": 702 |
| }, |
| { |
| "epoch": 2.778361344537815, |
| "grad_norm": 0.6291113433855628, |
| "learning_rate": 3.0198949206611475e-05, |
| "loss": 0.2302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.247708261013031, |
| "step": 2645, |
| "valid_targets_mean": 2842.7, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 2.783613445378151, |
| "grad_norm": 0.7183619458186878, |
| "learning_rate": 3.0153851483281582e-05, |
| "loss": 0.2478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25846749544143677, |
| "step": 2650, |
| "valid_targets_mean": 2008.1, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 2.7888655462184873, |
| "grad_norm": 0.6296111197357144, |
| "learning_rate": 3.010868409694499e-05, |
| "loss": 0.2311, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2236376702785492, |
| "step": 2655, |
| "valid_targets_mean": 2598.8, |
| "valid_targets_min": 1260 |
| }, |
| { |
| "epoch": 2.7941176470588234, |
| "grad_norm": 0.6152933998116437, |
| "learning_rate": 3.0063447357483712e-05, |
| "loss": 0.2306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22628861665725708, |
| "step": 2660, |
| "valid_targets_mean": 2571.6, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 2.79936974789916, |
| "grad_norm": 0.6612164055765357, |
| "learning_rate": 3.0018141575255587e-05, |
| "loss": 0.2464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22041192650794983, |
| "step": 2665, |
| "valid_targets_mean": 2249.2, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 2.8046218487394956, |
| "grad_norm": 0.7274917143243959, |
| "learning_rate": 2.9972767061092107e-05, |
| "loss": 0.2358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2216116338968277, |
| "step": 2670, |
| "valid_targets_mean": 1970.0, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 2.809873949579832, |
| "grad_norm": 0.6906029702041456, |
| "learning_rate": 2.9927324126296352e-05, |
| "loss": 0.2523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23099112510681152, |
| "step": 2675, |
| "valid_targets_mean": 2226.4, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 2.815126050420168, |
| "grad_norm": 0.6602585381068012, |
| "learning_rate": 2.98818130826408e-05, |
| "loss": 0.2395, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23484909534454346, |
| "step": 2680, |
| "valid_targets_mean": 2583.8, |
| "valid_targets_min": 584 |
| }, |
| { |
| "epoch": 2.8203781512605044, |
| "grad_norm": 0.700101600296082, |
| "learning_rate": 2.9836234242365204e-05, |
| "loss": 0.2446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26351702213287354, |
| "step": 2685, |
| "valid_targets_mean": 2604.2, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 2.82563025210084, |
| "grad_norm": 1.1113414468630831, |
| "learning_rate": 2.979058791817447e-05, |
| "loss": 0.2361, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2611852288246155, |
| "step": 2690, |
| "valid_targets_mean": 2256.4, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 2.8308823529411766, |
| "grad_norm": 0.6092742628805521, |
| "learning_rate": 2.974487442323647e-05, |
| "loss": 0.2433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22087091207504272, |
| "step": 2695, |
| "valid_targets_mean": 2595.6, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 2.8361344537815127, |
| "grad_norm": 0.6990782326556737, |
| "learning_rate": 2.9699094071179938e-05, |
| "loss": 0.2424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24499669671058655, |
| "step": 2700, |
| "valid_targets_mean": 2403.4, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 2.841386554621849, |
| "grad_norm": 0.6311106363395269, |
| "learning_rate": 2.9653247176092286e-05, |
| "loss": 0.2526, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23955629765987396, |
| "step": 2705, |
| "valid_targets_mean": 3173.2, |
| "valid_targets_min": 1337 |
| }, |
| { |
| "epoch": 2.846638655462185, |
| "grad_norm": 0.6466020830134367, |
| "learning_rate": 2.9607334052517466e-05, |
| "loss": 0.2356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25517964363098145, |
| "step": 2710, |
| "valid_targets_mean": 2581.2, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 2.851890756302521, |
| "grad_norm": 0.6364448114027271, |
| "learning_rate": 2.9561355015453803e-05, |
| "loss": 0.2428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23851974308490753, |
| "step": 2715, |
| "valid_targets_mean": 2660.0, |
| "valid_targets_min": 514 |
| }, |
| { |
| "epoch": 2.857142857142857, |
| "grad_norm": 0.6924312748250914, |
| "learning_rate": 2.9515310380351847e-05, |
| "loss": 0.2427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25390565395355225, |
| "step": 2720, |
| "valid_targets_mean": 2458.5, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 2.8623949579831933, |
| "grad_norm": 0.6680820681499023, |
| "learning_rate": 2.9469200463112186e-05, |
| "loss": 0.2322, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22375771403312683, |
| "step": 2725, |
| "valid_targets_mean": 2688.9, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 2.8676470588235294, |
| "grad_norm": 0.6088973094421416, |
| "learning_rate": 2.9423025580083298e-05, |
| "loss": 0.2306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20682302117347717, |
| "step": 2730, |
| "valid_targets_mean": 2755.1, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 2.8728991596638656, |
| "grad_norm": 0.6859266823062403, |
| "learning_rate": 2.937678604805938e-05, |
| "loss": 0.2342, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21406525373458862, |
| "step": 2735, |
| "valid_targets_mean": 2067.5, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 2.8781512605042017, |
| "grad_norm": 0.6634535239376516, |
| "learning_rate": 2.9330482184278168e-05, |
| "loss": 0.2381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24567797780036926, |
| "step": 2740, |
| "valid_targets_mean": 2457.8, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 2.883403361344538, |
| "grad_norm": 0.6340089258781645, |
| "learning_rate": 2.9284114306418758e-05, |
| "loss": 0.2389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2264363169670105, |
| "step": 2745, |
| "valid_targets_mean": 2580.6, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 2.888655462184874, |
| "grad_norm": 0.6682756597647231, |
| "learning_rate": 2.923768273259942e-05, |
| "loss": 0.2342, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2170996367931366, |
| "step": 2750, |
| "valid_targets_mean": 2042.1, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 2.89390756302521, |
| "grad_norm": 0.6425815374610044, |
| "learning_rate": 2.919118778137546e-05, |
| "loss": 0.2371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20629505813121796, |
| "step": 2755, |
| "valid_targets_mean": 2251.1, |
| "valid_targets_min": 779 |
| }, |
| { |
| "epoch": 2.899159663865546, |
| "grad_norm": 0.6998165427866984, |
| "learning_rate": 2.9144629771736954e-05, |
| "loss": 0.2626, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27105337381362915, |
| "step": 2760, |
| "valid_targets_mean": 2532.9, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 2.9044117647058822, |
| "grad_norm": 0.6850527077895415, |
| "learning_rate": 2.9098009023106645e-05, |
| "loss": 0.2419, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2457822561264038, |
| "step": 2765, |
| "valid_targets_mean": 2170.1, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 2.9096638655462184, |
| "grad_norm": 0.5591265461314032, |
| "learning_rate": 2.9051325855337684e-05, |
| "loss": 0.2417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23795005679130554, |
| "step": 2770, |
| "valid_targets_mean": 3337.8, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 2.9149159663865545, |
| "grad_norm": 0.7253204297962602, |
| "learning_rate": 2.90045805887115e-05, |
| "loss": 0.2298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26152512431144714, |
| "step": 2775, |
| "valid_targets_mean": 2250.4, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 2.9201680672268906, |
| "grad_norm": 0.6320606127718346, |
| "learning_rate": 2.8957773543935518e-05, |
| "loss": 0.231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22176562249660492, |
| "step": 2780, |
| "valid_targets_mean": 2631.1, |
| "valid_targets_min": 943 |
| }, |
| { |
| "epoch": 2.9254201680672267, |
| "grad_norm": 0.6808320182720331, |
| "learning_rate": 2.8910905042141046e-05, |
| "loss": 0.2378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2327442467212677, |
| "step": 2785, |
| "valid_targets_mean": 2285.2, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 2.9306722689075633, |
| "grad_norm": 0.7718275961115919, |
| "learning_rate": 2.8863975404881022e-05, |
| "loss": 0.2489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23095104098320007, |
| "step": 2790, |
| "valid_targets_mean": 1883.9, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 2.935924369747899, |
| "grad_norm": 0.6901725161531642, |
| "learning_rate": 2.881698495412781e-05, |
| "loss": 0.2383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23618492484092712, |
| "step": 2795, |
| "valid_targets_mean": 2379.7, |
| "valid_targets_min": 771 |
| }, |
| { |
| "epoch": 2.9411764705882355, |
| "grad_norm": 0.6510522678878954, |
| "learning_rate": 2.8769934012271004e-05, |
| "loss": 0.2418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26842981576919556, |
| "step": 2800, |
| "valid_targets_mean": 2957.8, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 2.946428571428571, |
| "grad_norm": 0.690393878481563, |
| "learning_rate": 2.8722822902115228e-05, |
| "loss": 0.2301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2306583821773529, |
| "step": 2805, |
| "valid_targets_mean": 2844.0, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 2.9516806722689077, |
| "grad_norm": 0.6881209587839068, |
| "learning_rate": 2.8675651946877884e-05, |
| "loss": 0.2508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26074153184890747, |
| "step": 2810, |
| "valid_targets_mean": 2694.2, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 2.956932773109244, |
| "grad_norm": 0.5892580385058059, |
| "learning_rate": 2.862842147018696e-05, |
| "loss": 0.2448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2656477689743042, |
| "step": 2815, |
| "valid_targets_mean": 3714.4, |
| "valid_targets_min": 1073 |
| }, |
| { |
| "epoch": 2.96218487394958, |
| "grad_norm": 0.6824881929007802, |
| "learning_rate": 2.858113179607881e-05, |
| "loss": 0.2421, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23978950083255768, |
| "step": 2820, |
| "valid_targets_mean": 2137.4, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 2.967436974789916, |
| "grad_norm": 0.6773521974686484, |
| "learning_rate": 2.8533783248995938e-05, |
| "loss": 0.2435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2452758550643921, |
| "step": 2825, |
| "valid_targets_mean": 2297.1, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 2.972689075630252, |
| "grad_norm": 0.7308770430795042, |
| "learning_rate": 2.848637615378475e-05, |
| "loss": 0.2534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24922780692577362, |
| "step": 2830, |
| "valid_targets_mean": 2439.7, |
| "valid_targets_min": 1055 |
| }, |
| { |
| "epoch": 2.9779411764705883, |
| "grad_norm": 0.6031497666783858, |
| "learning_rate": 2.8438910835693314e-05, |
| "loss": 0.2387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2477431297302246, |
| "step": 2835, |
| "valid_targets_mean": 2889.0, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 2.9831932773109244, |
| "grad_norm": 0.7153376315518947, |
| "learning_rate": 2.8391387620369192e-05, |
| "loss": 0.2448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25468868017196655, |
| "step": 2840, |
| "valid_targets_mean": 2295.2, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 2.9884453781512605, |
| "grad_norm": 0.6969521384499777, |
| "learning_rate": 2.834380683385714e-05, |
| "loss": 0.2429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.220721036195755, |
| "step": 2845, |
| "valid_targets_mean": 2244.9, |
| "valid_targets_min": 1073 |
| }, |
| { |
| "epoch": 2.9936974789915967, |
| "grad_norm": 0.7414684846578835, |
| "learning_rate": 2.8296168802596892e-05, |
| "loss": 0.2391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23130197823047638, |
| "step": 2850, |
| "valid_targets_mean": 1981.4, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 2.9989495798319328, |
| "grad_norm": 0.7478026755802675, |
| "learning_rate": 2.8248473853420933e-05, |
| "loss": 0.2411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2313975691795349, |
| "step": 2855, |
| "valid_targets_mean": 1840.1, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 3.004201680672269, |
| "grad_norm": 0.6438849416484059, |
| "learning_rate": 2.8200722313552247e-05, |
| "loss": 0.2094, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20280009508132935, |
| "step": 2860, |
| "valid_targets_mean": 2363.8, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 3.009453781512605, |
| "grad_norm": 0.6700105099862343, |
| "learning_rate": 2.8152914510602073e-05, |
| "loss": 0.2048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21491551399230957, |
| "step": 2865, |
| "valid_targets_mean": 2595.0, |
| "valid_targets_min": 557 |
| }, |
| { |
| "epoch": 3.014705882352941, |
| "grad_norm": 0.6973369056653054, |
| "learning_rate": 2.810505077256765e-05, |
| "loss": 0.2078, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19096165895462036, |
| "step": 2870, |
| "valid_targets_mean": 2309.4, |
| "valid_targets_min": 666 |
| }, |
| { |
| "epoch": 3.0199579831932772, |
| "grad_norm": 0.7391770624716282, |
| "learning_rate": 2.8057131427829983e-05, |
| "loss": 0.2055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22697217762470245, |
| "step": 2875, |
| "valid_targets_mean": 2748.4, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 3.0252100840336134, |
| "grad_norm": 0.7323248663686152, |
| "learning_rate": 2.800915680515157e-05, |
| "loss": 0.2135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21774935722351074, |
| "step": 2880, |
| "valid_targets_mean": 2176.5, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 3.0304621848739495, |
| "grad_norm": 0.7293920324073403, |
| "learning_rate": 2.7961127233674167e-05, |
| "loss": 0.2025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19380387663841248, |
| "step": 2885, |
| "valid_targets_mean": 2121.6, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 3.0357142857142856, |
| "grad_norm": 0.7214083612213081, |
| "learning_rate": 2.7913043042916513e-05, |
| "loss": 0.2057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2048916071653366, |
| "step": 2890, |
| "valid_targets_mean": 2635.6, |
| "valid_targets_min": 916 |
| }, |
| { |
| "epoch": 3.0409663865546217, |
| "grad_norm": 0.6608114815054316, |
| "learning_rate": 2.786490456277208e-05, |
| "loss": 0.2103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21670818328857422, |
| "step": 2895, |
| "valid_targets_mean": 2556.7, |
| "valid_targets_min": 762 |
| }, |
| { |
| "epoch": 3.046218487394958, |
| "grad_norm": 0.66860146042256, |
| "learning_rate": 2.7816712123506796e-05, |
| "loss": 0.1965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20460188388824463, |
| "step": 2900, |
| "valid_targets_mean": 2566.9, |
| "valid_targets_min": 420 |
| }, |
| { |
| "epoch": 3.051470588235294, |
| "grad_norm": 0.7008326884337155, |
| "learning_rate": 2.776846605575681e-05, |
| "loss": 0.2132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.201397106051445, |
| "step": 2905, |
| "valid_targets_mean": 2224.4, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 3.05672268907563, |
| "grad_norm": 0.7720626933651689, |
| "learning_rate": 2.772016669052618e-05, |
| "loss": 0.2133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2363039255142212, |
| "step": 2910, |
| "valid_targets_mean": 2557.2, |
| "valid_targets_min": 1106 |
| }, |
| { |
| "epoch": 3.0619747899159666, |
| "grad_norm": 0.7021404124625371, |
| "learning_rate": 2.767181435918464e-05, |
| "loss": 0.1966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20766621828079224, |
| "step": 2915, |
| "valid_targets_mean": 2482.2, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 3.0672268907563027, |
| "grad_norm": 0.6343762530485658, |
| "learning_rate": 2.7623409393465298e-05, |
| "loss": 0.2071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19036218523979187, |
| "step": 2920, |
| "valid_targets_mean": 3076.4, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 3.072478991596639, |
| "grad_norm": 0.7035625376410721, |
| "learning_rate": 2.7574952125462386e-05, |
| "loss": 0.1964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18567273020744324, |
| "step": 2925, |
| "valid_targets_mean": 2296.6, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 3.077731092436975, |
| "grad_norm": 0.6382148687024268, |
| "learning_rate": 2.7526442887628962e-05, |
| "loss": 0.2128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19346240162849426, |
| "step": 2930, |
| "valid_targets_mean": 2762.5, |
| "valid_targets_min": 937 |
| }, |
| { |
| "epoch": 3.082983193277311, |
| "grad_norm": 0.7008906642109496, |
| "learning_rate": 2.7477882012774633e-05, |
| "loss": 0.2187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21867555379867554, |
| "step": 2935, |
| "valid_targets_mean": 2581.9, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 3.088235294117647, |
| "grad_norm": 0.708331450124728, |
| "learning_rate": 2.742926983406328e-05, |
| "loss": 0.2003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22323349118232727, |
| "step": 2940, |
| "valid_targets_mean": 2543.1, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 3.0934873949579833, |
| "grad_norm": 0.7455067327316252, |
| "learning_rate": 2.7380606685010767e-05, |
| "loss": 0.2035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21157895028591156, |
| "step": 2945, |
| "valid_targets_mean": 2247.4, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 3.0987394957983194, |
| "grad_norm": 0.6753873272175467, |
| "learning_rate": 2.7331892899482654e-05, |
| "loss": 0.2167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2144676148891449, |
| "step": 2950, |
| "valid_targets_mean": 2689.9, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 3.1039915966386555, |
| "grad_norm": 0.6865230940428809, |
| "learning_rate": 2.7283128811691893e-05, |
| "loss": 0.2062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2236787974834442, |
| "step": 2955, |
| "valid_targets_mean": 2606.0, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 3.1092436974789917, |
| "grad_norm": 0.6404580815887296, |
| "learning_rate": 2.7234314756196564e-05, |
| "loss": 0.1962, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.197324737906456, |
| "step": 2960, |
| "valid_targets_mean": 2785.6, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 3.1144957983193278, |
| "grad_norm": 0.7140771160670712, |
| "learning_rate": 2.718545106789755e-05, |
| "loss": 0.2037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19954288005828857, |
| "step": 2965, |
| "valid_targets_mean": 2234.5, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 3.119747899159664, |
| "grad_norm": 0.6975932021440397, |
| "learning_rate": 2.713653808203626e-05, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2170845866203308, |
| "step": 2970, |
| "valid_targets_mean": 2639.3, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 3.125, |
| "grad_norm": 0.7113689274916534, |
| "learning_rate": 2.7087576134192305e-05, |
| "loss": 0.2064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21494010090827942, |
| "step": 2975, |
| "valid_targets_mean": 2403.4, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 3.130252100840336, |
| "grad_norm": 0.6838797403752815, |
| "learning_rate": 2.7038565560281252e-05, |
| "loss": 0.2072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22361846268177032, |
| "step": 2980, |
| "valid_targets_mean": 2727.6, |
| "valid_targets_min": 1111 |
| }, |
| { |
| "epoch": 3.1355042016806722, |
| "grad_norm": 0.7301967352422043, |
| "learning_rate": 2.6989506696552224e-05, |
| "loss": 0.2226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24528783559799194, |
| "step": 2985, |
| "valid_targets_mean": 2384.6, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 3.1407563025210083, |
| "grad_norm": 0.7300962730703254, |
| "learning_rate": 2.6940399879585685e-05, |
| "loss": 0.2226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24462322890758514, |
| "step": 2990, |
| "valid_targets_mean": 2379.9, |
| "valid_targets_min": 747 |
| }, |
| { |
| "epoch": 3.1460084033613445, |
| "grad_norm": 0.6314374147339737, |
| "learning_rate": 2.6891245446291093e-05, |
| "loss": 0.1947, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20750781893730164, |
| "step": 2995, |
| "valid_targets_mean": 3385.5, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 3.1512605042016806, |
| "grad_norm": 0.6709712599868535, |
| "learning_rate": 2.6842043733904578e-05, |
| "loss": 0.2019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19627419114112854, |
| "step": 3000, |
| "valid_targets_mean": 2626.9, |
| "valid_targets_min": 1022 |
| }, |
| { |
| "epoch": 3.1565126050420167, |
| "grad_norm": 0.7079636790584424, |
| "learning_rate": 2.6792795079986634e-05, |
| "loss": 0.2089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21414107084274292, |
| "step": 3005, |
| "valid_targets_mean": 2522.1, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 3.161764705882353, |
| "grad_norm": 0.8013316017451616, |
| "learning_rate": 2.6743499822419833e-05, |
| "loss": 0.2065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21229714155197144, |
| "step": 3010, |
| "valid_targets_mean": 1945.2, |
| "valid_targets_min": 1078 |
| }, |
| { |
| "epoch": 3.167016806722689, |
| "grad_norm": 0.7573033558532629, |
| "learning_rate": 2.669415829940646e-05, |
| "loss": 0.2004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22666743397712708, |
| "step": 3015, |
| "valid_targets_mean": 2352.1, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 3.172268907563025, |
| "grad_norm": 0.6967416593034284, |
| "learning_rate": 2.6644770849466226e-05, |
| "loss": 0.2107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19799959659576416, |
| "step": 3020, |
| "valid_targets_mean": 2473.9, |
| "valid_targets_min": 926 |
| }, |
| { |
| "epoch": 3.177521008403361, |
| "grad_norm": 0.6958940312721166, |
| "learning_rate": 2.6595337811433925e-05, |
| "loss": 0.2213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21963286399841309, |
| "step": 3025, |
| "valid_targets_mean": 2855.2, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 3.1827731092436973, |
| "grad_norm": 0.6644738321935247, |
| "learning_rate": 2.654585952445714e-05, |
| "loss": 0.2058, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19399645924568176, |
| "step": 3030, |
| "valid_targets_mean": 2638.8, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 3.1880252100840334, |
| "grad_norm": 0.7306469351103843, |
| "learning_rate": 2.6496336327993882e-05, |
| "loss": 0.2144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20161199569702148, |
| "step": 3035, |
| "valid_targets_mean": 2136.2, |
| "valid_targets_min": 711 |
| }, |
| { |
| "epoch": 3.19327731092437, |
| "grad_norm": 0.7466263828328548, |
| "learning_rate": 2.6446768561810264e-05, |
| "loss": 0.209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20817327499389648, |
| "step": 3040, |
| "valid_targets_mean": 2153.1, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 3.198529411764706, |
| "grad_norm": 0.6197811979812847, |
| "learning_rate": 2.6397156565978198e-05, |
| "loss": 0.2048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18749669194221497, |
| "step": 3045, |
| "valid_targets_mean": 2755.1, |
| "valid_targets_min": 823 |
| }, |
| { |
| "epoch": 3.203781512605042, |
| "grad_norm": 0.6980373354580599, |
| "learning_rate": 2.6347500680873043e-05, |
| "loss": 0.2155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20377440750598907, |
| "step": 3050, |
| "valid_targets_mean": 2491.8, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 3.2090336134453783, |
| "grad_norm": 0.7085865520639477, |
| "learning_rate": 2.6297801247171258e-05, |
| "loss": 0.2129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2216644287109375, |
| "step": 3055, |
| "valid_targets_mean": 2806.9, |
| "valid_targets_min": 1071 |
| }, |
| { |
| "epoch": 3.2142857142857144, |
| "grad_norm": 0.7205089790035474, |
| "learning_rate": 2.6248058605848097e-05, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22407683730125427, |
| "step": 3060, |
| "valid_targets_mean": 2472.9, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 3.2195378151260505, |
| "grad_norm": 0.737404594127863, |
| "learning_rate": 2.6198273098175234e-05, |
| "loss": 0.2204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20326296985149384, |
| "step": 3065, |
| "valid_targets_mean": 2019.1, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 3.2247899159663866, |
| "grad_norm": 0.6073130718222292, |
| "learning_rate": 2.614844506571844e-05, |
| "loss": 0.2108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20230062305927277, |
| "step": 3070, |
| "valid_targets_mean": 3304.4, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 3.2300420168067228, |
| "grad_norm": 0.7085944292327786, |
| "learning_rate": 2.609857485033525e-05, |
| "loss": 0.215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20458903908729553, |
| "step": 3075, |
| "valid_targets_mean": 2500.9, |
| "valid_targets_min": 902 |
| }, |
| { |
| "epoch": 3.235294117647059, |
| "grad_norm": 0.7171287135570944, |
| "learning_rate": 2.6048662794172595e-05, |
| "loss": 0.2095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20819462835788727, |
| "step": 3080, |
| "valid_targets_mean": 2273.6, |
| "valid_targets_min": 787 |
| }, |
| { |
| "epoch": 3.240546218487395, |
| "grad_norm": 0.7241451356443119, |
| "learning_rate": 2.599870923966447e-05, |
| "loss": 0.2064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2197907567024231, |
| "step": 3085, |
| "valid_targets_mean": 2637.4, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 3.245798319327731, |
| "grad_norm": 0.6305118521703866, |
| "learning_rate": 2.5948714529529565e-05, |
| "loss": 0.191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18660598993301392, |
| "step": 3090, |
| "valid_targets_mean": 3157.4, |
| "valid_targets_min": 1567 |
| }, |
| { |
| "epoch": 3.2510504201680672, |
| "grad_norm": 0.6893413514689206, |
| "learning_rate": 2.5898679006768958e-05, |
| "loss": 0.2081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19289371371269226, |
| "step": 3095, |
| "valid_targets_mean": 2322.9, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 3.2563025210084033, |
| "grad_norm": 0.7101789326050002, |
| "learning_rate": 2.5848603014663702e-05, |
| "loss": 0.2077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2187972515821457, |
| "step": 3100, |
| "valid_targets_mean": 2543.6, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 3.2615546218487395, |
| "grad_norm": 0.9990787057867775, |
| "learning_rate": 2.579848689677252e-05, |
| "loss": 0.2064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21138152480125427, |
| "step": 3105, |
| "valid_targets_mean": 2269.6, |
| "valid_targets_min": 982 |
| }, |
| { |
| "epoch": 3.2668067226890756, |
| "grad_norm": 0.8018203500723405, |
| "learning_rate": 2.5748330996929414e-05, |
| "loss": 0.2023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20356349647045135, |
| "step": 3110, |
| "valid_targets_mean": 1958.8, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 3.2720588235294117, |
| "grad_norm": 0.6603494412466163, |
| "learning_rate": 2.5698135659241334e-05, |
| "loss": 0.2031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18327882885932922, |
| "step": 3115, |
| "valid_targets_mean": 2493.4, |
| "valid_targets_min": 626 |
| }, |
| { |
| "epoch": 3.277310924369748, |
| "grad_norm": 0.762235597580697, |
| "learning_rate": 2.564790122808579e-05, |
| "loss": 0.2019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20926137268543243, |
| "step": 3120, |
| "valid_targets_mean": 2595.1, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 3.282563025210084, |
| "grad_norm": 0.6535295283093114, |
| "learning_rate": 2.5597628048108504e-05, |
| "loss": 0.2168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19361212849617004, |
| "step": 3125, |
| "valid_targets_mean": 2594.5, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 3.28781512605042, |
| "grad_norm": 0.7359578809709093, |
| "learning_rate": 2.5547316464221058e-05, |
| "loss": 0.2171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24306191504001617, |
| "step": 3130, |
| "valid_targets_mean": 2595.2, |
| "valid_targets_min": 762 |
| }, |
| { |
| "epoch": 3.293067226890756, |
| "grad_norm": 0.7555698425148304, |
| "learning_rate": 2.5496966821598493e-05, |
| "loss": 0.2028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18649283051490784, |
| "step": 3135, |
| "valid_targets_mean": 2025.6, |
| "valid_targets_min": 1099 |
| }, |
| { |
| "epoch": 3.2983193277310923, |
| "grad_norm": 0.6867271312637763, |
| "learning_rate": 2.5446579465676977e-05, |
| "loss": 0.1993, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2280460000038147, |
| "step": 3140, |
| "valid_targets_mean": 2837.4, |
| "valid_targets_min": 940 |
| }, |
| { |
| "epoch": 3.3035714285714284, |
| "grad_norm": 0.7890879070663028, |
| "learning_rate": 2.5396154742151407e-05, |
| "loss": 0.2058, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24599486589431763, |
| "step": 3145, |
| "valid_targets_mean": 2421.9, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 3.3088235294117645, |
| "grad_norm": 0.7043690415607949, |
| "learning_rate": 2.5345692996973075e-05, |
| "loss": 0.2029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20645210146903992, |
| "step": 3150, |
| "valid_targets_mean": 2250.8, |
| "valid_targets_min": 654 |
| }, |
| { |
| "epoch": 3.314075630252101, |
| "grad_norm": 0.6920998160391696, |
| "learning_rate": 2.5295194576347233e-05, |
| "loss": 0.2121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22358179092407227, |
| "step": 3155, |
| "valid_targets_mean": 2739.9, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 3.3193277310924367, |
| "grad_norm": 0.8209408504141388, |
| "learning_rate": 2.5244659826730774e-05, |
| "loss": 0.2082, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22088845074176788, |
| "step": 3160, |
| "valid_targets_mean": 2667.9, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 3.3245798319327733, |
| "grad_norm": 0.73587278467102, |
| "learning_rate": 2.519408909482984e-05, |
| "loss": 0.2101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20288720726966858, |
| "step": 3165, |
| "valid_targets_mean": 2124.1, |
| "valid_targets_min": 917 |
| }, |
| { |
| "epoch": 3.3298319327731094, |
| "grad_norm": 0.6501152833208236, |
| "learning_rate": 2.5143482727597427e-05, |
| "loss": 0.2008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20123985409736633, |
| "step": 3170, |
| "valid_targets_mean": 3260.6, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 3.3350840336134455, |
| "grad_norm": 0.6791329217706075, |
| "learning_rate": 2.509284107223102e-05, |
| "loss": 0.1986, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21437102556228638, |
| "step": 3175, |
| "valid_targets_mean": 2677.3, |
| "valid_targets_min": 1019 |
| }, |
| { |
| "epoch": 3.3403361344537816, |
| "grad_norm": 0.8312153231004512, |
| "learning_rate": 2.50421644761702e-05, |
| "loss": 0.2154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2082928568124771, |
| "step": 3180, |
| "valid_targets_mean": 1766.3, |
| "valid_targets_min": 947 |
| }, |
| { |
| "epoch": 3.3455882352941178, |
| "grad_norm": 0.6346713038488362, |
| "learning_rate": 2.499145328709429e-05, |
| "loss": 0.2047, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2058856189250946, |
| "step": 3185, |
| "valid_targets_mean": 2967.8, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 3.350840336134454, |
| "grad_norm": 0.7841149043918871, |
| "learning_rate": 2.4940707852919924e-05, |
| "loss": 0.2103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21573182940483093, |
| "step": 3190, |
| "valid_targets_mean": 1853.8, |
| "valid_targets_min": 1039 |
| }, |
| { |
| "epoch": 3.35609243697479, |
| "grad_norm": 0.7289604889723915, |
| "learning_rate": 2.488992852179868e-05, |
| "loss": 0.2001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21095168590545654, |
| "step": 3195, |
| "valid_targets_mean": 2192.4, |
| "valid_targets_min": 1030 |
| }, |
| { |
| "epoch": 3.361344537815126, |
| "grad_norm": 0.7426897994171837, |
| "learning_rate": 2.483911564211472e-05, |
| "loss": 0.2013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2094847857952118, |
| "step": 3200, |
| "valid_targets_mean": 2182.3, |
| "valid_targets_min": 1090 |
| }, |
| { |
| "epoch": 3.366596638655462, |
| "grad_norm": 0.6905790936704768, |
| "learning_rate": 2.4788269562482355e-05, |
| "loss": 0.2038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18250685930252075, |
| "step": 3205, |
| "valid_targets_mean": 2181.2, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 3.3718487394957983, |
| "grad_norm": 0.6711044771695471, |
| "learning_rate": 2.4737390631743675e-05, |
| "loss": 0.217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21213862299919128, |
| "step": 3210, |
| "valid_targets_mean": 2841.9, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 3.3771008403361344, |
| "grad_norm": 0.7172706019446755, |
| "learning_rate": 2.4686479198966146e-05, |
| "loss": 0.2113, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21013203263282776, |
| "step": 3215, |
| "valid_targets_mean": 2435.9, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 3.3823529411764706, |
| "grad_norm": 0.746681881677102, |
| "learning_rate": 2.463553561344024e-05, |
| "loss": 0.2193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2209860384464264, |
| "step": 3220, |
| "valid_targets_mean": 2233.9, |
| "valid_targets_min": 929 |
| }, |
| { |
| "epoch": 3.3876050420168067, |
| "grad_norm": 0.7545727322641577, |
| "learning_rate": 2.4584560224677013e-05, |
| "loss": 0.2176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2379944920539856, |
| "step": 3225, |
| "valid_targets_mean": 2649.4, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 3.392857142857143, |
| "grad_norm": 0.6782835854882808, |
| "learning_rate": 2.4533553382405702e-05, |
| "loss": 0.211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20617589354515076, |
| "step": 3230, |
| "valid_targets_mean": 2802.6, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 3.398109243697479, |
| "grad_norm": 0.7578767328316001, |
| "learning_rate": 2.4482515436571365e-05, |
| "loss": 0.2172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22788771986961365, |
| "step": 3235, |
| "valid_targets_mean": 2326.2, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 3.403361344537815, |
| "grad_norm": 0.6541735808021184, |
| "learning_rate": 2.4431446737332437e-05, |
| "loss": 0.2121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20903077721595764, |
| "step": 3240, |
| "valid_targets_mean": 3203.4, |
| "valid_targets_min": 1003 |
| }, |
| { |
| "epoch": 3.408613445378151, |
| "grad_norm": 0.7811038952636883, |
| "learning_rate": 2.438034763505833e-05, |
| "loss": 0.2166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21477511525154114, |
| "step": 3245, |
| "valid_targets_mean": 1979.8, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 3.4138655462184873, |
| "grad_norm": 0.6625538840028757, |
| "learning_rate": 2.432921848032707e-05, |
| "loss": 0.2044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2320900559425354, |
| "step": 3250, |
| "valid_targets_mean": 2910.2, |
| "valid_targets_min": 1315 |
| }, |
| { |
| "epoch": 3.4191176470588234, |
| "grad_norm": 0.7485969796152663, |
| "learning_rate": 2.427805962392286e-05, |
| "loss": 0.2025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20698726177215576, |
| "step": 3255, |
| "valid_targets_mean": 1875.1, |
| "valid_targets_min": 863 |
| }, |
| { |
| "epoch": 3.4243697478991595, |
| "grad_norm": 0.7348995050217967, |
| "learning_rate": 2.4226871416833683e-05, |
| "loss": 0.1988, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20574046671390533, |
| "step": 3260, |
| "valid_targets_mean": 2167.6, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 3.4296218487394956, |
| "grad_norm": 0.6743471501486973, |
| "learning_rate": 2.4175654210248848e-05, |
| "loss": 0.2121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19565929472446442, |
| "step": 3265, |
| "valid_targets_mean": 2611.9, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 3.434873949579832, |
| "grad_norm": 0.6301404143473273, |
| "learning_rate": 2.4124408355556677e-05, |
| "loss": 0.2177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22094877064228058, |
| "step": 3270, |
| "valid_targets_mean": 3081.8, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 3.440126050420168, |
| "grad_norm": 0.6526940719618316, |
| "learning_rate": 2.4073134204342014e-05, |
| "loss": 0.2089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20152367651462555, |
| "step": 3275, |
| "valid_targets_mean": 2381.3, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 3.4453781512605044, |
| "grad_norm": 0.6659235538473005, |
| "learning_rate": 2.4021832108383837e-05, |
| "loss": 0.2207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20738565921783447, |
| "step": 3280, |
| "valid_targets_mean": 2625.6, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 3.4506302521008405, |
| "grad_norm": 0.7166624142705825, |
| "learning_rate": 2.3970502419652854e-05, |
| "loss": 0.2073, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19094321131706238, |
| "step": 3285, |
| "valid_targets_mean": 2041.8, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 3.4558823529411766, |
| "grad_norm": 0.7984671258808161, |
| "learning_rate": 2.3919145490309076e-05, |
| "loss": 0.2116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21888110041618347, |
| "step": 3290, |
| "valid_targets_mean": 1798.3, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 3.4611344537815127, |
| "grad_norm": 0.6963556467492686, |
| "learning_rate": 2.38677616726994e-05, |
| "loss": 0.1958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17585915327072144, |
| "step": 3295, |
| "valid_targets_mean": 2040.5, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 3.466386554621849, |
| "grad_norm": 0.5743174603598479, |
| "learning_rate": 2.381635131935521e-05, |
| "loss": 0.205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1667209416627884, |
| "step": 3300, |
| "valid_targets_mean": 3134.2, |
| "valid_targets_min": 522 |
| }, |
| { |
| "epoch": 3.471638655462185, |
| "grad_norm": 0.7243626640826193, |
| "learning_rate": 2.3764914782989926e-05, |
| "loss": 0.2135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22822029888629913, |
| "step": 3305, |
| "valid_targets_mean": 2619.9, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 3.476890756302521, |
| "grad_norm": 0.669561945697959, |
| "learning_rate": 2.3713452416496625e-05, |
| "loss": 0.2097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20612934231758118, |
| "step": 3310, |
| "valid_targets_mean": 2525.0, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 3.482142857142857, |
| "grad_norm": 0.7414140882682606, |
| "learning_rate": 2.366196457294558e-05, |
| "loss": 0.2137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21093863248825073, |
| "step": 3315, |
| "valid_targets_mean": 2090.9, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 3.4873949579831933, |
| "grad_norm": 0.6133977770277803, |
| "learning_rate": 2.3610451605581858e-05, |
| "loss": 0.2061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1882474273443222, |
| "step": 3320, |
| "valid_targets_mean": 3069.8, |
| "valid_targets_min": 891 |
| }, |
| { |
| "epoch": 3.4926470588235294, |
| "grad_norm": 0.6648952110036311, |
| "learning_rate": 2.3558913867822905e-05, |
| "loss": 0.2057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20279830694198608, |
| "step": 3325, |
| "valid_targets_mean": 2729.6, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 3.4978991596638656, |
| "grad_norm": 0.7839692483507994, |
| "learning_rate": 2.3507351713256105e-05, |
| "loss": 0.2052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21825388073921204, |
| "step": 3330, |
| "valid_targets_mean": 1961.4, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 3.5031512605042017, |
| "grad_norm": 0.6420384291551596, |
| "learning_rate": 2.3455765495636353e-05, |
| "loss": 0.2015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20120246708393097, |
| "step": 3335, |
| "valid_targets_mean": 2840.8, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 3.508403361344538, |
| "grad_norm": 0.7332433509193245, |
| "learning_rate": 2.3404155568883643e-05, |
| "loss": 0.214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23752212524414062, |
| "step": 3340, |
| "valid_targets_mean": 2502.9, |
| "valid_targets_min": 1052 |
| }, |
| { |
| "epoch": 3.513655462184874, |
| "grad_norm": 0.7036254623505526, |
| "learning_rate": 2.3352522287080625e-05, |
| "loss": 0.2107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22437232732772827, |
| "step": 3345, |
| "valid_targets_mean": 2470.9, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 3.51890756302521, |
| "grad_norm": 0.674241478442284, |
| "learning_rate": 2.3300866004470182e-05, |
| "loss": 0.2121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23106199502944946, |
| "step": 3350, |
| "valid_targets_mean": 2678.7, |
| "valid_targets_min": 1190 |
| }, |
| { |
| "epoch": 3.524159663865546, |
| "grad_norm": 0.6913901681322876, |
| "learning_rate": 2.324918707545302e-05, |
| "loss": 0.2085, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20624200999736786, |
| "step": 3355, |
| "valid_targets_mean": 2525.9, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 3.5294117647058822, |
| "grad_norm": 0.7215505447514452, |
| "learning_rate": 2.3197485854585183e-05, |
| "loss": 0.2074, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18115992844104767, |
| "step": 3360, |
| "valid_targets_mean": 1991.8, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 3.5346638655462184, |
| "grad_norm": 0.6339782709302462, |
| "learning_rate": 2.3145762696575675e-05, |
| "loss": 0.2014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20273572206497192, |
| "step": 3365, |
| "valid_targets_mean": 3340.9, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 3.5399159663865545, |
| "grad_norm": 0.6976739706673805, |
| "learning_rate": 2.3094017956283995e-05, |
| "loss": 0.1995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2007465362548828, |
| "step": 3370, |
| "valid_targets_mean": 2454.3, |
| "valid_targets_min": 943 |
| }, |
| { |
| "epoch": 3.5451680672268906, |
| "grad_norm": 0.6726999837744964, |
| "learning_rate": 2.3042251988717728e-05, |
| "loss": 0.2006, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16553646326065063, |
| "step": 3375, |
| "valid_targets_mean": 2192.6, |
| "valid_targets_min": 643 |
| }, |
| { |
| "epoch": 3.5504201680672267, |
| "grad_norm": 0.7301827373994265, |
| "learning_rate": 2.2990465149030077e-05, |
| "loss": 0.2013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19199733436107635, |
| "step": 3380, |
| "valid_targets_mean": 2214.3, |
| "valid_targets_min": 897 |
| }, |
| { |
| "epoch": 3.5556722689075633, |
| "grad_norm": 0.6670894246533184, |
| "learning_rate": 2.2938657792517446e-05, |
| "loss": 0.221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2090798318386078, |
| "step": 3385, |
| "valid_targets_mean": 2772.3, |
| "valid_targets_min": 660 |
| }, |
| { |
| "epoch": 3.560924369747899, |
| "grad_norm": 0.7737810251679192, |
| "learning_rate": 2.2886830274617017e-05, |
| "loss": 0.2142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24221691489219666, |
| "step": 3390, |
| "valid_targets_mean": 2221.1, |
| "valid_targets_min": 861 |
| }, |
| { |
| "epoch": 3.5661764705882355, |
| "grad_norm": 0.6681259679390096, |
| "learning_rate": 2.2834982950904267e-05, |
| "loss": 0.2107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19659334421157837, |
| "step": 3395, |
| "valid_targets_mean": 2447.6, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 3.571428571428571, |
| "grad_norm": 0.8318412772228536, |
| "learning_rate": 2.2783116177090573e-05, |
| "loss": 0.2149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22690819203853607, |
| "step": 3400, |
| "valid_targets_mean": 2100.6, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 3.5766806722689077, |
| "grad_norm": 0.6541716254669749, |
| "learning_rate": 2.2731230309020762e-05, |
| "loss": 0.2164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19614872336387634, |
| "step": 3405, |
| "valid_targets_mean": 2690.9, |
| "valid_targets_min": 896 |
| }, |
| { |
| "epoch": 3.581932773109244, |
| "grad_norm": 0.735048933666179, |
| "learning_rate": 2.2679325702670642e-05, |
| "loss": 0.2098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22025522589683533, |
| "step": 3410, |
| "valid_targets_mean": 2054.1, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 3.58718487394958, |
| "grad_norm": 0.7432848251883631, |
| "learning_rate": 2.2627402714144586e-05, |
| "loss": 0.2058, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21356913447380066, |
| "step": 3415, |
| "valid_targets_mean": 2400.3, |
| "valid_targets_min": 940 |
| }, |
| { |
| "epoch": 3.592436974789916, |
| "grad_norm": 0.6273611826621119, |
| "learning_rate": 2.2575461699673085e-05, |
| "loss": 0.2052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21526393294334412, |
| "step": 3420, |
| "valid_targets_mean": 3208.0, |
| "valid_targets_min": 1402 |
| }, |
| { |
| "epoch": 3.597689075630252, |
| "grad_norm": 0.6901843944101652, |
| "learning_rate": 2.2523503015610303e-05, |
| "loss": 0.2088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21407434344291687, |
| "step": 3425, |
| "valid_targets_mean": 2472.9, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 3.6029411764705883, |
| "grad_norm": 0.6750339364655951, |
| "learning_rate": 2.2471527018431637e-05, |
| "loss": 0.2146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2302270233631134, |
| "step": 3430, |
| "valid_targets_mean": 3292.7, |
| "valid_targets_min": 943 |
| }, |
| { |
| "epoch": 3.6081932773109244, |
| "grad_norm": 0.6870012851485073, |
| "learning_rate": 2.2419534064731238e-05, |
| "loss": 0.2054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2101989984512329, |
| "step": 3435, |
| "valid_targets_mean": 2430.9, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 3.6134453781512605, |
| "grad_norm": 0.7652411173135991, |
| "learning_rate": 2.236752451121963e-05, |
| "loss": 0.2181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20987604558467865, |
| "step": 3440, |
| "valid_targets_mean": 2773.8, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 3.6186974789915967, |
| "grad_norm": 0.96702355486614, |
| "learning_rate": 2.2315498714721198e-05, |
| "loss": 0.2094, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2208380401134491, |
| "step": 3445, |
| "valid_targets_mean": 2227.6, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 3.6239495798319328, |
| "grad_norm": 0.7568581037232849, |
| "learning_rate": 2.2263457032171762e-05, |
| "loss": 0.2144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20502294600009918, |
| "step": 3450, |
| "valid_targets_mean": 1974.8, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 3.629201680672269, |
| "grad_norm": 0.6324142287116146, |
| "learning_rate": 2.2211399820616154e-05, |
| "loss": 0.2017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1848364919424057, |
| "step": 3455, |
| "valid_targets_mean": 2530.7, |
| "valid_targets_min": 1356 |
| }, |
| { |
| "epoch": 3.634453781512605, |
| "grad_norm": 0.6787789057247168, |
| "learning_rate": 2.2159327437205733e-05, |
| "loss": 0.2202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20259186625480652, |
| "step": 3460, |
| "valid_targets_mean": 2469.3, |
| "valid_targets_min": 843 |
| }, |
| { |
| "epoch": 3.639705882352941, |
| "grad_norm": 0.6108458629326181, |
| "learning_rate": 2.210724023919595e-05, |
| "loss": 0.21, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21205033361911774, |
| "step": 3465, |
| "valid_targets_mean": 3304.5, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 3.6449579831932772, |
| "grad_norm": 0.7630702002273175, |
| "learning_rate": 2.205513858394389e-05, |
| "loss": 0.2093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22506915032863617, |
| "step": 3470, |
| "valid_targets_mean": 2128.4, |
| "valid_targets_min": 982 |
| }, |
| { |
| "epoch": 3.6502100840336134, |
| "grad_norm": 0.6853988147626505, |
| "learning_rate": 2.2003022828905832e-05, |
| "loss": 0.2047, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2102399468421936, |
| "step": 3475, |
| "valid_targets_mean": 2369.8, |
| "valid_targets_min": 942 |
| }, |
| { |
| "epoch": 3.6554621848739495, |
| "grad_norm": 0.8205924816380262, |
| "learning_rate": 2.19508933316348e-05, |
| "loss": 0.2094, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2225526124238968, |
| "step": 3480, |
| "valid_targets_mean": 2051.9, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 3.6607142857142856, |
| "grad_norm": 0.7855685679107322, |
| "learning_rate": 2.189875044977808e-05, |
| "loss": 0.2142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21352198719978333, |
| "step": 3485, |
| "valid_targets_mean": 2024.9, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 3.6659663865546217, |
| "grad_norm": 0.6891565684644114, |
| "learning_rate": 2.1846594541074796e-05, |
| "loss": 0.2067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19370394945144653, |
| "step": 3490, |
| "valid_targets_mean": 2303.7, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 3.671218487394958, |
| "grad_norm": 0.66281123426459, |
| "learning_rate": 2.179442596335345e-05, |
| "loss": 0.2158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21961744129657745, |
| "step": 3495, |
| "valid_targets_mean": 2835.9, |
| "valid_targets_min": 771 |
| }, |
| { |
| "epoch": 3.6764705882352944, |
| "grad_norm": 0.6917997631532197, |
| "learning_rate": 2.174224507452945e-05, |
| "loss": 0.2227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20729771256446838, |
| "step": 3500, |
| "valid_targets_mean": 2409.9, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 3.68172268907563, |
| "grad_norm": 0.7215177976056998, |
| "learning_rate": 2.1690052232602677e-05, |
| "loss": 0.2213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24402323365211487, |
| "step": 3505, |
| "valid_targets_mean": 2753.1, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 3.6869747899159666, |
| "grad_norm": 0.6763541211099533, |
| "learning_rate": 2.1637847795655022e-05, |
| "loss": 0.2118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21992330253124237, |
| "step": 3510, |
| "valid_targets_mean": 2720.9, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 3.6922268907563023, |
| "grad_norm": 0.6816841950766274, |
| "learning_rate": 2.1585632121847925e-05, |
| "loss": 0.2169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19951927661895752, |
| "step": 3515, |
| "valid_targets_mean": 2837.1, |
| "valid_targets_min": 743 |
| }, |
| { |
| "epoch": 3.697478991596639, |
| "grad_norm": 0.695061597525997, |
| "learning_rate": 2.153340556941991e-05, |
| "loss": 0.2147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23091833293437958, |
| "step": 3520, |
| "valid_targets_mean": 2830.2, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 3.7027310924369745, |
| "grad_norm": 0.7145487481152861, |
| "learning_rate": 2.1481168496684145e-05, |
| "loss": 0.2152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22669626772403717, |
| "step": 3525, |
| "valid_targets_mean": 2385.2, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 3.707983193277311, |
| "grad_norm": 0.773517958966538, |
| "learning_rate": 2.142892126202597e-05, |
| "loss": 0.2083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20061250030994415, |
| "step": 3530, |
| "valid_targets_mean": 1901.8, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 3.713235294117647, |
| "grad_norm": 0.6514006030844219, |
| "learning_rate": 2.137666422390045e-05, |
| "loss": 0.2088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21307383477687836, |
| "step": 3535, |
| "valid_targets_mean": 2973.2, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 3.7184873949579833, |
| "grad_norm": 0.6294462036244911, |
| "learning_rate": 2.132439774082991e-05, |
| "loss": 0.2197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2212301641702652, |
| "step": 3540, |
| "valid_targets_mean": 3056.4, |
| "valid_targets_min": 1194 |
| }, |
| { |
| "epoch": 3.7237394957983194, |
| "grad_norm": 0.654887046400427, |
| "learning_rate": 2.1272122171401467e-05, |
| "loss": 0.1945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18347257375717163, |
| "step": 3545, |
| "valid_targets_mean": 2574.4, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 3.7289915966386555, |
| "grad_norm": 0.6809633747210387, |
| "learning_rate": 2.1219837874264573e-05, |
| "loss": 0.2024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18207016587257385, |
| "step": 3550, |
| "valid_targets_mean": 2467.8, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 3.7342436974789917, |
| "grad_norm": 0.8490088878626119, |
| "learning_rate": 2.116754520812857e-05, |
| "loss": 0.2161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21279117465019226, |
| "step": 3555, |
| "valid_targets_mean": 1938.0, |
| "valid_targets_min": 917 |
| }, |
| { |
| "epoch": 3.7394957983193278, |
| "grad_norm": 0.7362797471450374, |
| "learning_rate": 2.111524453176022e-05, |
| "loss": 0.2187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2274627536535263, |
| "step": 3560, |
| "valid_targets_mean": 2261.9, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 3.744747899159664, |
| "grad_norm": 0.7547351585834484, |
| "learning_rate": 2.1062936203981227e-05, |
| "loss": 0.2208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21145398914813995, |
| "step": 3565, |
| "valid_targets_mean": 2079.0, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 3.75, |
| "grad_norm": 0.6040282948873019, |
| "learning_rate": 2.10106205836658e-05, |
| "loss": 0.2067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17291516065597534, |
| "step": 3570, |
| "valid_targets_mean": 2807.0, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 3.755252100840336, |
| "grad_norm": 0.7692191031763723, |
| "learning_rate": 2.095829802973817e-05, |
| "loss": 0.2149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21016576886177063, |
| "step": 3575, |
| "valid_targets_mean": 2692.1, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 3.7605042016806722, |
| "grad_norm": 0.6937553318754113, |
| "learning_rate": 2.090596890117016e-05, |
| "loss": 0.211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20397567749023438, |
| "step": 3580, |
| "valid_targets_mean": 2325.8, |
| "valid_targets_min": 915 |
| }, |
| { |
| "epoch": 3.7657563025210083, |
| "grad_norm": 0.7298575781771081, |
| "learning_rate": 2.0853633556978674e-05, |
| "loss": 0.2089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2305256426334381, |
| "step": 3585, |
| "valid_targets_mean": 2357.3, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 3.7710084033613445, |
| "grad_norm": 0.8229634474031364, |
| "learning_rate": 2.0801292356223265e-05, |
| "loss": 0.2235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23045924305915833, |
| "step": 3590, |
| "valid_targets_mean": 1879.1, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 3.7762605042016806, |
| "grad_norm": 0.6135522966100759, |
| "learning_rate": 2.0748945658003695e-05, |
| "loss": 0.2116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20716413855552673, |
| "step": 3595, |
| "valid_targets_mean": 3463.8, |
| "valid_targets_min": 244 |
| }, |
| { |
| "epoch": 3.7815126050420167, |
| "grad_norm": 0.8109456213693356, |
| "learning_rate": 2.0696593821457392e-05, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21201831102371216, |
| "step": 3600, |
| "valid_targets_mean": 2110.6, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 3.786764705882353, |
| "grad_norm": 0.7309833863162327, |
| "learning_rate": 2.064423720575709e-05, |
| "loss": 0.2172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22593368589878082, |
| "step": 3605, |
| "valid_targets_mean": 2323.6, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 3.792016806722689, |
| "grad_norm": 0.6453442893544274, |
| "learning_rate": 2.0591876170108257e-05, |
| "loss": 0.2124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22857289016246796, |
| "step": 3610, |
| "valid_targets_mean": 2964.2, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 3.7972689075630255, |
| "grad_norm": 1.045593114030177, |
| "learning_rate": 2.0539511073746743e-05, |
| "loss": 0.1914, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2170926183462143, |
| "step": 3615, |
| "valid_targets_mean": 2493.9, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 3.802521008403361, |
| "grad_norm": 0.685780352452399, |
| "learning_rate": 2.0487142275936213e-05, |
| "loss": 0.2002, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1872934252023697, |
| "step": 3620, |
| "valid_targets_mean": 2356.4, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 3.8077731092436977, |
| "grad_norm": 0.7579039345943492, |
| "learning_rate": 2.0434770135965743e-05, |
| "loss": 0.2121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.200333833694458, |
| "step": 3625, |
| "valid_targets_mean": 2157.2, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 3.8130252100840334, |
| "grad_norm": 0.6470297697973766, |
| "learning_rate": 2.0382395013147347e-05, |
| "loss": 0.2022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19545529782772064, |
| "step": 3630, |
| "valid_targets_mean": 2711.9, |
| "valid_targets_min": 1144 |
| }, |
| { |
| "epoch": 3.81827731092437, |
| "grad_norm": 0.653362214398331, |
| "learning_rate": 2.033001726681349e-05, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21826599538326263, |
| "step": 3635, |
| "valid_targets_mean": 2853.1, |
| "valid_targets_min": 1078 |
| }, |
| { |
| "epoch": 3.8235294117647056, |
| "grad_norm": 0.6867053178122183, |
| "learning_rate": 2.027763725631463e-05, |
| "loss": 0.2023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19404883682727814, |
| "step": 3640, |
| "valid_targets_mean": 2482.8, |
| "valid_targets_min": 1067 |
| }, |
| { |
| "epoch": 3.828781512605042, |
| "grad_norm": 0.7218696655921097, |
| "learning_rate": 2.0225255341016794e-05, |
| "loss": 0.2105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1934603750705719, |
| "step": 3645, |
| "valid_targets_mean": 2152.1, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 3.8340336134453783, |
| "grad_norm": 0.7091556745123918, |
| "learning_rate": 2.017287188029904e-05, |
| "loss": 0.2038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21000255644321442, |
| "step": 3650, |
| "valid_targets_mean": 2308.8, |
| "valid_targets_min": 610 |
| }, |
| { |
| "epoch": 3.8392857142857144, |
| "grad_norm": 0.6815200778696167, |
| "learning_rate": 2.0120487233551035e-05, |
| "loss": 0.2187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23103326559066772, |
| "step": 3655, |
| "valid_targets_mean": 2734.1, |
| "valid_targets_min": 610 |
| }, |
| { |
| "epoch": 3.8445378151260505, |
| "grad_norm": 0.6280352447022034, |
| "learning_rate": 2.006810176017059e-05, |
| "loss": 0.2085, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21302129328250885, |
| "step": 3660, |
| "valid_targets_mean": 3324.1, |
| "valid_targets_min": 1012 |
| }, |
| { |
| "epoch": 3.8497899159663866, |
| "grad_norm": 0.7066023629427282, |
| "learning_rate": 2.0015715819561205e-05, |
| "loss": 0.2138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21427252888679504, |
| "step": 3665, |
| "valid_targets_mean": 2452.4, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 3.8550420168067228, |
| "grad_norm": 0.647316148786966, |
| "learning_rate": 1.9963329771129558e-05, |
| "loss": 0.1952, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1968604177236557, |
| "step": 3670, |
| "valid_targets_mean": 2530.9, |
| "valid_targets_min": 1254 |
| }, |
| { |
| "epoch": 3.860294117647059, |
| "grad_norm": 0.6784605187933433, |
| "learning_rate": 1.9910943974283066e-05, |
| "loss": 0.2143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2061229795217514, |
| "step": 3675, |
| "valid_targets_mean": 2622.5, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 3.865546218487395, |
| "grad_norm": 0.6920269949000379, |
| "learning_rate": 1.9858558788427447e-05, |
| "loss": 0.1973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18967095017433167, |
| "step": 3680, |
| "valid_targets_mean": 2135.2, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 3.870798319327731, |
| "grad_norm": 0.7052959882420897, |
| "learning_rate": 1.9806174572964205e-05, |
| "loss": 0.2198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20895016193389893, |
| "step": 3685, |
| "valid_targets_mean": 2395.5, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 3.8760504201680672, |
| "grad_norm": 0.6385724766539387, |
| "learning_rate": 1.975379168728819e-05, |
| "loss": 0.2136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2081984281539917, |
| "step": 3690, |
| "valid_targets_mean": 2853.7, |
| "valid_targets_min": 936 |
| }, |
| { |
| "epoch": 3.8813025210084033, |
| "grad_norm": 0.72510115733088, |
| "learning_rate": 1.9701410490785128e-05, |
| "loss": 0.2249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22268277406692505, |
| "step": 3695, |
| "valid_targets_mean": 2524.2, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 3.8865546218487395, |
| "grad_norm": 0.7123147276422185, |
| "learning_rate": 1.9649031342829178e-05, |
| "loss": 0.2055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22262287139892578, |
| "step": 3700, |
| "valid_targets_mean": 2540.8, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 3.8918067226890756, |
| "grad_norm": 0.6390925839310951, |
| "learning_rate": 1.9596654602780398e-05, |
| "loss": 0.2161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19909490644931793, |
| "step": 3705, |
| "valid_targets_mean": 2773.2, |
| "valid_targets_min": 853 |
| }, |
| { |
| "epoch": 3.8970588235294117, |
| "grad_norm": 0.6412477203773937, |
| "learning_rate": 1.9544280629982364e-05, |
| "loss": 0.2038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1946112960577011, |
| "step": 3710, |
| "valid_targets_mean": 2642.8, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 3.902310924369748, |
| "grad_norm": 0.716484891233997, |
| "learning_rate": 1.949190978375966e-05, |
| "loss": 0.2122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23176735639572144, |
| "step": 3715, |
| "valid_targets_mean": 2558.9, |
| "valid_targets_min": 1150 |
| }, |
| { |
| "epoch": 3.907563025210084, |
| "grad_norm": 0.6768189969402229, |
| "learning_rate": 1.9439542423415413e-05, |
| "loss": 0.2018, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19778092205524445, |
| "step": 3720, |
| "valid_targets_mean": 2772.1, |
| "valid_targets_min": 1107 |
| }, |
| { |
| "epoch": 3.91281512605042, |
| "grad_norm": 0.6207653385694745, |
| "learning_rate": 1.9387178908228838e-05, |
| "loss": 0.2181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20920640230178833, |
| "step": 3725, |
| "valid_targets_mean": 3297.2, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 3.918067226890756, |
| "grad_norm": 0.7356716818302198, |
| "learning_rate": 1.933481959745276e-05, |
| "loss": 0.2218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24886155128479004, |
| "step": 3730, |
| "valid_targets_mean": 2577.4, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 3.9233193277310923, |
| "grad_norm": 0.6771424238422388, |
| "learning_rate": 1.9282464850311184e-05, |
| "loss": 0.2115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22557204961776733, |
| "step": 3735, |
| "valid_targets_mean": 2883.5, |
| "valid_targets_min": 474 |
| }, |
| { |
| "epoch": 3.928571428571429, |
| "grad_norm": 0.7641048688976471, |
| "learning_rate": 1.9230115025996764e-05, |
| "loss": 0.208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2032201588153839, |
| "step": 3740, |
| "valid_targets_mean": 1858.1, |
| "valid_targets_min": 1143 |
| }, |
| { |
| "epoch": 3.9338235294117645, |
| "grad_norm": 0.5906821588122515, |
| "learning_rate": 1.9177770483668416e-05, |
| "loss": 0.2203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1867651641368866, |
| "step": 3745, |
| "valid_targets_mean": 2936.9, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 3.939075630252101, |
| "grad_norm": 0.6203552861446046, |
| "learning_rate": 1.912543158244881e-05, |
| "loss": 0.2128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19798970222473145, |
| "step": 3750, |
| "valid_targets_mean": 3003.4, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 3.9443277310924367, |
| "grad_norm": 0.7646340475457648, |
| "learning_rate": 1.9073098681421895e-05, |
| "loss": 0.2129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19918084144592285, |
| "step": 3755, |
| "valid_targets_mean": 1886.4, |
| "valid_targets_min": 545 |
| }, |
| { |
| "epoch": 3.9495798319327733, |
| "grad_norm": 0.6926521998600635, |
| "learning_rate": 1.902077213963048e-05, |
| "loss": 0.1995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2141200602054596, |
| "step": 3760, |
| "valid_targets_mean": 2899.2, |
| "valid_targets_min": 896 |
| }, |
| { |
| "epoch": 3.9548319327731094, |
| "grad_norm": 0.7157783415052118, |
| "learning_rate": 1.896845231607372e-05, |
| "loss": 0.1966, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19222521781921387, |
| "step": 3765, |
| "valid_targets_mean": 2013.7, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 3.9600840336134455, |
| "grad_norm": 0.8266386898112025, |
| "learning_rate": 1.8916139569704704e-05, |
| "loss": 0.2116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22533836960792542, |
| "step": 3770, |
| "valid_targets_mean": 2034.5, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 3.9653361344537816, |
| "grad_norm": 0.8096944452658449, |
| "learning_rate": 1.886383425942795e-05, |
| "loss": 0.2019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18177619576454163, |
| "step": 3775, |
| "valid_targets_mean": 1980.1, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 3.9705882352941178, |
| "grad_norm": 0.6708795853596977, |
| "learning_rate": 1.8811536744096956e-05, |
| "loss": 0.2115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2508021593093872, |
| "step": 3780, |
| "valid_targets_mean": 2865.2, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 3.975840336134454, |
| "grad_norm": 0.6124622098856916, |
| "learning_rate": 1.8759247382511748e-05, |
| "loss": 0.2019, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21529731154441833, |
| "step": 3785, |
| "valid_targets_mean": 3260.9, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 3.98109243697479, |
| "grad_norm": 0.7245013981014534, |
| "learning_rate": 1.8706966533416413e-05, |
| "loss": 0.2103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2099657505750656, |
| "step": 3790, |
| "valid_targets_mean": 2156.7, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 3.986344537815126, |
| "grad_norm": 0.7199624429982473, |
| "learning_rate": 1.8654694555496624e-05, |
| "loss": 0.2138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2163430154323578, |
| "step": 3795, |
| "valid_targets_mean": 2900.4, |
| "valid_targets_min": 1205 |
| }, |
| { |
| "epoch": 3.991596638655462, |
| "grad_norm": 0.7313432594209842, |
| "learning_rate": 1.860243180737721e-05, |
| "loss": 0.2097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24018210172653198, |
| "step": 3800, |
| "valid_targets_mean": 2467.2, |
| "valid_targets_min": 867 |
| }, |
| { |
| "epoch": 3.9968487394957983, |
| "grad_norm": 0.686344735243992, |
| "learning_rate": 1.8550178647619664e-05, |
| "loss": 0.2064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2029697597026825, |
| "step": 3805, |
| "valid_targets_mean": 2462.6, |
| "valid_targets_min": 853 |
| }, |
| { |
| "epoch": 4.0021008403361344, |
| "grad_norm": 0.5964545073234324, |
| "learning_rate": 1.84979354347197e-05, |
| "loss": 0.1972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15941348671913147, |
| "step": 3810, |
| "valid_targets_mean": 2904.0, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 4.007352941176471, |
| "grad_norm": 0.6310111711662433, |
| "learning_rate": 1.8445702527104782e-05, |
| "loss": 0.1758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17425957322120667, |
| "step": 3815, |
| "valid_targets_mean": 2903.4, |
| "valid_targets_min": 1572 |
| }, |
| { |
| "epoch": 4.012605042016807, |
| "grad_norm": 0.8382816261281872, |
| "learning_rate": 1.8393480283131677e-05, |
| "loss": 0.1876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1987411081790924, |
| "step": 3820, |
| "valid_targets_mean": 2029.4, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 4.017857142857143, |
| "grad_norm": 0.6828047242423465, |
| "learning_rate": 1.8341269061083996e-05, |
| "loss": 0.1826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16214141249656677, |
| "step": 3825, |
| "valid_targets_mean": 2665.1, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 4.023109243697479, |
| "grad_norm": 0.6544969992637274, |
| "learning_rate": 1.8289069219169717e-05, |
| "loss": 0.1698, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15575842559337616, |
| "step": 3830, |
| "valid_targets_mean": 2708.9, |
| "valid_targets_min": 741 |
| }, |
| { |
| "epoch": 4.0283613445378155, |
| "grad_norm": 0.665567823015263, |
| "learning_rate": 1.8236881115518766e-05, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1710759848356247, |
| "step": 3835, |
| "valid_targets_mean": 2501.2, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 4.033613445378151, |
| "grad_norm": 0.8048649946622554, |
| "learning_rate": 1.8184705108180516e-05, |
| "loss": 0.1964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21742048859596252, |
| "step": 3840, |
| "valid_targets_mean": 2245.1, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 4.038865546218488, |
| "grad_norm": 0.6730348979572065, |
| "learning_rate": 1.8132541555121353e-05, |
| "loss": 0.1745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17370149493217468, |
| "step": 3845, |
| "valid_targets_mean": 3004.6, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 4.044117647058823, |
| "grad_norm": 0.6773064122209941, |
| "learning_rate": 1.808039081422223e-05, |
| "loss": 0.1759, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.177533358335495, |
| "step": 3850, |
| "valid_targets_mean": 2959.3, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 4.04936974789916, |
| "grad_norm": 0.8972828803367779, |
| "learning_rate": 1.802825324327618e-05, |
| "loss": 0.1866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19859957695007324, |
| "step": 3855, |
| "valid_targets_mean": 1707.2, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 4.054621848739496, |
| "grad_norm": 0.6816271881225173, |
| "learning_rate": 1.7976129199985886e-05, |
| "loss": 0.1863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19027729332447052, |
| "step": 3860, |
| "valid_targets_mean": 2623.9, |
| "valid_targets_min": 1048 |
| }, |
| { |
| "epoch": 4.059873949579832, |
| "grad_norm": 0.7082107239302485, |
| "learning_rate": 1.7924019041961228e-05, |
| "loss": 0.179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17302575707435608, |
| "step": 3865, |
| "valid_targets_mean": 2540.1, |
| "valid_targets_min": 792 |
| }, |
| { |
| "epoch": 4.065126050420168, |
| "grad_norm": 0.781860364268105, |
| "learning_rate": 1.7871923126716827e-05, |
| "loss": 0.1827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17314311861991882, |
| "step": 3870, |
| "valid_targets_mean": 1902.4, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 4.070378151260504, |
| "grad_norm": 0.770240331697946, |
| "learning_rate": 1.7819841811669573e-05, |
| "loss": 0.1726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17767006158828735, |
| "step": 3875, |
| "valid_targets_mean": 2162.2, |
| "valid_targets_min": 990 |
| }, |
| { |
| "epoch": 4.07563025210084, |
| "grad_norm": 0.7494050596565602, |
| "learning_rate": 1.7767775454136194e-05, |
| "loss": 0.1684, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16591396927833557, |
| "step": 3880, |
| "valid_targets_mean": 2518.5, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 4.080882352941177, |
| "grad_norm": 0.6697129284162905, |
| "learning_rate": 1.7715724411330806e-05, |
| "loss": 0.1757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1829383820295334, |
| "step": 3885, |
| "valid_targets_mean": 3106.3, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 4.086134453781512, |
| "grad_norm": 0.7339734064772027, |
| "learning_rate": 1.7663689040362446e-05, |
| "loss": 0.1872, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18020042777061462, |
| "step": 3890, |
| "valid_targets_mean": 2812.9, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 4.091386554621849, |
| "grad_norm": 0.7376435988375549, |
| "learning_rate": 1.761166969823262e-05, |
| "loss": 0.1798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15077045559883118, |
| "step": 3895, |
| "valid_targets_mean": 2092.4, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 4.0966386554621845, |
| "grad_norm": 0.6730357795335743, |
| "learning_rate": 1.7559666741832896e-05, |
| "loss": 0.187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16643144190311432, |
| "step": 3900, |
| "valid_targets_mean": 2449.2, |
| "valid_targets_min": 982 |
| }, |
| { |
| "epoch": 4.101890756302521, |
| "grad_norm": 0.8297442949389751, |
| "learning_rate": 1.750768052794239e-05, |
| "loss": 0.1927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18952782452106476, |
| "step": 3905, |
| "valid_targets_mean": 1901.9, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 4.107142857142857, |
| "grad_norm": 0.794021570909151, |
| "learning_rate": 1.7455711413225372e-05, |
| "loss": 0.1846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19502568244934082, |
| "step": 3910, |
| "valid_targets_mean": 2269.1, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 4.112394957983193, |
| "grad_norm": 0.8070144150239097, |
| "learning_rate": 1.7403759754228794e-05, |
| "loss": 0.1795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17317187786102295, |
| "step": 3915, |
| "valid_targets_mean": 1938.3, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 4.117647058823529, |
| "grad_norm": 0.6999096413433571, |
| "learning_rate": 1.7351825907379837e-05, |
| "loss": 0.1803, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1811293363571167, |
| "step": 3920, |
| "valid_targets_mean": 2730.1, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 4.1228991596638656, |
| "grad_norm": 0.7320665392327763, |
| "learning_rate": 1.7299910228983513e-05, |
| "loss": 0.1786, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1840408742427826, |
| "step": 3925, |
| "valid_targets_mean": 2366.4, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 4.128151260504202, |
| "grad_norm": 0.7286921165522647, |
| "learning_rate": 1.7248013075220128e-05, |
| "loss": 0.1764, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17183949053287506, |
| "step": 3930, |
| "valid_targets_mean": 2257.6, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 4.133403361344538, |
| "grad_norm": 0.7113378690439488, |
| "learning_rate": 1.7196134802142945e-05, |
| "loss": 0.1846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1910371482372284, |
| "step": 3935, |
| "valid_targets_mean": 2610.0, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 4.138655462184874, |
| "grad_norm": 0.9815704878476788, |
| "learning_rate": 1.7144275765675673e-05, |
| "loss": 0.1737, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1488598883152008, |
| "step": 3940, |
| "valid_targets_mean": 2683.5, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 4.14390756302521, |
| "grad_norm": 0.6552007544862622, |
| "learning_rate": 1.7092436321610042e-05, |
| "loss": 0.1755, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17244458198547363, |
| "step": 3945, |
| "valid_targets_mean": 3017.2, |
| "valid_targets_min": 706 |
| }, |
| { |
| "epoch": 4.149159663865547, |
| "grad_norm": 0.7250853653334564, |
| "learning_rate": 1.704061682560336e-05, |
| "loss": 0.171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17147307097911835, |
| "step": 3950, |
| "valid_targets_mean": 2484.5, |
| "valid_targets_min": 1216 |
| }, |
| { |
| "epoch": 4.154411764705882, |
| "grad_norm": 0.7570116394721385, |
| "learning_rate": 1.698881763317609e-05, |
| "loss": 0.1856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19652274250984192, |
| "step": 3955, |
| "valid_targets_mean": 2825.2, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 4.159663865546219, |
| "grad_norm": 0.7477767810091138, |
| "learning_rate": 1.69370390997094e-05, |
| "loss": 0.1868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1591658890247345, |
| "step": 3960, |
| "valid_targets_mean": 2386.2, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 4.1649159663865545, |
| "grad_norm": 0.7313664660917486, |
| "learning_rate": 1.6885281580442677e-05, |
| "loss": 0.1798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18173372745513916, |
| "step": 3965, |
| "valid_targets_mean": 2462.9, |
| "valid_targets_min": 816 |
| }, |
| { |
| "epoch": 4.170168067226891, |
| "grad_norm": 0.6878567291997353, |
| "learning_rate": 1.6833545430471194e-05, |
| "loss": 0.1817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16087912023067474, |
| "step": 3970, |
| "valid_targets_mean": 2534.8, |
| "valid_targets_min": 920 |
| }, |
| { |
| "epoch": 4.175420168067227, |
| "grad_norm": 0.7273228101827134, |
| "learning_rate": 1.678183100474359e-05, |
| "loss": 0.1814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1902090162038803, |
| "step": 3975, |
| "valid_targets_mean": 2782.7, |
| "valid_targets_min": 1105 |
| }, |
| { |
| "epoch": 4.180672268907563, |
| "grad_norm": 0.7924963064350935, |
| "learning_rate": 1.6730138658059448e-05, |
| "loss": 0.1784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18615125119686127, |
| "step": 3980, |
| "valid_targets_mean": 2283.1, |
| "valid_targets_min": 936 |
| }, |
| { |
| "epoch": 4.185924369747899, |
| "grad_norm": 0.7668376984218435, |
| "learning_rate": 1.667846874506689e-05, |
| "loss": 0.1724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18692851066589355, |
| "step": 3985, |
| "valid_targets_mean": 2412.2, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 4.1911764705882355, |
| "grad_norm": 0.6979922592014087, |
| "learning_rate": 1.662682162026012e-05, |
| "loss": 0.183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16892990469932556, |
| "step": 3990, |
| "valid_targets_mean": 2284.2, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 4.196428571428571, |
| "grad_norm": 0.7050681864554844, |
| "learning_rate": 1.6575197637976995e-05, |
| "loss": 0.179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19187793135643005, |
| "step": 3995, |
| "valid_targets_mean": 3008.6, |
| "valid_targets_min": 775 |
| }, |
| { |
| "epoch": 4.201680672268908, |
| "grad_norm": 0.7383233513848826, |
| "learning_rate": 1.652359715239661e-05, |
| "loss": 0.1767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17365893721580505, |
| "step": 4000, |
| "valid_targets_mean": 2399.9, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 4.206932773109243, |
| "grad_norm": 0.7797983416724591, |
| "learning_rate": 1.6472020517536828e-05, |
| "loss": 0.1804, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17422497272491455, |
| "step": 4005, |
| "valid_targets_mean": 3114.1, |
| "valid_targets_min": 839 |
| }, |
| { |
| "epoch": 4.21218487394958, |
| "grad_norm": 0.7864125547244055, |
| "learning_rate": 1.6420468087251907e-05, |
| "loss": 0.1807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16865600645542145, |
| "step": 4010, |
| "valid_targets_mean": 1723.1, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 4.217436974789916, |
| "grad_norm": 0.7327097751903167, |
| "learning_rate": 1.6368940215230026e-05, |
| "loss": 0.1779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16839268803596497, |
| "step": 4015, |
| "valid_targets_mean": 2459.2, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 4.222689075630252, |
| "grad_norm": 0.8238296453072825, |
| "learning_rate": 1.6317437254990875e-05, |
| "loss": 0.1839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1884918212890625, |
| "step": 4020, |
| "valid_targets_mean": 2194.0, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 4.227941176470588, |
| "grad_norm": 0.6460591633506324, |
| "learning_rate": 1.626595955988325e-05, |
| "loss": 0.1829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20153161883354187, |
| "step": 4025, |
| "valid_targets_mean": 3779.9, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 4.233193277310924, |
| "grad_norm": 0.7457345391565217, |
| "learning_rate": 1.6214507483082593e-05, |
| "loss": 0.1892, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19580884277820587, |
| "step": 4030, |
| "valid_targets_mean": 2798.9, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 4.23844537815126, |
| "grad_norm": 0.9377584690672369, |
| "learning_rate": 1.6163081377588588e-05, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19530422985553741, |
| "step": 4035, |
| "valid_targets_mean": 2320.8, |
| "valid_targets_min": 1065 |
| }, |
| { |
| "epoch": 4.243697478991597, |
| "grad_norm": 0.7042255194986914, |
| "learning_rate": 1.6111681596222732e-05, |
| "loss": 0.1858, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1799120008945465, |
| "step": 4040, |
| "valid_targets_mean": 2469.2, |
| "valid_targets_min": 1188 |
| }, |
| { |
| "epoch": 4.248949579831933, |
| "grad_norm": 0.8657610459161533, |
| "learning_rate": 1.606030849162593e-05, |
| "loss": 0.1878, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17773385345935822, |
| "step": 4045, |
| "valid_targets_mean": 2067.2, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 4.254201680672269, |
| "grad_norm": 0.7170358815089117, |
| "learning_rate": 1.600896241625605e-05, |
| "loss": 0.1819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17556703090667725, |
| "step": 4050, |
| "valid_targets_mean": 2699.3, |
| "valid_targets_min": 1230 |
| }, |
| { |
| "epoch": 4.2594537815126055, |
| "grad_norm": 0.6997369617036321, |
| "learning_rate": 1.5957643722385532e-05, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18936964869499207, |
| "step": 4055, |
| "valid_targets_mean": 2953.2, |
| "valid_targets_min": 1086 |
| }, |
| { |
| "epoch": 4.264705882352941, |
| "grad_norm": 0.6298850135767894, |
| "learning_rate": 1.590635276209896e-05, |
| "loss": 0.1793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15947186946868896, |
| "step": 4060, |
| "valid_targets_mean": 3146.7, |
| "valid_targets_min": 902 |
| }, |
| { |
| "epoch": 4.269957983193278, |
| "grad_norm": 0.7757297711293648, |
| "learning_rate": 1.5855089887290634e-05, |
| "loss": 0.1883, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1859544813632965, |
| "step": 4065, |
| "valid_targets_mean": 2376.6, |
| "valid_targets_min": 889 |
| }, |
| { |
| "epoch": 4.275210084033613, |
| "grad_norm": 0.707196240386275, |
| "learning_rate": 1.5803855449662175e-05, |
| "loss": 0.1838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17105159163475037, |
| "step": 4070, |
| "valid_targets_mean": 3088.3, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 4.28046218487395, |
| "grad_norm": 0.6412532070399728, |
| "learning_rate": 1.5752649800720096e-05, |
| "loss": 0.1827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17575950920581818, |
| "step": 4075, |
| "valid_targets_mean": 3077.6, |
| "valid_targets_min": 929 |
| }, |
| { |
| "epoch": 4.285714285714286, |
| "grad_norm": 0.7333503639293483, |
| "learning_rate": 1.5701473291773395e-05, |
| "loss": 0.1833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16692572832107544, |
| "step": 4080, |
| "valid_targets_mean": 2213.4, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 4.290966386554622, |
| "grad_norm": 0.7789248084874639, |
| "learning_rate": 1.5650326273931166e-05, |
| "loss": 0.1898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18778863549232483, |
| "step": 4085, |
| "valid_targets_mean": 2436.8, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 4.296218487394958, |
| "grad_norm": 0.7608523839784216, |
| "learning_rate": 1.559920909810016e-05, |
| "loss": 0.1905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18575254082679749, |
| "step": 4090, |
| "valid_targets_mean": 2774.9, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 4.301470588235294, |
| "grad_norm": 0.7894327029271562, |
| "learning_rate": 1.5548122114982393e-05, |
| "loss": 0.1838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20460262894630432, |
| "step": 4095, |
| "valid_targets_mean": 2156.1, |
| "valid_targets_min": 628 |
| }, |
| { |
| "epoch": 4.30672268907563, |
| "grad_norm": 0.7108371500394565, |
| "learning_rate": 1.5497065675072728e-05, |
| "loss": 0.174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1754794716835022, |
| "step": 4100, |
| "valid_targets_mean": 2560.9, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 4.311974789915967, |
| "grad_norm": 0.7197950949390775, |
| "learning_rate": 1.5446040128656485e-05, |
| "loss": 0.182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1896936446428299, |
| "step": 4105, |
| "valid_targets_mean": 2634.4, |
| "valid_targets_min": 1256 |
| }, |
| { |
| "epoch": 4.317226890756302, |
| "grad_norm": 0.815627208196532, |
| "learning_rate": 1.539504582580704e-05, |
| "loss": 0.1888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1940707117319107, |
| "step": 4110, |
| "valid_targets_mean": 2417.6, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 4.322478991596639, |
| "grad_norm": 0.6715019204570937, |
| "learning_rate": 1.5344083116383395e-05, |
| "loss": 0.1814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16882187128067017, |
| "step": 4115, |
| "valid_targets_mean": 3112.1, |
| "valid_targets_min": 910 |
| }, |
| { |
| "epoch": 4.3277310924369745, |
| "grad_norm": 0.8201097153549575, |
| "learning_rate": 1.529315235002781e-05, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18270252645015717, |
| "step": 4120, |
| "valid_targets_mean": 2153.9, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 4.332983193277311, |
| "grad_norm": 0.6915688934573623, |
| "learning_rate": 1.5242253876163399e-05, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18757754564285278, |
| "step": 4125, |
| "valid_targets_mean": 3134.6, |
| "valid_targets_min": 1432 |
| }, |
| { |
| "epoch": 4.338235294117647, |
| "grad_norm": 0.7700752339493685, |
| "learning_rate": 1.5191388043991712e-05, |
| "loss": 0.1789, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20721203088760376, |
| "step": 4130, |
| "valid_targets_mean": 2372.6, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 4.343487394957983, |
| "grad_norm": 0.7313076777239362, |
| "learning_rate": 1.5140555202490359e-05, |
| "loss": 0.1817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16860508918762207, |
| "step": 4135, |
| "valid_targets_mean": 2125.1, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 4.348739495798319, |
| "grad_norm": 0.7070894615662773, |
| "learning_rate": 1.5089755700410602e-05, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1806333363056183, |
| "step": 4140, |
| "valid_targets_mean": 2950.4, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 4.3539915966386555, |
| "grad_norm": 0.7047900654504996, |
| "learning_rate": 1.5038989886274992e-05, |
| "loss": 0.183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17181357741355896, |
| "step": 4145, |
| "valid_targets_mean": 2456.4, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 4.359243697478991, |
| "grad_norm": 0.7947773694315373, |
| "learning_rate": 1.498825810837492e-05, |
| "loss": 0.1824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1729154884815216, |
| "step": 4150, |
| "valid_targets_mean": 2260.0, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 4.364495798319328, |
| "grad_norm": 0.7438599144833491, |
| "learning_rate": 1.4937560714768283e-05, |
| "loss": 0.1797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17960473895072937, |
| "step": 4155, |
| "valid_targets_mean": 2432.4, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 4.369747899159664, |
| "grad_norm": 0.771452228573944, |
| "learning_rate": 1.4886898053277086e-05, |
| "loss": 0.179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21052835881710052, |
| "step": 4160, |
| "valid_targets_mean": 2578.2, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 4.375, |
| "grad_norm": 0.6592959235985212, |
| "learning_rate": 1.4836270471485029e-05, |
| "loss": 0.1706, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18025822937488556, |
| "step": 4165, |
| "valid_targets_mean": 3174.4, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 4.380252100840336, |
| "grad_norm": 0.818888534502337, |
| "learning_rate": 1.4785678316735144e-05, |
| "loss": 0.1788, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1800573468208313, |
| "step": 4170, |
| "valid_targets_mean": 2206.2, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 4.385504201680672, |
| "grad_norm": 0.6949510487488129, |
| "learning_rate": 1.4735121936127406e-05, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15901532769203186, |
| "step": 4175, |
| "valid_targets_mean": 2460.3, |
| "valid_targets_min": 309 |
| }, |
| { |
| "epoch": 4.390756302521009, |
| "grad_norm": 0.7369699549502026, |
| "learning_rate": 1.4684601676516366e-05, |
| "loss": 0.1779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1716357171535492, |
| "step": 4180, |
| "valid_targets_mean": 2640.8, |
| "valid_targets_min": 626 |
| }, |
| { |
| "epoch": 4.3960084033613445, |
| "grad_norm": 0.8430612932856147, |
| "learning_rate": 1.4634117884508738e-05, |
| "loss": 0.1757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17793697118759155, |
| "step": 4185, |
| "valid_targets_mean": 1770.9, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 4.401260504201681, |
| "grad_norm": 0.7931502126995679, |
| "learning_rate": 1.458367090646105e-05, |
| "loss": 0.1797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20347827672958374, |
| "step": 4190, |
| "valid_targets_mean": 2522.5, |
| "valid_targets_min": 985 |
| }, |
| { |
| "epoch": 4.406512605042017, |
| "grad_norm": 0.7167848190563175, |
| "learning_rate": 1.4533261088477257e-05, |
| "loss": 0.1841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18484370410442352, |
| "step": 4195, |
| "valid_targets_mean": 2692.8, |
| "valid_targets_min": 747 |
| }, |
| { |
| "epoch": 4.411764705882353, |
| "grad_norm": 0.7138856506553442, |
| "learning_rate": 1.448288877640637e-05, |
| "loss": 0.1824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1668294370174408, |
| "step": 4200, |
| "valid_targets_mean": 2518.8, |
| "valid_targets_min": 654 |
| }, |
| { |
| "epoch": 4.417016806722689, |
| "grad_norm": 0.6504444444519508, |
| "learning_rate": 1.4432554315840082e-05, |
| "loss": 0.1783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18564704060554504, |
| "step": 4205, |
| "valid_targets_mean": 3140.6, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 4.4222689075630255, |
| "grad_norm": 0.8499270398136098, |
| "learning_rate": 1.438225805211039e-05, |
| "loss": 0.1818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18404464423656464, |
| "step": 4210, |
| "valid_targets_mean": 1649.0, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 4.427521008403361, |
| "grad_norm": 0.715092529952324, |
| "learning_rate": 1.4332000330287248e-05, |
| "loss": 0.1821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1709214150905609, |
| "step": 4215, |
| "valid_targets_mean": 2421.9, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 4.432773109243698, |
| "grad_norm": 0.7288642734691909, |
| "learning_rate": 1.428178149517617e-05, |
| "loss": 0.1939, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20450027287006378, |
| "step": 4220, |
| "valid_targets_mean": 2933.5, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 4.438025210084033, |
| "grad_norm": 0.795039692170866, |
| "learning_rate": 1.4231601891315876e-05, |
| "loss": 0.192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18002474308013916, |
| "step": 4225, |
| "valid_targets_mean": 2059.5, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 4.44327731092437, |
| "grad_norm": 0.988082973084519, |
| "learning_rate": 1.418146186297594e-05, |
| "loss": 0.1796, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18671777844429016, |
| "step": 4230, |
| "valid_targets_mean": 1872.4, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 4.448529411764706, |
| "grad_norm": 0.7931578128546755, |
| "learning_rate": 1.413136175415441e-05, |
| "loss": 0.1714, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19192029535770416, |
| "step": 4235, |
| "valid_targets_mean": 2010.4, |
| "valid_targets_min": 848 |
| }, |
| { |
| "epoch": 4.453781512605042, |
| "grad_norm": 0.8177205538850968, |
| "learning_rate": 1.4081301908575457e-05, |
| "loss": 0.1848, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17905864119529724, |
| "step": 4240, |
| "valid_targets_mean": 1845.2, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 4.459033613445378, |
| "grad_norm": 0.7284329325277255, |
| "learning_rate": 1.4031282669687035e-05, |
| "loss": 0.1836, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1842656135559082, |
| "step": 4245, |
| "valid_targets_mean": 2472.1, |
| "valid_targets_min": 1012 |
| }, |
| { |
| "epoch": 4.464285714285714, |
| "grad_norm": 0.7240658652686646, |
| "learning_rate": 1.3981304380658474e-05, |
| "loss": 0.1841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19007527828216553, |
| "step": 4250, |
| "valid_targets_mean": 2486.7, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 4.46953781512605, |
| "grad_norm": 0.7916628114284047, |
| "learning_rate": 1.3931367384378183e-05, |
| "loss": 0.1787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2028101086616516, |
| "step": 4255, |
| "valid_targets_mean": 2322.4, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 4.474789915966387, |
| "grad_norm": 0.7379642382110667, |
| "learning_rate": 1.3881472023451262e-05, |
| "loss": 0.1867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18040382862091064, |
| "step": 4260, |
| "valid_targets_mean": 2429.3, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 4.480042016806722, |
| "grad_norm": 0.7027762915252015, |
| "learning_rate": 1.3831618640197153e-05, |
| "loss": 0.1781, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1830647736787796, |
| "step": 4265, |
| "valid_targets_mean": 2796.7, |
| "valid_targets_min": 887 |
| }, |
| { |
| "epoch": 4.485294117647059, |
| "grad_norm": 0.716947336725011, |
| "learning_rate": 1.3781807576647315e-05, |
| "loss": 0.1826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1749706119298935, |
| "step": 4270, |
| "valid_targets_mean": 2428.2, |
| "valid_targets_min": 805 |
| }, |
| { |
| "epoch": 4.4905462184873945, |
| "grad_norm": 0.7292281203695309, |
| "learning_rate": 1.373203917454285e-05, |
| "loss": 0.1799, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1867130696773529, |
| "step": 4275, |
| "valid_targets_mean": 2838.0, |
| "valid_targets_min": 1197 |
| }, |
| { |
| "epoch": 4.495798319327731, |
| "grad_norm": 0.7290851774469034, |
| "learning_rate": 1.3682313775332186e-05, |
| "loss": 0.1899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16877129673957825, |
| "step": 4280, |
| "valid_targets_mean": 2704.8, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 4.501050420168067, |
| "grad_norm": 0.9037910643162406, |
| "learning_rate": 1.3632631720168705e-05, |
| "loss": 0.1801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1778022050857544, |
| "step": 4285, |
| "valid_targets_mean": 1608.9, |
| "valid_targets_min": 940 |
| }, |
| { |
| "epoch": 4.506302521008403, |
| "grad_norm": 0.7874366555714657, |
| "learning_rate": 1.358299334990842e-05, |
| "loss": 0.1771, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1755077838897705, |
| "step": 4290, |
| "valid_targets_mean": 2098.4, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 4.51155462184874, |
| "grad_norm": 0.8040088928448513, |
| "learning_rate": 1.3533399005107635e-05, |
| "loss": 0.198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1978076994419098, |
| "step": 4295, |
| "valid_targets_mean": 2012.0, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 4.516806722689076, |
| "grad_norm": 0.6756346527241319, |
| "learning_rate": 1.3483849026020603e-05, |
| "loss": 0.1768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17955875396728516, |
| "step": 4300, |
| "valid_targets_mean": 2901.0, |
| "valid_targets_min": 857 |
| }, |
| { |
| "epoch": 4.522058823529412, |
| "grad_norm": 0.7127125041012732, |
| "learning_rate": 1.3434343752597199e-05, |
| "loss": 0.1741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18654534220695496, |
| "step": 4305, |
| "valid_targets_mean": 2637.3, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 4.527310924369748, |
| "grad_norm": 0.6197339001895822, |
| "learning_rate": 1.3384883524480576e-05, |
| "loss": 0.1813, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15983977913856506, |
| "step": 4310, |
| "valid_targets_mean": 3360.6, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 4.532563025210084, |
| "grad_norm": 0.7186207642971952, |
| "learning_rate": 1.333546868100486e-05, |
| "loss": 0.1745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18633624911308289, |
| "step": 4315, |
| "valid_targets_mean": 2568.3, |
| "valid_targets_min": 867 |
| }, |
| { |
| "epoch": 4.53781512605042, |
| "grad_norm": 0.6506719666430806, |
| "learning_rate": 1.3286099561192784e-05, |
| "loss": 0.1806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20066654682159424, |
| "step": 4320, |
| "valid_targets_mean": 3334.8, |
| "valid_targets_min": 1078 |
| }, |
| { |
| "epoch": 4.543067226890757, |
| "grad_norm": 0.7139868060577005, |
| "learning_rate": 1.3236776503753397e-05, |
| "loss": 0.1825, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1832045167684555, |
| "step": 4325, |
| "valid_targets_mean": 2449.9, |
| "valid_targets_min": 889 |
| }, |
| { |
| "epoch": 4.548319327731092, |
| "grad_norm": 0.8346149773596157, |
| "learning_rate": 1.3187499847079713e-05, |
| "loss": 0.1764, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17674115300178528, |
| "step": 4330, |
| "valid_targets_mean": 1668.5, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 4.553571428571429, |
| "grad_norm": 0.8581192326236325, |
| "learning_rate": 1.3138269929246427e-05, |
| "loss": 0.1752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.169841468334198, |
| "step": 4335, |
| "valid_targets_mean": 2480.5, |
| "valid_targets_min": 758 |
| }, |
| { |
| "epoch": 4.5588235294117645, |
| "grad_norm": 0.6712603189184432, |
| "learning_rate": 1.308908708800753e-05, |
| "loss": 0.1947, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17790794372558594, |
| "step": 4340, |
| "valid_targets_mean": 3218.3, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 4.564075630252101, |
| "grad_norm": 0.8382631585908171, |
| "learning_rate": 1.3039951660794063e-05, |
| "loss": 0.188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20454202592372894, |
| "step": 4345, |
| "valid_targets_mean": 2153.2, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 4.569327731092437, |
| "grad_norm": 0.7788139909395001, |
| "learning_rate": 1.2990863984711773e-05, |
| "loss": 0.181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.187415212392807, |
| "step": 4350, |
| "valid_targets_mean": 2221.0, |
| "valid_targets_min": 784 |
| }, |
| { |
| "epoch": 4.574579831932773, |
| "grad_norm": 0.8228381865776829, |
| "learning_rate": 1.294182439653878e-05, |
| "loss": 0.1882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2052648365497589, |
| "step": 4355, |
| "valid_targets_mean": 2024.1, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 4.579831932773109, |
| "grad_norm": 0.7969097110247945, |
| "learning_rate": 1.2892833232723297e-05, |
| "loss": 0.1863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19444799423217773, |
| "step": 4360, |
| "valid_targets_mean": 2430.7, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 4.5850840336134455, |
| "grad_norm": 0.8950927024396919, |
| "learning_rate": 1.2843890829381303e-05, |
| "loss": 0.1819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1735416203737259, |
| "step": 4365, |
| "valid_targets_mean": 1948.1, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 4.590336134453781, |
| "grad_norm": 0.7524319791833006, |
| "learning_rate": 1.2794997522294263e-05, |
| "loss": 0.1787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17769590020179749, |
| "step": 4370, |
| "valid_targets_mean": 2317.9, |
| "valid_targets_min": 917 |
| }, |
| { |
| "epoch": 4.595588235294118, |
| "grad_norm": 0.8185328703075273, |
| "learning_rate": 1.2746153646906766e-05, |
| "loss": 0.1722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17284256219863892, |
| "step": 4375, |
| "valid_targets_mean": 1852.3, |
| "valid_targets_min": 610 |
| }, |
| { |
| "epoch": 4.600840336134453, |
| "grad_norm": 0.8366151911421962, |
| "learning_rate": 1.2697359538324303e-05, |
| "loss": 0.1839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17999669909477234, |
| "step": 4380, |
| "valid_targets_mean": 2349.4, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 4.60609243697479, |
| "grad_norm": 0.74572952017287, |
| "learning_rate": 1.2648615531310907e-05, |
| "loss": 0.1805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18219012022018433, |
| "step": 4385, |
| "valid_targets_mean": 2272.4, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 4.6113445378151265, |
| "grad_norm": 0.7591238610620517, |
| "learning_rate": 1.259992196028688e-05, |
| "loss": 0.1772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1870465874671936, |
| "step": 4390, |
| "valid_targets_mean": 2377.6, |
| "valid_targets_min": 884 |
| }, |
| { |
| "epoch": 4.616596638655462, |
| "grad_norm": 0.7984813374731973, |
| "learning_rate": 1.2551279159326495e-05, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1903630644083023, |
| "step": 4395, |
| "valid_targets_mean": 2266.4, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 4.621848739495798, |
| "grad_norm": 0.7169284378785025, |
| "learning_rate": 1.2502687462155709e-05, |
| "loss": 0.1767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17516914010047913, |
| "step": 4400, |
| "valid_targets_mean": 2642.4, |
| "valid_targets_min": 1050 |
| }, |
| { |
| "epoch": 4.6271008403361344, |
| "grad_norm": 0.7778626068632182, |
| "learning_rate": 1.2454147202149865e-05, |
| "loss": 0.1873, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18522366881370544, |
| "step": 4405, |
| "valid_targets_mean": 2276.4, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 4.632352941176471, |
| "grad_norm": 0.7163788723425591, |
| "learning_rate": 1.2405658712331409e-05, |
| "loss": 0.1718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17094354331493378, |
| "step": 4410, |
| "valid_targets_mean": 2692.1, |
| "valid_targets_min": 1078 |
| }, |
| { |
| "epoch": 4.637605042016807, |
| "grad_norm": 0.7021250334619412, |
| "learning_rate": 1.2357222325367604e-05, |
| "loss": 0.1798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2073124796152115, |
| "step": 4415, |
| "valid_targets_mean": 3277.5, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 4.642857142857143, |
| "grad_norm": 0.7042673790509252, |
| "learning_rate": 1.2308838373568249e-05, |
| "loss": 0.1788, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18093574047088623, |
| "step": 4420, |
| "valid_targets_mean": 3193.1, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 4.648109243697479, |
| "grad_norm": 0.7080962295239951, |
| "learning_rate": 1.2260507188883395e-05, |
| "loss": 0.1802, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.179480642080307, |
| "step": 4425, |
| "valid_targets_mean": 2543.3, |
| "valid_targets_min": 967 |
| }, |
| { |
| "epoch": 4.6533613445378155, |
| "grad_norm": 0.7498653248193045, |
| "learning_rate": 1.2212229102901077e-05, |
| "loss": 0.1869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1921127885580063, |
| "step": 4430, |
| "valid_targets_mean": 2489.6, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 4.658613445378151, |
| "grad_norm": 0.7571679788787566, |
| "learning_rate": 1.2164004446845037e-05, |
| "loss": 0.1803, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19102567434310913, |
| "step": 4435, |
| "valid_targets_mean": 2422.0, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 4.663865546218488, |
| "grad_norm": 0.7458838101603535, |
| "learning_rate": 1.2115833551572438e-05, |
| "loss": 0.1937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18319690227508545, |
| "step": 4440, |
| "valid_targets_mean": 2450.1, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 4.669117647058823, |
| "grad_norm": 0.7046359584542661, |
| "learning_rate": 1.2067716747571616e-05, |
| "loss": 0.1881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1766650229692459, |
| "step": 4445, |
| "valid_targets_mean": 2313.4, |
| "valid_targets_min": 843 |
| }, |
| { |
| "epoch": 4.67436974789916, |
| "grad_norm": 0.8345834489540149, |
| "learning_rate": 1.201965436495978e-05, |
| "loss": 0.179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19209042191505432, |
| "step": 4450, |
| "valid_targets_mean": 2150.6, |
| "valid_targets_min": 962 |
| }, |
| { |
| "epoch": 4.679621848739496, |
| "grad_norm": 0.763774531100772, |
| "learning_rate": 1.1971646733480784e-05, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20099681615829468, |
| "step": 4455, |
| "valid_targets_mean": 2721.1, |
| "valid_targets_min": 1033 |
| }, |
| { |
| "epoch": 4.684873949579832, |
| "grad_norm": 0.6918104106739509, |
| "learning_rate": 1.1923694182502848e-05, |
| "loss": 0.1841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17281074821949005, |
| "step": 4460, |
| "valid_targets_mean": 2406.6, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 4.690126050420168, |
| "grad_norm": 0.7551738929861327, |
| "learning_rate": 1.1875797041016286e-05, |
| "loss": 0.1825, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1859922856092453, |
| "step": 4465, |
| "valid_targets_mean": 2412.7, |
| "valid_targets_min": 911 |
| }, |
| { |
| "epoch": 4.695378151260504, |
| "grad_norm": 0.7758417255586617, |
| "learning_rate": 1.1827955637631283e-05, |
| "loss": 0.1811, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16596679389476776, |
| "step": 4470, |
| "valid_targets_mean": 2247.4, |
| "valid_targets_min": 833 |
| }, |
| { |
| "epoch": 4.70063025210084, |
| "grad_norm": 0.6806231945697778, |
| "learning_rate": 1.1780170300575602e-05, |
| "loss": 0.1812, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1946016550064087, |
| "step": 4475, |
| "valid_targets_mean": 3193.5, |
| "valid_targets_min": 1143 |
| }, |
| { |
| "epoch": 4.705882352941177, |
| "grad_norm": 0.7375240636905129, |
| "learning_rate": 1.1732441357692353e-05, |
| "loss": 0.1871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17887581884860992, |
| "step": 4480, |
| "valid_targets_mean": 2464.6, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 4.711134453781512, |
| "grad_norm": 0.7620340981837231, |
| "learning_rate": 1.1684769136437742e-05, |
| "loss": 0.1778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19154343008995056, |
| "step": 4485, |
| "valid_targets_mean": 2281.2, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 4.716386554621849, |
| "grad_norm": 0.82056252467419, |
| "learning_rate": 1.1637153963878815e-05, |
| "loss": 0.1817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19052766263484955, |
| "step": 4490, |
| "valid_targets_mean": 2145.5, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 4.7216386554621845, |
| "grad_norm": 0.7301286521046133, |
| "learning_rate": 1.1589596166691231e-05, |
| "loss": 0.1766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1829635053873062, |
| "step": 4495, |
| "valid_targets_mean": 2482.4, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 4.726890756302521, |
| "grad_norm": 0.7903970658437431, |
| "learning_rate": 1.1542096071157012e-05, |
| "loss": 0.1753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1784076690673828, |
| "step": 4500, |
| "valid_targets_mean": 2605.2, |
| "valid_targets_min": 950 |
| }, |
| { |
| "epoch": 4.732142857142857, |
| "grad_norm": 0.7637658355202966, |
| "learning_rate": 1.1494654003162285e-05, |
| "loss": 0.1745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18634071946144104, |
| "step": 4505, |
| "valid_targets_mean": 2553.0, |
| "valid_targets_min": 950 |
| }, |
| { |
| "epoch": 4.737394957983193, |
| "grad_norm": 0.7221781006332623, |
| "learning_rate": 1.1447270288195089e-05, |
| "loss": 0.1778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17665636539459229, |
| "step": 4510, |
| "valid_targets_mean": 2349.6, |
| "valid_targets_min": 847 |
| }, |
| { |
| "epoch": 4.742647058823529, |
| "grad_norm": 0.720008738864535, |
| "learning_rate": 1.1399945251343114e-05, |
| "loss": 0.1815, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.183954656124115, |
| "step": 4515, |
| "valid_targets_mean": 2651.1, |
| "valid_targets_min": 963 |
| }, |
| { |
| "epoch": 4.7478991596638656, |
| "grad_norm": 0.7439764441972336, |
| "learning_rate": 1.1352679217291457e-05, |
| "loss": 0.1842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18053632974624634, |
| "step": 4520, |
| "valid_targets_mean": 2257.0, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 4.753151260504202, |
| "grad_norm": 0.6873632051406735, |
| "learning_rate": 1.1305472510320419e-05, |
| "loss": 0.1783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16327188909053802, |
| "step": 4525, |
| "valid_targets_mean": 2640.4, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 4.758403361344538, |
| "grad_norm": 0.7442947567531205, |
| "learning_rate": 1.1258325454303286e-05, |
| "loss": 0.195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1675795316696167, |
| "step": 4530, |
| "valid_targets_mean": 2390.1, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 4.7636554621848735, |
| "grad_norm": 0.7354254137750549, |
| "learning_rate": 1.1211238372704073e-05, |
| "loss": 0.1887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17392656207084656, |
| "step": 4535, |
| "valid_targets_mean": 2248.0, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 4.76890756302521, |
| "grad_norm": 0.7224478673738945, |
| "learning_rate": 1.1164211588575339e-05, |
| "loss": 0.1845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16614243388175964, |
| "step": 4540, |
| "valid_targets_mean": 2204.6, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 4.774159663865547, |
| "grad_norm": 0.6780397730456732, |
| "learning_rate": 1.1117245424555967e-05, |
| "loss": 0.1836, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17192646861076355, |
| "step": 4545, |
| "valid_targets_mean": 2732.8, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 4.779411764705882, |
| "grad_norm": 0.8114966919737321, |
| "learning_rate": 1.1070340202868915e-05, |
| "loss": 0.1715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16627684235572815, |
| "step": 4550, |
| "valid_targets_mean": 2037.4, |
| "valid_targets_min": 832 |
| }, |
| { |
| "epoch": 4.784663865546219, |
| "grad_norm": 0.7089064475714499, |
| "learning_rate": 1.1023496245319056e-05, |
| "loss": 0.1743, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20096446573734283, |
| "step": 4555, |
| "valid_targets_mean": 3190.9, |
| "valid_targets_min": 1018 |
| }, |
| { |
| "epoch": 4.7899159663865545, |
| "grad_norm": 0.7629594666078792, |
| "learning_rate": 1.0976713873290925e-05, |
| "loss": 0.1789, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18434454500675201, |
| "step": 4560, |
| "valid_targets_mean": 2231.0, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 4.795168067226891, |
| "grad_norm": 0.7206103511159119, |
| "learning_rate": 1.0929993407746543e-05, |
| "loss": 0.1787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1781184822320938, |
| "step": 4565, |
| "valid_targets_mean": 2413.1, |
| "valid_targets_min": 924 |
| }, |
| { |
| "epoch": 4.800420168067227, |
| "grad_norm": 0.7319103361120156, |
| "learning_rate": 1.0883335169223212e-05, |
| "loss": 0.181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19576598703861237, |
| "step": 4570, |
| "valid_targets_mean": 2644.1, |
| "valid_targets_min": 1339 |
| }, |
| { |
| "epoch": 4.805672268907563, |
| "grad_norm": 0.7224561194750161, |
| "learning_rate": 1.0836739477831297e-05, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16441801190376282, |
| "step": 4575, |
| "valid_targets_mean": 2237.8, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 4.810924369747899, |
| "grad_norm": 0.8825086906465849, |
| "learning_rate": 1.0790206653252055e-05, |
| "loss": 0.169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18621914088726044, |
| "step": 4580, |
| "valid_targets_mean": 2011.2, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 4.8161764705882355, |
| "grad_norm": 0.6887944713418872, |
| "learning_rate": 1.0743737014735434e-05, |
| "loss": 0.1796, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18349093198776245, |
| "step": 4585, |
| "valid_targets_mean": 2805.9, |
| "valid_targets_min": 595 |
| }, |
| { |
| "epoch": 4.821428571428571, |
| "grad_norm": 0.8266516711323478, |
| "learning_rate": 1.0697330881097857e-05, |
| "loss": 0.1889, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18345323204994202, |
| "step": 4590, |
| "valid_targets_mean": 2207.9, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 4.826680672268908, |
| "grad_norm": 0.7454608401910962, |
| "learning_rate": 1.0650988570720077e-05, |
| "loss": 0.1695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16886943578720093, |
| "step": 4595, |
| "valid_targets_mean": 2130.4, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 4.831932773109243, |
| "grad_norm": 0.7525541827091601, |
| "learning_rate": 1.0604710401544963e-05, |
| "loss": 0.1889, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2049073427915573, |
| "step": 4600, |
| "valid_targets_mean": 2671.1, |
| "valid_targets_min": 938 |
| }, |
| { |
| "epoch": 4.83718487394958, |
| "grad_norm": 0.7221773649936342, |
| "learning_rate": 1.0558496691075318e-05, |
| "loss": 0.1874, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18932510912418365, |
| "step": 4605, |
| "valid_targets_mean": 2382.8, |
| "valid_targets_min": 533 |
| }, |
| { |
| "epoch": 4.842436974789916, |
| "grad_norm": 0.6282371291333917, |
| "learning_rate": 1.0512347756371726e-05, |
| "loss": 0.1732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18067455291748047, |
| "step": 4610, |
| "valid_targets_mean": 3488.6, |
| "valid_targets_min": 1483 |
| }, |
| { |
| "epoch": 4.847689075630252, |
| "grad_norm": 0.7736804746763539, |
| "learning_rate": 1.0466263914050362e-05, |
| "loss": 0.1866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.187209352850914, |
| "step": 4615, |
| "valid_targets_mean": 2130.1, |
| "valid_targets_min": 1190 |
| }, |
| { |
| "epoch": 4.852941176470588, |
| "grad_norm": 0.8194923770615844, |
| "learning_rate": 1.0420245480280804e-05, |
| "loss": 0.1711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19902583956718445, |
| "step": 4620, |
| "valid_targets_mean": 2030.2, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 4.858193277310924, |
| "grad_norm": 0.7237311731603411, |
| "learning_rate": 1.0374292770783891e-05, |
| "loss": 0.1885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18148672580718994, |
| "step": 4625, |
| "valid_targets_mean": 2961.3, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 4.86344537815126, |
| "grad_norm": 0.6669660493298567, |
| "learning_rate": 1.0328406100829542e-05, |
| "loss": 0.1876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17993488907814026, |
| "step": 4630, |
| "valid_targets_mean": 3014.6, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 4.868697478991597, |
| "grad_norm": 0.8700432106817276, |
| "learning_rate": 1.0282585785234578e-05, |
| "loss": 0.1833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18658801913261414, |
| "step": 4635, |
| "valid_targets_mean": 1932.2, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 4.873949579831933, |
| "grad_norm": 0.6217143473547485, |
| "learning_rate": 1.023683213836061e-05, |
| "loss": 0.1788, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1737050712108612, |
| "step": 4640, |
| "valid_targets_mean": 3531.2, |
| "valid_targets_min": 844 |
| }, |
| { |
| "epoch": 4.879201680672269, |
| "grad_norm": 0.9539626771397886, |
| "learning_rate": 1.0191145474111823e-05, |
| "loss": 0.1846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19349545240402222, |
| "step": 4645, |
| "valid_targets_mean": 1414.2, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 4.884453781512605, |
| "grad_norm": 0.6923182425799058, |
| "learning_rate": 1.0145526105932872e-05, |
| "loss": 0.1712, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16115731000900269, |
| "step": 4650, |
| "valid_targets_mean": 2663.4, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 4.889705882352941, |
| "grad_norm": 0.6914625755370188, |
| "learning_rate": 1.0099974346806714e-05, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1792561411857605, |
| "step": 4655, |
| "valid_targets_mean": 2781.5, |
| "valid_targets_min": 1252 |
| }, |
| { |
| "epoch": 4.894957983193278, |
| "grad_norm": 0.7734782088863728, |
| "learning_rate": 1.0054490509252423e-05, |
| "loss": 0.191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20624291896820068, |
| "step": 4660, |
| "valid_targets_mean": 2440.4, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 4.900210084033613, |
| "grad_norm": 0.7941952415974891, |
| "learning_rate": 1.0009074905323118e-05, |
| "loss": 0.1686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17345239222049713, |
| "step": 4665, |
| "valid_targets_mean": 2916.6, |
| "valid_targets_min": 1297 |
| }, |
| { |
| "epoch": 4.90546218487395, |
| "grad_norm": 0.8030163177897169, |
| "learning_rate": 9.963727846603784e-06, |
| "loss": 0.1794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18559759855270386, |
| "step": 4670, |
| "valid_targets_mean": 2144.8, |
| "valid_targets_min": 987 |
| }, |
| { |
| "epoch": 4.910714285714286, |
| "grad_norm": 0.7030553547126519, |
| "learning_rate": 9.918449644209087e-06, |
| "loss": 0.1852, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18912020325660706, |
| "step": 4675, |
| "valid_targets_mean": 2720.7, |
| "valid_targets_min": 1084 |
| }, |
| { |
| "epoch": 4.915966386554622, |
| "grad_norm": 0.6845418285443712, |
| "learning_rate": 9.873240608781341e-06, |
| "loss": 0.182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.202968031167984, |
| "step": 4680, |
| "valid_targets_mean": 3153.9, |
| "valid_targets_min": 1043 |
| }, |
| { |
| "epoch": 4.921218487394958, |
| "grad_norm": 0.7655672446200298, |
| "learning_rate": 9.828101050488308e-06, |
| "loss": 0.1873, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18019559979438782, |
| "step": 4685, |
| "valid_targets_mean": 1993.6, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 4.926470588235294, |
| "grad_norm": 0.7622908992963848, |
| "learning_rate": 9.783031279021063e-06, |
| "loss": 0.1795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19854578375816345, |
| "step": 4690, |
| "valid_targets_mean": 2434.5, |
| "valid_targets_min": 1013 |
| }, |
| { |
| "epoch": 4.93172268907563, |
| "grad_norm": 0.7356813022171075, |
| "learning_rate": 9.738031603591926e-06, |
| "loss": 0.1864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1860363483428955, |
| "step": 4695, |
| "valid_targets_mean": 2400.0, |
| "valid_targets_min": 934 |
| }, |
| { |
| "epoch": 4.936974789915967, |
| "grad_norm": 0.720810615748148, |
| "learning_rate": 9.69310233293227e-06, |
| "loss": 0.1853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1856434941291809, |
| "step": 4700, |
| "valid_targets_mean": 2621.8, |
| "valid_targets_min": 1276 |
| }, |
| { |
| "epoch": 4.942226890756302, |
| "grad_norm": 0.7063545010234002, |
| "learning_rate": 9.648243775290476e-06, |
| "loss": 0.1826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16022886335849762, |
| "step": 4705, |
| "valid_targets_mean": 2576.8, |
| "valid_targets_min": 1221 |
| }, |
| { |
| "epoch": 4.947478991596639, |
| "grad_norm": 0.7386993073314914, |
| "learning_rate": 9.60345623842974e-06, |
| "loss": 0.1793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17438361048698425, |
| "step": 4710, |
| "valid_targets_mean": 2572.9, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 4.9527310924369745, |
| "grad_norm": 0.7347227314045449, |
| "learning_rate": 9.558740029626046e-06, |
| "loss": 0.1749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1749304234981537, |
| "step": 4715, |
| "valid_targets_mean": 2584.6, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 4.957983193277311, |
| "grad_norm": 0.728403778635231, |
| "learning_rate": 9.51409545566597e-06, |
| "loss": 0.1797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18584081530570984, |
| "step": 4720, |
| "valid_targets_mean": 2500.6, |
| "valid_targets_min": 660 |
| }, |
| { |
| "epoch": 4.963235294117647, |
| "grad_norm": 0.7578264772501891, |
| "learning_rate": 9.469522822844663e-06, |
| "loss": 0.1826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1682163029909134, |
| "step": 4725, |
| "valid_targets_mean": 2061.4, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 4.968487394957983, |
| "grad_norm": 0.7750388844604879, |
| "learning_rate": 9.425022436963664e-06, |
| "loss": 0.1932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19586464762687683, |
| "step": 4730, |
| "valid_targets_mean": 2407.8, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 4.973739495798319, |
| "grad_norm": 0.7766444281597565, |
| "learning_rate": 9.380594603328875e-06, |
| "loss": 0.1984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2102508395910263, |
| "step": 4735, |
| "valid_targets_mean": 2843.3, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 4.9789915966386555, |
| "grad_norm": 0.760942443434771, |
| "learning_rate": 9.336239626748432e-06, |
| "loss": 0.1806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17757880687713623, |
| "step": 4740, |
| "valid_targets_mean": 2666.6, |
| "valid_targets_min": 825 |
| }, |
| { |
| "epoch": 4.984243697478991, |
| "grad_norm": 0.7731058692289628, |
| "learning_rate": 9.291957811530602e-06, |
| "loss": 0.1837, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18547788262367249, |
| "step": 4745, |
| "valid_targets_mean": 2214.3, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 4.989495798319328, |
| "grad_norm": 0.700031528165842, |
| "learning_rate": 9.247749461481712e-06, |
| "loss": 0.1696, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18496280908584595, |
| "step": 4750, |
| "valid_targets_mean": 2794.8, |
| "valid_targets_min": 945 |
| }, |
| { |
| "epoch": 4.994747899159664, |
| "grad_norm": 0.6273143784305558, |
| "learning_rate": 9.203614879904083e-06, |
| "loss": 0.1798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15987840294837952, |
| "step": 4755, |
| "valid_targets_mean": 3185.1, |
| "valid_targets_min": 1250 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.6788365442881951, |
| "learning_rate": 9.159554369593901e-06, |
| "loss": 0.1866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17320957779884338, |
| "step": 4760, |
| "valid_targets_mean": 2633.3, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 5.005252100840337, |
| "grad_norm": 0.7483605516753753, |
| "learning_rate": 9.115568232839193e-06, |
| "loss": 0.1509, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12966476380825043, |
| "step": 4765, |
| "valid_targets_mean": 1753.9, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 5.010504201680672, |
| "grad_norm": 0.7211521050334696, |
| "learning_rate": 9.071656771417721e-06, |
| "loss": 0.1588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16123877465724945, |
| "step": 4770, |
| "valid_targets_mean": 2470.6, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 5.015756302521009, |
| "grad_norm": 0.7296273456769096, |
| "learning_rate": 9.027820286594902e-06, |
| "loss": 0.1619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14505019783973694, |
| "step": 4775, |
| "valid_targets_mean": 2658.1, |
| "valid_targets_min": 1128 |
| }, |
| { |
| "epoch": 5.0210084033613445, |
| "grad_norm": 0.7817862758275839, |
| "learning_rate": 8.984059079121785e-06, |
| "loss": 0.1634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15351414680480957, |
| "step": 4780, |
| "valid_targets_mean": 2114.3, |
| "valid_targets_min": 589 |
| }, |
| { |
| "epoch": 5.026260504201681, |
| "grad_norm": 0.7668268893222531, |
| "learning_rate": 8.940373449232935e-06, |
| "loss": 0.1666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16739562153816223, |
| "step": 4785, |
| "valid_targets_mean": 2364.6, |
| "valid_targets_min": 802 |
| }, |
| { |
| "epoch": 5.031512605042017, |
| "grad_norm": 0.820070132627084, |
| "learning_rate": 8.896763696644405e-06, |
| "loss": 0.1568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15973633527755737, |
| "step": 4790, |
| "valid_targets_mean": 1928.4, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 5.036764705882353, |
| "grad_norm": 0.7252481874686856, |
| "learning_rate": 8.853230120551693e-06, |
| "loss": 0.1583, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14669166505336761, |
| "step": 4795, |
| "valid_targets_mean": 2317.4, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 5.042016806722689, |
| "grad_norm": 0.8044647525929012, |
| "learning_rate": 8.809773019627635e-06, |
| "loss": 0.1566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17486470937728882, |
| "step": 4800, |
| "valid_targets_mean": 2453.2, |
| "valid_targets_min": 864 |
| }, |
| { |
| "epoch": 5.0472689075630255, |
| "grad_norm": 0.7168891105498033, |
| "learning_rate": 8.766392692020413e-06, |
| "loss": 0.1741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16313612461090088, |
| "step": 4805, |
| "valid_targets_mean": 3045.1, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 5.052521008403361, |
| "grad_norm": 0.8391271783579383, |
| "learning_rate": 8.723089435351497e-06, |
| "loss": 0.1626, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17179730534553528, |
| "step": 4810, |
| "valid_targets_mean": 2010.1, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 5.057773109243698, |
| "grad_norm": 0.7301522003326225, |
| "learning_rate": 8.679863546713559e-06, |
| "loss": 0.1576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17533841729164124, |
| "step": 4815, |
| "valid_targets_mean": 3249.5, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 5.063025210084033, |
| "grad_norm": 0.886339846842999, |
| "learning_rate": 8.636715322668498e-06, |
| "loss": 0.1679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16565924882888794, |
| "step": 4820, |
| "valid_targets_mean": 2003.6, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 5.06827731092437, |
| "grad_norm": 0.7726449898609571, |
| "learning_rate": 8.593645059245365e-06, |
| "loss": 0.1668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15337593853473663, |
| "step": 4825, |
| "valid_targets_mean": 2167.6, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 5.073529411764706, |
| "grad_norm": 0.7695203697189681, |
| "learning_rate": 8.550653051938333e-06, |
| "loss": 0.1626, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1670958697795868, |
| "step": 4830, |
| "valid_targets_mean": 2386.7, |
| "valid_targets_min": 755 |
| }, |
| { |
| "epoch": 5.078781512605042, |
| "grad_norm": 0.8074962356870891, |
| "learning_rate": 8.507739595704695e-06, |
| "loss": 0.1523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1489427387714386, |
| "step": 4835, |
| "valid_targets_mean": 2025.5, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 5.084033613445378, |
| "grad_norm": 0.8716776759288114, |
| "learning_rate": 8.464904984962832e-06, |
| "loss": 0.1634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16994109749794006, |
| "step": 4840, |
| "valid_targets_mean": 2000.9, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 5.089285714285714, |
| "grad_norm": 0.8076509459810718, |
| "learning_rate": 8.422149513590151e-06, |
| "loss": 0.1732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17325329780578613, |
| "step": 4845, |
| "valid_targets_mean": 2370.3, |
| "valid_targets_min": 537 |
| }, |
| { |
| "epoch": 5.09453781512605, |
| "grad_norm": 0.8070190471856774, |
| "learning_rate": 8.37947347492115e-06, |
| "loss": 0.1618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15762285888195038, |
| "step": 4850, |
| "valid_targets_mean": 2040.4, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 5.099789915966387, |
| "grad_norm": 0.74092533277044, |
| "learning_rate": 8.33687716174532e-06, |
| "loss": 0.1603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16209125518798828, |
| "step": 4855, |
| "valid_targets_mean": 2598.8, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 5.105042016806722, |
| "grad_norm": 0.860251504616201, |
| "learning_rate": 8.294360866305192e-06, |
| "loss": 0.1628, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15497906506061554, |
| "step": 4860, |
| "valid_targets_mean": 2211.9, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 5.110294117647059, |
| "grad_norm": 0.7907729718003471, |
| "learning_rate": 8.251924880294317e-06, |
| "loss": 0.1666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16414563357830048, |
| "step": 4865, |
| "valid_targets_mean": 2080.1, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 5.1155462184873945, |
| "grad_norm": 0.8047837776866085, |
| "learning_rate": 8.20956949485527e-06, |
| "loss": 0.1599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15285125374794006, |
| "step": 4870, |
| "valid_targets_mean": 1991.6, |
| "valid_targets_min": 571 |
| }, |
| { |
| "epoch": 5.120798319327731, |
| "grad_norm": 0.7304681966773338, |
| "learning_rate": 8.167295000577622e-06, |
| "loss": 0.1693, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15932945907115936, |
| "step": 4875, |
| "valid_targets_mean": 2356.6, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 5.126050420168067, |
| "grad_norm": 0.7843064737707304, |
| "learning_rate": 8.125101687496e-06, |
| "loss": 0.1662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1509605348110199, |
| "step": 4880, |
| "valid_targets_mean": 2156.1, |
| "valid_targets_min": 945 |
| }, |
| { |
| "epoch": 5.131302521008403, |
| "grad_norm": 0.6507131542748491, |
| "learning_rate": 8.082989845088038e-06, |
| "loss": 0.1609, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.168035089969635, |
| "step": 4885, |
| "valid_targets_mean": 3697.9, |
| "valid_targets_min": 1139 |
| }, |
| { |
| "epoch": 5.13655462184874, |
| "grad_norm": 0.7983692941356186, |
| "learning_rate": 8.040959762272441e-06, |
| "loss": 0.1711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17778906226158142, |
| "step": 4890, |
| "valid_targets_mean": 2277.1, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 5.141806722689076, |
| "grad_norm": 0.717526944817668, |
| "learning_rate": 7.999011727406995e-06, |
| "loss": 0.1605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1474049985408783, |
| "step": 4895, |
| "valid_targets_mean": 3174.6, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 5.147058823529412, |
| "grad_norm": 0.6501295927520986, |
| "learning_rate": 7.957146028286524e-06, |
| "loss": 0.159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15974193811416626, |
| "step": 4900, |
| "valid_targets_mean": 3719.8, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 5.152310924369748, |
| "grad_norm": 0.7634163772813823, |
| "learning_rate": 7.915362952141017e-06, |
| "loss": 0.1627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13993379473686218, |
| "step": 4905, |
| "valid_targets_mean": 2612.3, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 5.157563025210084, |
| "grad_norm": 0.8229169359259055, |
| "learning_rate": 7.873662785633594e-06, |
| "loss": 0.1627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17392058670520782, |
| "step": 4910, |
| "valid_targets_mean": 2420.1, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 5.16281512605042, |
| "grad_norm": 0.8391334241227872, |
| "learning_rate": 7.832045814858538e-06, |
| "loss": 0.1662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15847104787826538, |
| "step": 4915, |
| "valid_targets_mean": 2340.0, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 5.168067226890757, |
| "grad_norm": 0.7113772435226458, |
| "learning_rate": 7.790512325339367e-06, |
| "loss": 0.1679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17543965578079224, |
| "step": 4920, |
| "valid_targets_mean": 2999.2, |
| "valid_targets_min": 1254 |
| }, |
| { |
| "epoch": 5.173319327731092, |
| "grad_norm": 0.8373320616460568, |
| "learning_rate": 7.74906260202685e-06, |
| "loss": 0.1666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16569611430168152, |
| "step": 4925, |
| "valid_targets_mean": 2456.8, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 5.178571428571429, |
| "grad_norm": 0.756975477682416, |
| "learning_rate": 7.707696929297053e-06, |
| "loss": 0.162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15648490190505981, |
| "step": 4930, |
| "valid_targets_mean": 2480.5, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 5.1838235294117645, |
| "grad_norm": 0.841074398063682, |
| "learning_rate": 7.666415590949382e-06, |
| "loss": 0.1585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16663537919521332, |
| "step": 4935, |
| "valid_targets_mean": 2205.2, |
| "valid_targets_min": 817 |
| }, |
| { |
| "epoch": 5.189075630252101, |
| "grad_norm": 0.8588889722655582, |
| "learning_rate": 7.625218870204676e-06, |
| "loss": 0.1608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16082826256752014, |
| "step": 4940, |
| "valid_targets_mean": 2507.4, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 5.194327731092437, |
| "grad_norm": 0.7390042440173223, |
| "learning_rate": 7.584107049703195e-06, |
| "loss": 0.1645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15865691006183624, |
| "step": 4945, |
| "valid_targets_mean": 2532.7, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 5.199579831932773, |
| "grad_norm": 0.7806217716341791, |
| "learning_rate": 7.5430804115027615e-06, |
| "loss": 0.1606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15922147035598755, |
| "step": 4950, |
| "valid_targets_mean": 2130.4, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 5.204831932773109, |
| "grad_norm": 0.6872497366416, |
| "learning_rate": 7.502139237076744e-06, |
| "loss": 0.1603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16006314754486084, |
| "step": 4955, |
| "valid_targets_mean": 3239.2, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 5.2100840336134455, |
| "grad_norm": 0.8265925780625734, |
| "learning_rate": 7.461283807312194e-06, |
| "loss": 0.159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15462356805801392, |
| "step": 4960, |
| "valid_targets_mean": 2074.3, |
| "valid_targets_min": 736 |
| }, |
| { |
| "epoch": 5.215336134453781, |
| "grad_norm": 0.8400103721164567, |
| "learning_rate": 7.420514402507886e-06, |
| "loss": 0.1716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16285106539726257, |
| "step": 4965, |
| "valid_targets_mean": 2134.1, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 5.220588235294118, |
| "grad_norm": 0.7819781182832531, |
| "learning_rate": 7.379831302372389e-06, |
| "loss": 0.1633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15541312098503113, |
| "step": 4970, |
| "valid_targets_mean": 2262.2, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 5.225840336134453, |
| "grad_norm": 0.8105251128609028, |
| "learning_rate": 7.3392347860221556e-06, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16982173919677734, |
| "step": 4975, |
| "valid_targets_mean": 2223.4, |
| "valid_targets_min": 999 |
| }, |
| { |
| "epoch": 5.23109243697479, |
| "grad_norm": 0.6863440387762159, |
| "learning_rate": 7.298725131979629e-06, |
| "loss": 0.1632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15579064190387726, |
| "step": 4980, |
| "valid_targets_mean": 3175.9, |
| "valid_targets_min": 1177 |
| }, |
| { |
| "epoch": 5.236344537815126, |
| "grad_norm": 0.7441930568222063, |
| "learning_rate": 7.258302618171287e-06, |
| "loss": 0.1701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1511012315750122, |
| "step": 4985, |
| "valid_targets_mean": 2616.9, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 5.241596638655462, |
| "grad_norm": 0.7374029049491165, |
| "learning_rate": 7.217967521925775e-06, |
| "loss": 0.1621, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16436655819416046, |
| "step": 4990, |
| "valid_targets_mean": 2690.6, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 5.246848739495798, |
| "grad_norm": 0.7497430314524601, |
| "learning_rate": 7.177720119971998e-06, |
| "loss": 0.1527, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17379173636436462, |
| "step": 4995, |
| "valid_targets_mean": 2911.5, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 5.2521008403361344, |
| "grad_norm": 0.7942479630297596, |
| "learning_rate": 7.137560688437184e-06, |
| "loss": 0.1658, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1384781152009964, |
| "step": 5000, |
| "valid_targets_mean": 1960.1, |
| "valid_targets_min": 765 |
| }, |
| { |
| "epoch": 5.257352941176471, |
| "grad_norm": 0.6952857832526612, |
| "learning_rate": 7.097489502845047e-06, |
| "loss": 0.1552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12435892224311829, |
| "step": 5005, |
| "valid_targets_mean": 2232.8, |
| "valid_targets_min": 420 |
| }, |
| { |
| "epoch": 5.262605042016807, |
| "grad_norm": 0.7259264839559267, |
| "learning_rate": 7.0575068381138525e-06, |
| "loss": 0.1608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15408116579055786, |
| "step": 5010, |
| "valid_targets_mean": 2326.8, |
| "valid_targets_min": 1105 |
| }, |
| { |
| "epoch": 5.267857142857143, |
| "grad_norm": 0.6907832100331577, |
| "learning_rate": 7.0176129685545414e-06, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1581760197877884, |
| "step": 5015, |
| "valid_targets_mean": 2910.8, |
| "valid_targets_min": 643 |
| }, |
| { |
| "epoch": 5.273109243697479, |
| "grad_norm": 0.7359189102249872, |
| "learning_rate": 6.977808167868867e-06, |
| "loss": 0.1655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1630137860774994, |
| "step": 5020, |
| "valid_targets_mean": 3007.1, |
| "valid_targets_min": 1082 |
| }, |
| { |
| "epoch": 5.2783613445378155, |
| "grad_norm": 0.7813513338182236, |
| "learning_rate": 6.9380927091475085e-06, |
| "loss": 0.1568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16749534010887146, |
| "step": 5025, |
| "valid_targets_mean": 2539.6, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 5.283613445378151, |
| "grad_norm": 0.7597593894886342, |
| "learning_rate": 6.898466864868165e-06, |
| "loss": 0.1606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16621197760105133, |
| "step": 5030, |
| "valid_targets_mean": 2721.4, |
| "valid_targets_min": 1009 |
| }, |
| { |
| "epoch": 5.288865546218488, |
| "grad_norm": 0.7182742303119539, |
| "learning_rate": 6.858930906893751e-06, |
| "loss": 0.1631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15185761451721191, |
| "step": 5035, |
| "valid_targets_mean": 2491.1, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 5.294117647058823, |
| "grad_norm": 0.8593841083426136, |
| "learning_rate": 6.819485106470454e-06, |
| "loss": 0.1597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15788263082504272, |
| "step": 5040, |
| "valid_targets_mean": 1728.0, |
| "valid_targets_min": 846 |
| }, |
| { |
| "epoch": 5.29936974789916, |
| "grad_norm": 0.8035500930290126, |
| "learning_rate": 6.780129734225949e-06, |
| "loss": 0.1486, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15254664421081543, |
| "step": 5045, |
| "valid_targets_mean": 2170.8, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 5.304621848739496, |
| "grad_norm": 0.8459834255980975, |
| "learning_rate": 6.740865060167483e-06, |
| "loss": 0.1595, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16684821248054504, |
| "step": 5050, |
| "valid_targets_mean": 1869.9, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 5.309873949579832, |
| "grad_norm": 0.7852698744711136, |
| "learning_rate": 6.701691353680049e-06, |
| "loss": 0.1664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1623380482196808, |
| "step": 5055, |
| "valid_targets_mean": 2586.2, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 5.315126050420168, |
| "grad_norm": 0.7811887298191118, |
| "learning_rate": 6.662608883524542e-06, |
| "loss": 0.155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13154323399066925, |
| "step": 5060, |
| "valid_targets_mean": 1648.8, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 5.320378151260504, |
| "grad_norm": 0.660895377255489, |
| "learning_rate": 6.6236179178359115e-06, |
| "loss": 0.1642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15457244217395782, |
| "step": 5065, |
| "valid_targets_mean": 3175.9, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 5.32563025210084, |
| "grad_norm": 0.7245039671860787, |
| "learning_rate": 6.5847187241213e-06, |
| "loss": 0.1534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14748461544513702, |
| "step": 5070, |
| "valid_targets_mean": 2657.9, |
| "valid_targets_min": 878 |
| }, |
| { |
| "epoch": 5.330882352941177, |
| "grad_norm": 0.7753382710745726, |
| "learning_rate": 6.5459115692582386e-06, |
| "loss": 0.1565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16546081006526947, |
| "step": 5075, |
| "valid_targets_mean": 2395.2, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 5.336134453781512, |
| "grad_norm": 0.7698920766313514, |
| "learning_rate": 6.507196719492819e-06, |
| "loss": 0.1547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1609654426574707, |
| "step": 5080, |
| "valid_targets_mean": 2615.0, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 5.341386554621849, |
| "grad_norm": 0.8553168767751825, |
| "learning_rate": 6.468574440437801e-06, |
| "loss": 0.1612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15425896644592285, |
| "step": 5085, |
| "valid_targets_mean": 1917.0, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 5.3466386554621845, |
| "grad_norm": 0.7379979219387762, |
| "learning_rate": 6.43004499707089e-06, |
| "loss": 0.1704, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18386310338974, |
| "step": 5090, |
| "valid_targets_mean": 2954.1, |
| "valid_targets_min": 917 |
| }, |
| { |
| "epoch": 5.351890756302521, |
| "grad_norm": 0.800532265924272, |
| "learning_rate": 6.3916086537328545e-06, |
| "loss": 0.1569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1512497365474701, |
| "step": 5095, |
| "valid_targets_mean": 2645.6, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 5.357142857142857, |
| "grad_norm": 0.7258456117778306, |
| "learning_rate": 6.3532656741257145e-06, |
| "loss": 0.1597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15273120999336243, |
| "step": 5100, |
| "valid_targets_mean": 2574.7, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 5.362394957983193, |
| "grad_norm": 0.732365954356259, |
| "learning_rate": 6.315016321310965e-06, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16224431991577148, |
| "step": 5105, |
| "valid_targets_mean": 2581.6, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 5.367647058823529, |
| "grad_norm": 0.7789962344565333, |
| "learning_rate": 6.276860857707727e-06, |
| "loss": 0.1719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17684108018875122, |
| "step": 5110, |
| "valid_targets_mean": 2496.4, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 5.3728991596638656, |
| "grad_norm": 0.8532814228814727, |
| "learning_rate": 6.238799545090994e-06, |
| "loss": 0.1649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1521385908126831, |
| "step": 5115, |
| "valid_targets_mean": 2414.0, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 5.378151260504202, |
| "grad_norm": 0.7899952744078172, |
| "learning_rate": 6.20083264458981e-06, |
| "loss": 0.1474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1502818763256073, |
| "step": 5120, |
| "valid_targets_mean": 2204.8, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 5.383403361344538, |
| "grad_norm": 0.6387635570636864, |
| "learning_rate": 6.162960416685469e-06, |
| "loss": 0.1602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1471373438835144, |
| "step": 5125, |
| "valid_targets_mean": 3084.1, |
| "valid_targets_min": 1468 |
| }, |
| { |
| "epoch": 5.388655462184874, |
| "grad_norm": 0.8485693482893446, |
| "learning_rate": 6.125183121209741e-06, |
| "loss": 0.1578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1780264526605606, |
| "step": 5130, |
| "valid_targets_mean": 2274.9, |
| "valid_targets_min": 1094 |
| }, |
| { |
| "epoch": 5.39390756302521, |
| "grad_norm": 0.7495677095087009, |
| "learning_rate": 6.087501017343107e-06, |
| "loss": 0.1644, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15651904046535492, |
| "step": 5135, |
| "valid_targets_mean": 2542.9, |
| "valid_targets_min": 763 |
| }, |
| { |
| "epoch": 5.399159663865547, |
| "grad_norm": 0.7435758493446045, |
| "learning_rate": 6.0499143636129384e-06, |
| "loss": 0.163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1455836445093155, |
| "step": 5140, |
| "valid_targets_mean": 2512.5, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 5.404411764705882, |
| "grad_norm": 0.8993390562265813, |
| "learning_rate": 6.012423417891766e-06, |
| "loss": 0.1672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17336681485176086, |
| "step": 5145, |
| "valid_targets_mean": 2680.2, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 5.409663865546219, |
| "grad_norm": 0.8004525963625007, |
| "learning_rate": 5.975028437395493e-06, |
| "loss": 0.1648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15126681327819824, |
| "step": 5150, |
| "valid_targets_mean": 2013.7, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 5.4149159663865545, |
| "grad_norm": 0.7799255786777086, |
| "learning_rate": 5.937729678681612e-06, |
| "loss": 0.1576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15724611282348633, |
| "step": 5155, |
| "valid_targets_mean": 2525.8, |
| "valid_targets_min": 1280 |
| }, |
| { |
| "epoch": 5.420168067226891, |
| "grad_norm": 0.7841845158497852, |
| "learning_rate": 5.9005273976474684e-06, |
| "loss": 0.171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15903203189373016, |
| "step": 5160, |
| "valid_targets_mean": 2379.1, |
| "valid_targets_min": 1163 |
| }, |
| { |
| "epoch": 5.425420168067227, |
| "grad_norm": 0.6717665505168996, |
| "learning_rate": 5.8634218495285126e-06, |
| "loss": 0.1577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14495673775672913, |
| "step": 5165, |
| "valid_targets_mean": 2827.6, |
| "valid_targets_min": 1100 |
| }, |
| { |
| "epoch": 5.430672268907563, |
| "grad_norm": 0.8298875239928819, |
| "learning_rate": 5.8264132888965155e-06, |
| "loss": 0.1552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14547504484653473, |
| "step": 5170, |
| "valid_targets_mean": 2200.4, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 5.435924369747899, |
| "grad_norm": 0.7078895304712665, |
| "learning_rate": 5.789501969657853e-06, |
| "loss": 0.1562, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14443817734718323, |
| "step": 5175, |
| "valid_targets_mean": 2713.6, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 5.4411764705882355, |
| "grad_norm": 0.7468395911409705, |
| "learning_rate": 5.752688145051761e-06, |
| "loss": 0.1645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15606167912483215, |
| "step": 5180, |
| "valid_targets_mean": 2896.7, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 5.446428571428571, |
| "grad_norm": 0.7339528998149712, |
| "learning_rate": 5.715972067648561e-06, |
| "loss": 0.1598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16431309282779694, |
| "step": 5185, |
| "valid_targets_mean": 2671.4, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 5.451680672268908, |
| "grad_norm": 0.7898995773556446, |
| "learning_rate": 5.679353989347989e-06, |
| "loss": 0.1562, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14948245882987976, |
| "step": 5190, |
| "valid_targets_mean": 2137.9, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 5.456932773109243, |
| "grad_norm": 0.8149040646058742, |
| "learning_rate": 5.642834161377408e-06, |
| "loss": 0.1599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16367627680301666, |
| "step": 5195, |
| "valid_targets_mean": 2087.3, |
| "valid_targets_min": 1040 |
| }, |
| { |
| "epoch": 5.46218487394958, |
| "grad_norm": 0.6719154088237885, |
| "learning_rate": 5.606412834290121e-06, |
| "loss": 0.1574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14343780279159546, |
| "step": 5200, |
| "valid_targets_mean": 3016.2, |
| "valid_targets_min": 1041 |
| }, |
| { |
| "epoch": 5.467436974789916, |
| "grad_norm": 0.8508194897949711, |
| "learning_rate": 5.570090257963645e-06, |
| "loss": 0.1638, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16275382041931152, |
| "step": 5205, |
| "valid_targets_mean": 1842.1, |
| "valid_targets_min": 1076 |
| }, |
| { |
| "epoch": 5.472689075630252, |
| "grad_norm": 0.7598842769868193, |
| "learning_rate": 5.533866681597981e-06, |
| "loss": 0.155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1676841378211975, |
| "step": 5210, |
| "valid_targets_mean": 2668.4, |
| "valid_targets_min": 900 |
| }, |
| { |
| "epoch": 5.477941176470588, |
| "grad_norm": 0.8473153688144975, |
| "learning_rate": 5.497742353713928e-06, |
| "loss": 0.1689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17238308489322662, |
| "step": 5215, |
| "valid_targets_mean": 2029.6, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 5.483193277310924, |
| "grad_norm": 0.737492773817561, |
| "learning_rate": 5.461717522151371e-06, |
| "loss": 0.1524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15577836334705353, |
| "step": 5220, |
| "valid_targets_mean": 2799.9, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 5.48844537815126, |
| "grad_norm": 0.7013802768068832, |
| "learning_rate": 5.4257924340675535e-06, |
| "loss": 0.1649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16768768429756165, |
| "step": 5225, |
| "valid_targets_mean": 3200.6, |
| "valid_targets_min": 1303 |
| }, |
| { |
| "epoch": 5.493697478991597, |
| "grad_norm": 0.6898526895385486, |
| "learning_rate": 5.389967335935429e-06, |
| "loss": 0.1524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15428847074508667, |
| "step": 5230, |
| "valid_targets_mean": 2979.0, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 5.498949579831933, |
| "grad_norm": 0.8269332396210477, |
| "learning_rate": 5.3542424735419306e-06, |
| "loss": 0.1662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1691667139530182, |
| "step": 5235, |
| "valid_targets_mean": 2126.2, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 5.504201680672269, |
| "grad_norm": 0.7582781505938827, |
| "learning_rate": 5.318618091986294e-06, |
| "loss": 0.1595, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16203898191452026, |
| "step": 5240, |
| "valid_targets_mean": 2414.2, |
| "valid_targets_min": 758 |
| }, |
| { |
| "epoch": 5.509453781512605, |
| "grad_norm": 0.964837540275934, |
| "learning_rate": 5.283094435678398e-06, |
| "loss": 0.1643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18285033106803894, |
| "step": 5245, |
| "valid_targets_mean": 2520.3, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 5.514705882352941, |
| "grad_norm": 0.7407984840086744, |
| "learning_rate": 5.2476717483370685e-06, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18044058978557587, |
| "step": 5250, |
| "valid_targets_mean": 2980.8, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 5.519957983193278, |
| "grad_norm": 0.670814241203273, |
| "learning_rate": 5.212350272988394e-06, |
| "loss": 0.1597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13862532377243042, |
| "step": 5255, |
| "valid_targets_mean": 2928.0, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 5.525210084033613, |
| "grad_norm": 0.7638249491401231, |
| "learning_rate": 5.177130251964088e-06, |
| "loss": 0.1669, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15651783347129822, |
| "step": 5260, |
| "valid_targets_mean": 2388.1, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 5.53046218487395, |
| "grad_norm": 0.7464606207804972, |
| "learning_rate": 5.1420119268998085e-06, |
| "loss": 0.1541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15144014358520508, |
| "step": 5265, |
| "valid_targets_mean": 2414.2, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 5.535714285714286, |
| "grad_norm": 0.6723804956667677, |
| "learning_rate": 5.106995538733488e-06, |
| "loss": 0.1481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12311984598636627, |
| "step": 5270, |
| "valid_targets_mean": 2505.5, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 5.540966386554622, |
| "grad_norm": 0.7514104012472849, |
| "learning_rate": 5.07208132770372e-06, |
| "loss": 0.1568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16300344467163086, |
| "step": 5275, |
| "valid_targets_mean": 2621.9, |
| "valid_targets_min": 1151 |
| }, |
| { |
| "epoch": 5.546218487394958, |
| "grad_norm": 0.8709704943028632, |
| "learning_rate": 5.037269533348075e-06, |
| "loss": 0.1651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15614300966262817, |
| "step": 5280, |
| "valid_targets_mean": 2086.8, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 5.551470588235294, |
| "grad_norm": 0.8145404233606028, |
| "learning_rate": 5.002560394501463e-06, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1704893410205841, |
| "step": 5285, |
| "valid_targets_mean": 2252.9, |
| "valid_targets_min": 816 |
| }, |
| { |
| "epoch": 5.55672268907563, |
| "grad_norm": 0.7858067778473078, |
| "learning_rate": 4.9679541492945135e-06, |
| "loss": 0.1585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17581012845039368, |
| "step": 5290, |
| "valid_targets_mean": 2497.4, |
| "valid_targets_min": 832 |
| }, |
| { |
| "epoch": 5.561974789915967, |
| "grad_norm": 0.7444934360144145, |
| "learning_rate": 4.933451035151913e-06, |
| "loss": 0.1596, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16977301239967346, |
| "step": 5295, |
| "valid_targets_mean": 2621.8, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 5.567226890756302, |
| "grad_norm": 0.7002188781201552, |
| "learning_rate": 4.899051288790806e-06, |
| "loss": 0.1643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15018996596336365, |
| "step": 5300, |
| "valid_targets_mean": 2713.4, |
| "valid_targets_min": 839 |
| }, |
| { |
| "epoch": 5.572478991596639, |
| "grad_norm": 0.7598676053646428, |
| "learning_rate": 4.86475514621916e-06, |
| "loss": 0.165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16991931200027466, |
| "step": 5305, |
| "valid_targets_mean": 2667.0, |
| "valid_targets_min": 900 |
| }, |
| { |
| "epoch": 5.5777310924369745, |
| "grad_norm": 0.8820515115776142, |
| "learning_rate": 4.830562842734112e-06, |
| "loss": 0.1591, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1688452661037445, |
| "step": 5310, |
| "valid_targets_mean": 2134.6, |
| "valid_targets_min": 903 |
| }, |
| { |
| "epoch": 5.582983193277311, |
| "grad_norm": 0.7149756144412622, |
| "learning_rate": 4.796474612920421e-06, |
| "loss": 0.1604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15258319675922394, |
| "step": 5315, |
| "valid_targets_mean": 2937.4, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 5.588235294117647, |
| "grad_norm": 0.6941030908245607, |
| "learning_rate": 4.762490690648813e-06, |
| "loss": 0.1652, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17828604578971863, |
| "step": 5320, |
| "valid_targets_mean": 3366.6, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 5.593487394957983, |
| "grad_norm": 0.7755309453396569, |
| "learning_rate": 4.728611309074374e-06, |
| "loss": 0.1583, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16606014966964722, |
| "step": 5325, |
| "valid_targets_mean": 2534.5, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 5.598739495798319, |
| "grad_norm": 0.7161574736206265, |
| "learning_rate": 4.694836700634975e-06, |
| "loss": 0.1648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1472625732421875, |
| "step": 5330, |
| "valid_targets_mean": 2363.2, |
| "valid_targets_min": 864 |
| }, |
| { |
| "epoch": 5.6039915966386555, |
| "grad_norm": 0.9658673174845026, |
| "learning_rate": 4.661167097049668e-06, |
| "loss": 0.1695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15956471860408783, |
| "step": 5335, |
| "valid_targets_mean": 2047.2, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 5.609243697478991, |
| "grad_norm": 0.8292596385955369, |
| "learning_rate": 4.62760272931708e-06, |
| "loss": 0.1604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16373419761657715, |
| "step": 5340, |
| "valid_targets_mean": 2055.4, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 5.614495798319328, |
| "grad_norm": 0.7872816299655447, |
| "learning_rate": 4.594143827713844e-06, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16614991426467896, |
| "step": 5345, |
| "valid_targets_mean": 2267.2, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 5.619747899159664, |
| "grad_norm": 0.6885239670075206, |
| "learning_rate": 4.56079062179303e-06, |
| "loss": 0.1614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1568869948387146, |
| "step": 5350, |
| "valid_targets_mean": 3092.1, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 5.625, |
| "grad_norm": 0.7063945748122799, |
| "learning_rate": 4.527543340382538e-06, |
| "loss": 0.1653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15817028284072876, |
| "step": 5355, |
| "valid_targets_mean": 3193.8, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 5.630252100840336, |
| "grad_norm": 0.7483586106813811, |
| "learning_rate": 4.494402211583569e-06, |
| "loss": 0.1674, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1763601005077362, |
| "step": 5360, |
| "valid_targets_mean": 2585.2, |
| "valid_targets_min": 702 |
| }, |
| { |
| "epoch": 5.635504201680672, |
| "grad_norm": 0.7266651690365762, |
| "learning_rate": 4.461367462769009e-06, |
| "loss": 0.1649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15703195333480835, |
| "step": 5365, |
| "valid_targets_mean": 2579.4, |
| "valid_targets_min": 943 |
| }, |
| { |
| "epoch": 5.640756302521009, |
| "grad_norm": 0.7723418200616802, |
| "learning_rate": 4.428439320581923e-06, |
| "loss": 0.1672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16179069876670837, |
| "step": 5370, |
| "valid_targets_mean": 2583.6, |
| "valid_targets_min": 1207 |
| }, |
| { |
| "epoch": 5.6460084033613445, |
| "grad_norm": 0.6951598907006209, |
| "learning_rate": 4.3956180109339705e-06, |
| "loss": 0.1631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15667061507701874, |
| "step": 5375, |
| "valid_targets_mean": 2790.9, |
| "valid_targets_min": 985 |
| }, |
| { |
| "epoch": 5.651260504201681, |
| "grad_norm": 0.7579446080195453, |
| "learning_rate": 4.362903759003849e-06, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15197469294071198, |
| "step": 5380, |
| "valid_targets_mean": 2506.1, |
| "valid_targets_min": 853 |
| }, |
| { |
| "epoch": 5.656512605042017, |
| "grad_norm": 0.7299857797114069, |
| "learning_rate": 4.33029678923576e-06, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1476059854030609, |
| "step": 5385, |
| "valid_targets_mean": 2806.4, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 5.661764705882353, |
| "grad_norm": 0.7781274130758863, |
| "learning_rate": 4.297797325337889e-06, |
| "loss": 0.1618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1483781933784485, |
| "step": 5390, |
| "valid_targets_mean": 2407.4, |
| "valid_targets_min": 1184 |
| }, |
| { |
| "epoch": 5.667016806722689, |
| "grad_norm": 0.7313088256357814, |
| "learning_rate": 4.265405590280822e-06, |
| "loss": 0.1619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15789197385311127, |
| "step": 5395, |
| "valid_targets_mean": 3041.6, |
| "valid_targets_min": 1206 |
| }, |
| { |
| "epoch": 5.6722689075630255, |
| "grad_norm": 0.8103212447323822, |
| "learning_rate": 4.233121806296072e-06, |
| "loss": 0.1651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17392036318778992, |
| "step": 5400, |
| "valid_targets_mean": 2288.4, |
| "valid_targets_min": 533 |
| }, |
| { |
| "epoch": 5.677521008403361, |
| "grad_norm": 0.7595385849740667, |
| "learning_rate": 4.200946194874514e-06, |
| "loss": 0.1584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15691381692886353, |
| "step": 5405, |
| "valid_targets_mean": 2395.4, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 5.682773109243698, |
| "grad_norm": 0.7278254832783921, |
| "learning_rate": 4.168878976764872e-06, |
| "loss": 0.164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1525121033191681, |
| "step": 5410, |
| "valid_targets_mean": 2631.4, |
| "valid_targets_min": 1157 |
| }, |
| { |
| "epoch": 5.688025210084033, |
| "grad_norm": 0.8021682749292429, |
| "learning_rate": 4.136920371972228e-06, |
| "loss": 0.1625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14895716309547424, |
| "step": 5415, |
| "valid_targets_mean": 1936.1, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 5.69327731092437, |
| "grad_norm": 0.6953948453787546, |
| "learning_rate": 4.105070599756482e-06, |
| "loss": 0.1585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15940669178962708, |
| "step": 5420, |
| "valid_targets_mean": 2777.6, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 5.698529411764706, |
| "grad_norm": 0.770187756365488, |
| "learning_rate": 4.073329878630856e-06, |
| "loss": 0.1667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16655011475086212, |
| "step": 5425, |
| "valid_targets_mean": 2557.6, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 5.703781512605042, |
| "grad_norm": 0.7698518711299432, |
| "learning_rate": 4.041698426360425e-06, |
| "loss": 0.1695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1650160849094391, |
| "step": 5430, |
| "valid_targets_mean": 2342.6, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 5.709033613445378, |
| "grad_norm": 0.7840326454397952, |
| "learning_rate": 4.010176459960569e-06, |
| "loss": 0.1603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.161130890250206, |
| "step": 5435, |
| "valid_targets_mean": 2237.3, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 5.714285714285714, |
| "grad_norm": 0.6973943107045614, |
| "learning_rate": 3.978764195695528e-06, |
| "loss": 0.1572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14485879242420197, |
| "step": 5440, |
| "valid_targets_mean": 2737.0, |
| "valid_targets_min": 977 |
| }, |
| { |
| "epoch": 5.71953781512605, |
| "grad_norm": 0.8240293274129915, |
| "learning_rate": 3.947461849076912e-06, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19433113932609558, |
| "step": 5445, |
| "valid_targets_mean": 2314.3, |
| "valid_targets_min": 977 |
| }, |
| { |
| "epoch": 5.724789915966387, |
| "grad_norm": 0.8114689626823407, |
| "learning_rate": 3.916269634862193e-06, |
| "loss": 0.1618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15822897851467133, |
| "step": 5450, |
| "valid_targets_mean": 2607.1, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 5.730042016806722, |
| "grad_norm": 0.8364269359269342, |
| "learning_rate": 3.885187767053269e-06, |
| "loss": 0.1544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1558850109577179, |
| "step": 5455, |
| "valid_targets_mean": 1694.3, |
| "valid_targets_min": 838 |
| }, |
| { |
| "epoch": 5.735294117647059, |
| "grad_norm": 0.8692400632474553, |
| "learning_rate": 3.854216458894973e-06, |
| "loss": 0.1636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16702617704868317, |
| "step": 5460, |
| "valid_targets_mean": 2202.1, |
| "valid_targets_min": 777 |
| }, |
| { |
| "epoch": 5.740546218487395, |
| "grad_norm": 0.7101368299314894, |
| "learning_rate": 3.823355922873606e-06, |
| "loss": 0.1624, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14841680228710175, |
| "step": 5465, |
| "valid_targets_mean": 2778.5, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 5.745798319327731, |
| "grad_norm": 0.7291139806638217, |
| "learning_rate": 3.792606370715508e-06, |
| "loss": 0.1557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1669558882713318, |
| "step": 5470, |
| "valid_targets_mean": 2786.6, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 5.751050420168067, |
| "grad_norm": 0.8199168939791637, |
| "learning_rate": 3.761968013385584e-06, |
| "loss": 0.1648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15248140692710876, |
| "step": 5475, |
| "valid_targets_mean": 1965.8, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 5.756302521008403, |
| "grad_norm": 0.7220120926134376, |
| "learning_rate": 3.731441061085843e-06, |
| "loss": 0.1679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15842077136039734, |
| "step": 5480, |
| "valid_targets_mean": 2855.1, |
| "valid_targets_min": 1118 |
| }, |
| { |
| "epoch": 5.76155462184874, |
| "grad_norm": 0.7691870517732631, |
| "learning_rate": 3.701025723253988e-06, |
| "loss": 0.1504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14176911115646362, |
| "step": 5485, |
| "valid_targets_mean": 2196.8, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 5.766806722689076, |
| "grad_norm": 0.6895030971240736, |
| "learning_rate": 3.67072220856197e-06, |
| "loss": 0.1692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15497374534606934, |
| "step": 5490, |
| "valid_targets_mean": 2655.5, |
| "valid_targets_min": 1184 |
| }, |
| { |
| "epoch": 5.772058823529412, |
| "grad_norm": 0.7338262928726779, |
| "learning_rate": 3.640530724914517e-06, |
| "loss": 0.1609, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16165027022361755, |
| "step": 5495, |
| "valid_targets_mean": 2627.9, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 5.777310924369748, |
| "grad_norm": 0.7406660843906033, |
| "learning_rate": 3.61045147944777e-06, |
| "loss": 0.1612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14221808314323425, |
| "step": 5500, |
| "valid_targets_mean": 2517.7, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 5.782563025210084, |
| "grad_norm": 0.7608572974428726, |
| "learning_rate": 3.5804846785278315e-06, |
| "loss": 0.159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15930047631263733, |
| "step": 5505, |
| "valid_targets_mean": 2888.9, |
| "valid_targets_min": 1200 |
| }, |
| { |
| "epoch": 5.78781512605042, |
| "grad_norm": 0.7935824693797842, |
| "learning_rate": 3.5506305277493326e-06, |
| "loss": 0.1586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1513899266719818, |
| "step": 5510, |
| "valid_targets_mean": 2279.6, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 5.793067226890757, |
| "grad_norm": 0.790428932578931, |
| "learning_rate": 3.520889231934057e-06, |
| "loss": 0.1624, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1564992070198059, |
| "step": 5515, |
| "valid_targets_mean": 2152.1, |
| "valid_targets_min": 1278 |
| }, |
| { |
| "epoch": 5.798319327731092, |
| "grad_norm": 0.8386478323895583, |
| "learning_rate": 3.4912609951295084e-06, |
| "loss": 0.1692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1771148443222046, |
| "step": 5520, |
| "valid_targets_mean": 2142.2, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 5.803571428571429, |
| "grad_norm": 0.8169074903755393, |
| "learning_rate": 3.461746020607526e-06, |
| "loss": 0.1659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16074536740779877, |
| "step": 5525, |
| "valid_targets_mean": 2207.6, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 5.8088235294117645, |
| "grad_norm": 0.7542209212555967, |
| "learning_rate": 3.432344510862895e-06, |
| "loss": 0.1612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17460983991622925, |
| "step": 5530, |
| "valid_targets_mean": 2285.8, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 5.814075630252101, |
| "grad_norm": 0.9980332994549753, |
| "learning_rate": 3.403056667611917e-06, |
| "loss": 0.1583, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17128345370292664, |
| "step": 5535, |
| "valid_targets_mean": 2691.8, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 5.819327731092437, |
| "grad_norm": 0.7583521616551634, |
| "learning_rate": 3.373882691791088e-06, |
| "loss": 0.1609, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15085886418819427, |
| "step": 5540, |
| "valid_targets_mean": 2659.0, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 5.824579831932773, |
| "grad_norm": 0.8477434832925683, |
| "learning_rate": 3.344822783555679e-06, |
| "loss": 0.1623, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16110014915466309, |
| "step": 5545, |
| "valid_targets_mean": 1985.5, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 5.829831932773109, |
| "grad_norm": 0.7643511912140655, |
| "learning_rate": 3.315877142278363e-06, |
| "loss": 0.1615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16038095951080322, |
| "step": 5550, |
| "valid_targets_mean": 2380.6, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 5.8350840336134455, |
| "grad_norm": 0.7518728544106923, |
| "learning_rate": 3.287045966547866e-06, |
| "loss": 0.1632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17358054220676422, |
| "step": 5555, |
| "valid_targets_mean": 2760.2, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 5.840336134453781, |
| "grad_norm": 0.7124048514016621, |
| "learning_rate": 3.258329454167599e-06, |
| "loss": 0.159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1632152795791626, |
| "step": 5560, |
| "valid_targets_mean": 2886.0, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 5.845588235294118, |
| "grad_norm": 0.8638758876946544, |
| "learning_rate": 3.2297278021542833e-06, |
| "loss": 0.1732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18239599466323853, |
| "step": 5565, |
| "valid_targets_mean": 2045.9, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 5.850840336134453, |
| "grad_norm": 0.8074069942626705, |
| "learning_rate": 3.201241206736614e-06, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19121696054935455, |
| "step": 5570, |
| "valid_targets_mean": 2512.3, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 5.85609243697479, |
| "grad_norm": 0.8094730562236274, |
| "learning_rate": 3.1728698633539266e-06, |
| "loss": 0.1632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1697961837053299, |
| "step": 5575, |
| "valid_targets_mean": 2204.6, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 5.8613445378151265, |
| "grad_norm": 0.7593441846784588, |
| "learning_rate": 3.1446139666548212e-06, |
| "loss": 0.1631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1595013290643692, |
| "step": 5580, |
| "valid_targets_mean": 2633.0, |
| "valid_targets_min": 707 |
| }, |
| { |
| "epoch": 5.866596638655462, |
| "grad_norm": 0.7957651638135713, |
| "learning_rate": 3.1164737104958707e-06, |
| "loss": 0.1599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15644320845603943, |
| "step": 5585, |
| "valid_targets_mean": 1890.6, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 5.871848739495798, |
| "grad_norm": 0.8090053281592035, |
| "learning_rate": 3.0884492879402452e-06, |
| "loss": 0.1633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17713585495948792, |
| "step": 5590, |
| "valid_targets_mean": 2193.5, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 5.8771008403361344, |
| "grad_norm": 0.7500689718315519, |
| "learning_rate": 3.0605408912564184e-06, |
| "loss": 0.1647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16628164052963257, |
| "step": 5595, |
| "valid_targets_mean": 2580.8, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 5.882352941176471, |
| "grad_norm": 0.8192677926893119, |
| "learning_rate": 3.032748711916851e-06, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16836728155612946, |
| "step": 5600, |
| "valid_targets_mean": 2461.7, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 5.887605042016807, |
| "grad_norm": 0.7874830104284019, |
| "learning_rate": 3.0050729405966495e-06, |
| "loss": 0.1632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16090510785579681, |
| "step": 5605, |
| "valid_targets_mean": 2267.6, |
| "valid_targets_min": 244 |
| }, |
| { |
| "epoch": 5.892857142857143, |
| "grad_norm": 0.7833656235582289, |
| "learning_rate": 2.9775137671722754e-06, |
| "loss": 0.1586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1637769341468811, |
| "step": 5610, |
| "valid_targets_mean": 2443.2, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 5.898109243697479, |
| "grad_norm": 0.7228128266155345, |
| "learning_rate": 2.9500713807202565e-06, |
| "loss": 0.154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15642684698104858, |
| "step": 5615, |
| "valid_targets_mean": 2638.7, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 5.9033613445378155, |
| "grad_norm": 0.6752375605078036, |
| "learning_rate": 2.9227459695158543e-06, |
| "loss": 0.1565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15065337717533112, |
| "step": 5620, |
| "valid_targets_mean": 3194.4, |
| "valid_targets_min": 1263 |
| }, |
| { |
| "epoch": 5.908613445378151, |
| "grad_norm": 0.8638709102103872, |
| "learning_rate": 2.895537721031809e-06, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16943012177944183, |
| "step": 5625, |
| "valid_targets_mean": 1833.1, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 5.913865546218488, |
| "grad_norm": 0.7646968532660349, |
| "learning_rate": 2.8684468219370364e-06, |
| "loss": 0.1532, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14894887804985046, |
| "step": 5630, |
| "valid_targets_mean": 2673.2, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 5.919117647058823, |
| "grad_norm": 0.7612881911075914, |
| "learning_rate": 2.841473458095334e-06, |
| "loss": 0.1668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14882472157478333, |
| "step": 5635, |
| "valid_targets_mean": 2316.6, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 5.92436974789916, |
| "grad_norm": 0.7425817529470462, |
| "learning_rate": 2.8146178145641355e-06, |
| "loss": 0.1608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1679328829050064, |
| "step": 5640, |
| "valid_targets_mean": 2502.5, |
| "valid_targets_min": 687 |
| }, |
| { |
| "epoch": 5.929621848739496, |
| "grad_norm": 0.9027720359549637, |
| "learning_rate": 2.787880075593217e-06, |
| "loss": 0.1669, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15756511688232422, |
| "step": 5645, |
| "valid_targets_mean": 2311.6, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 5.934873949579832, |
| "grad_norm": 0.6980735937613616, |
| "learning_rate": 2.7612604246234355e-06, |
| "loss": 0.1608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16025885939598083, |
| "step": 5650, |
| "valid_targets_mean": 2912.9, |
| "valid_targets_min": 854 |
| }, |
| { |
| "epoch": 5.940126050420168, |
| "grad_norm": 0.7529592237919616, |
| "learning_rate": 2.7347590442854867e-06, |
| "loss": 0.16, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17594562470912933, |
| "step": 5655, |
| "valid_targets_mean": 2683.8, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 5.945378151260504, |
| "grad_norm": 0.7696301031774723, |
| "learning_rate": 2.7083761163986433e-06, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17107313871383667, |
| "step": 5660, |
| "valid_targets_mean": 2896.2, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 5.95063025210084, |
| "grad_norm": 0.7798340627342268, |
| "learning_rate": 2.682111821969493e-06, |
| "loss": 0.1654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16536115109920502, |
| "step": 5665, |
| "valid_targets_mean": 2587.5, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 5.955882352941177, |
| "grad_norm": 0.7149524883372318, |
| "learning_rate": 2.6559663411907233e-06, |
| "loss": 0.1604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1709938943386078, |
| "step": 5670, |
| "valid_targets_mean": 2945.9, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 5.961134453781512, |
| "grad_norm": 0.7165019494853891, |
| "learning_rate": 2.629939853439856e-06, |
| "loss": 0.1664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16053658723831177, |
| "step": 5675, |
| "valid_targets_mean": 2915.6, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 5.966386554621849, |
| "grad_norm": 0.9589101754966618, |
| "learning_rate": 2.604032537278052e-06, |
| "loss": 0.157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15422767400741577, |
| "step": 5680, |
| "valid_targets_mean": 1772.9, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 5.9716386554621845, |
| "grad_norm": 0.7874586260627973, |
| "learning_rate": 2.5782445704488447e-06, |
| "loss": 0.1618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14686915278434753, |
| "step": 5685, |
| "valid_targets_mean": 2175.2, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 5.976890756302521, |
| "grad_norm": 0.8291299717722125, |
| "learning_rate": 2.5525761298769515e-06, |
| "loss": 0.1672, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17729215323925018, |
| "step": 5690, |
| "valid_targets_mean": 2213.9, |
| "valid_targets_min": 1434 |
| }, |
| { |
| "epoch": 5.982142857142857, |
| "grad_norm": 0.8550297198565612, |
| "learning_rate": 2.527027391667054e-06, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18570925295352936, |
| "step": 5695, |
| "valid_targets_mean": 2631.9, |
| "valid_targets_min": 840 |
| }, |
| { |
| "epoch": 5.987394957983193, |
| "grad_norm": 0.8225215202521778, |
| "learning_rate": 2.501598531102587e-06, |
| "loss": 0.1619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1654691994190216, |
| "step": 5700, |
| "valid_targets_mean": 2116.9, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 5.992647058823529, |
| "grad_norm": 0.7818605889350404, |
| "learning_rate": 2.47628972264452e-06, |
| "loss": 0.1597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15820591151714325, |
| "step": 5705, |
| "valid_targets_mean": 2376.9, |
| "valid_targets_min": 775 |
| }, |
| { |
| "epoch": 5.9978991596638656, |
| "grad_norm": 0.7205251991716778, |
| "learning_rate": 2.4511011399301944e-06, |
| "loss": 0.1681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16490915417671204, |
| "step": 5710, |
| "valid_targets_mean": 3045.2, |
| "valid_targets_min": 921 |
| }, |
| { |
| "epoch": 6.003151260504202, |
| "grad_norm": 0.79777985742783, |
| "learning_rate": 2.4260329557721107e-06, |
| "loss": 0.1556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16908371448516846, |
| "step": 5715, |
| "valid_targets_mean": 2234.9, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 6.008403361344538, |
| "grad_norm": 0.7056977699167971, |
| "learning_rate": 2.4010853421567237e-06, |
| "loss": 0.1435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1342272162437439, |
| "step": 5720, |
| "valid_targets_mean": 2620.8, |
| "valid_targets_min": 1276 |
| }, |
| { |
| "epoch": 6.013655462184874, |
| "grad_norm": 0.7206882042436742, |
| "learning_rate": 2.376258470243309e-06, |
| "loss": 0.1564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1475621461868286, |
| "step": 5725, |
| "valid_targets_mean": 2910.7, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 6.01890756302521, |
| "grad_norm": 0.6958104794523656, |
| "learning_rate": 2.351552510362758e-06, |
| "loss": 0.1515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14622151851654053, |
| "step": 5730, |
| "valid_targets_mean": 3744.4, |
| "valid_targets_min": 1153 |
| }, |
| { |
| "epoch": 6.024159663865547, |
| "grad_norm": 0.74834161850093, |
| "learning_rate": 2.326967632016406e-06, |
| "loss": 0.1535, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1483282744884491, |
| "step": 5735, |
| "valid_targets_mean": 2573.9, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 6.029411764705882, |
| "grad_norm": 0.7566577246672258, |
| "learning_rate": 2.302504003874888e-06, |
| "loss": 0.1518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14986348152160645, |
| "step": 5740, |
| "valid_targets_mean": 2467.8, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 6.034663865546219, |
| "grad_norm": 0.7394059807325174, |
| "learning_rate": 2.2781617937769675e-06, |
| "loss": 0.1563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15996532142162323, |
| "step": 5745, |
| "valid_targets_mean": 3097.9, |
| "valid_targets_min": 914 |
| }, |
| { |
| "epoch": 6.0399159663865545, |
| "grad_norm": 0.7291797979840863, |
| "learning_rate": 2.2539411687283907e-06, |
| "loss": 0.1588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15175995230674744, |
| "step": 5750, |
| "valid_targets_mean": 2689.8, |
| "valid_targets_min": 1214 |
| }, |
| { |
| "epoch": 6.045168067226891, |
| "grad_norm": 0.8021207951201383, |
| "learning_rate": 2.229842294900744e-06, |
| "loss": 0.1484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15454252064228058, |
| "step": 5755, |
| "valid_targets_mean": 2140.5, |
| "valid_targets_min": 829 |
| }, |
| { |
| "epoch": 6.050420168067227, |
| "grad_norm": 0.7912228519081135, |
| "learning_rate": 2.205865337630302e-06, |
| "loss": 0.1542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15131813287734985, |
| "step": 5760, |
| "valid_targets_mean": 2908.2, |
| "valid_targets_min": 1220 |
| }, |
| { |
| "epoch": 6.055672268907563, |
| "grad_norm": 0.7907789459812723, |
| "learning_rate": 2.182010461416899e-06, |
| "loss": 0.1562, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1566312164068222, |
| "step": 5765, |
| "valid_targets_mean": 2503.7, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 6.060924369747899, |
| "grad_norm": 0.8839642676042035, |
| "learning_rate": 2.158277829922817e-06, |
| "loss": 0.15, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1570267528295517, |
| "step": 5770, |
| "valid_targets_mean": 1742.3, |
| "valid_targets_min": 544 |
| }, |
| { |
| "epoch": 6.0661764705882355, |
| "grad_norm": 0.8625467723504546, |
| "learning_rate": 2.1346676059716253e-06, |
| "loss": 0.1558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14902624487876892, |
| "step": 5775, |
| "valid_targets_mean": 2078.1, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 6.071428571428571, |
| "grad_norm": 0.7087088554579924, |
| "learning_rate": 2.1111799515471066e-06, |
| "loss": 0.144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13471050560474396, |
| "step": 5780, |
| "valid_targets_mean": 2473.5, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 6.076680672268908, |
| "grad_norm": 0.7327436066837598, |
| "learning_rate": 2.0878150277921195e-06, |
| "loss": 0.1461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13805945217609406, |
| "step": 5785, |
| "valid_targets_mean": 2741.4, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 6.081932773109243, |
| "grad_norm": 0.8315227818730387, |
| "learning_rate": 2.064572995007492e-06, |
| "loss": 0.1534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14630141854286194, |
| "step": 5790, |
| "valid_targets_mean": 2002.4, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 6.08718487394958, |
| "grad_norm": 0.8401948839242035, |
| "learning_rate": 2.0414540126509274e-06, |
| "loss": 0.1529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16226598620414734, |
| "step": 5795, |
| "valid_targets_mean": 2131.1, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 6.092436974789916, |
| "grad_norm": 0.8776927085638933, |
| "learning_rate": 2.0184582393359253e-06, |
| "loss": 0.1492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15649349987506866, |
| "step": 5800, |
| "valid_targets_mean": 1861.4, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 6.097689075630252, |
| "grad_norm": 0.8211711286578806, |
| "learning_rate": 1.99558583283066e-06, |
| "loss": 0.1557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14332887530326843, |
| "step": 5805, |
| "valid_targets_mean": 2022.8, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 6.102941176470588, |
| "grad_norm": 0.732033944801811, |
| "learning_rate": 1.9728369500569333e-06, |
| "loss": 0.1415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13911320269107819, |
| "step": 5810, |
| "valid_targets_mean": 2577.7, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 6.108193277310924, |
| "grad_norm": 0.8099862293022083, |
| "learning_rate": 1.950211747089077e-06, |
| "loss": 0.1567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14890515804290771, |
| "step": 5815, |
| "valid_targets_mean": 2239.7, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 6.11344537815126, |
| "grad_norm": 0.8280954650156288, |
| "learning_rate": 1.927710379152881e-06, |
| "loss": 0.1514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15409252047538757, |
| "step": 5820, |
| "valid_targets_mean": 2037.0, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 6.118697478991597, |
| "grad_norm": 0.7720826623857413, |
| "learning_rate": 1.9053330006245452e-06, |
| "loss": 0.1487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1435692012310028, |
| "step": 5825, |
| "valid_targets_mean": 2505.6, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 6.123949579831933, |
| "grad_norm": 0.8602830964405195, |
| "learning_rate": 1.8830797650296006e-06, |
| "loss": 0.1536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15629276633262634, |
| "step": 5830, |
| "valid_targets_mean": 1843.5, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 6.129201680672269, |
| "grad_norm": 0.7886878487521178, |
| "learning_rate": 1.8609508250418628e-06, |
| "loss": 0.163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17373371124267578, |
| "step": 5835, |
| "valid_targets_mean": 2652.3, |
| "valid_targets_min": 1395 |
| }, |
| { |
| "epoch": 6.1344537815126055, |
| "grad_norm": 0.8219543982430842, |
| "learning_rate": 1.8389463324823986e-06, |
| "loss": 0.1471, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14603424072265625, |
| "step": 5840, |
| "valid_targets_mean": 2208.8, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 6.139705882352941, |
| "grad_norm": 0.8240205796466581, |
| "learning_rate": 1.81706643831846e-06, |
| "loss": 0.151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1447804570198059, |
| "step": 5845, |
| "valid_targets_mean": 2197.1, |
| "valid_targets_min": 787 |
| }, |
| { |
| "epoch": 6.144957983193278, |
| "grad_norm": 0.7863349767944662, |
| "learning_rate": 1.7953112926624715e-06, |
| "loss": 0.1574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14369264245033264, |
| "step": 5850, |
| "valid_targets_mean": 2488.8, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 6.150210084033613, |
| "grad_norm": 0.7481918069687116, |
| "learning_rate": 1.7736810447709852e-06, |
| "loss": 0.1404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14041663706302643, |
| "step": 5855, |
| "valid_targets_mean": 2419.5, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 6.15546218487395, |
| "grad_norm": 0.7548879647168044, |
| "learning_rate": 1.7521758430436553e-06, |
| "loss": 0.1568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15782803297042847, |
| "step": 5860, |
| "valid_targets_mean": 2704.7, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 6.160714285714286, |
| "grad_norm": 0.8818736318364171, |
| "learning_rate": 1.7307958350222366e-06, |
| "loss": 0.1615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1596248298883438, |
| "step": 5865, |
| "valid_targets_mean": 2219.8, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 6.165966386554622, |
| "grad_norm": 0.8306669309571554, |
| "learning_rate": 1.7095411673895545e-06, |
| "loss": 0.1615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16560135781764984, |
| "step": 5870, |
| "valid_targets_mean": 2339.6, |
| "valid_targets_min": 672 |
| }, |
| { |
| "epoch": 6.171218487394958, |
| "grad_norm": 0.7839020315929305, |
| "learning_rate": 1.6884119859685034e-06, |
| "loss": 0.1571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16316699981689453, |
| "step": 5875, |
| "valid_targets_mean": 2607.8, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 6.176470588235294, |
| "grad_norm": 0.7562882938551625, |
| "learning_rate": 1.6674084357210562e-06, |
| "loss": 0.1481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1440119594335556, |
| "step": 5880, |
| "valid_targets_mean": 2218.6, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 6.18172268907563, |
| "grad_norm": 0.7626842826181003, |
| "learning_rate": 1.6465306607472608e-06, |
| "loss": 0.1489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13738971948623657, |
| "step": 5885, |
| "valid_targets_mean": 2323.1, |
| "valid_targets_min": 917 |
| }, |
| { |
| "epoch": 6.186974789915967, |
| "grad_norm": 0.7942359627663949, |
| "learning_rate": 1.625778804284246e-06, |
| "loss": 0.146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14948052167892456, |
| "step": 5890, |
| "valid_targets_mean": 2511.6, |
| "valid_targets_min": 743 |
| }, |
| { |
| "epoch": 6.192226890756302, |
| "grad_norm": 0.8431028429315225, |
| "learning_rate": 1.6051530087052558e-06, |
| "loss": 0.1459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15867841243743896, |
| "step": 5895, |
| "valid_targets_mean": 2291.1, |
| "valid_targets_min": 940 |
| }, |
| { |
| "epoch": 6.197478991596639, |
| "grad_norm": 0.8666438002772852, |
| "learning_rate": 1.5846534155186511e-06, |
| "loss": 0.148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14912620186805725, |
| "step": 5900, |
| "valid_targets_mean": 1881.3, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 6.2027310924369745, |
| "grad_norm": 0.8110997063724646, |
| "learning_rate": 1.564280165366956e-06, |
| "loss": 0.1573, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1503579318523407, |
| "step": 5905, |
| "valid_targets_mean": 2042.6, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 6.207983193277311, |
| "grad_norm": 0.7289206797878542, |
| "learning_rate": 1.544033398025886e-06, |
| "loss": 0.153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15290409326553345, |
| "step": 5910, |
| "valid_targets_mean": 2841.8, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 6.213235294117647, |
| "grad_norm": 0.8826762189160628, |
| "learning_rate": 1.5239132524033951e-06, |
| "loss": 0.1446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15168313682079315, |
| "step": 5915, |
| "valid_targets_mean": 2273.7, |
| "valid_targets_min": 867 |
| }, |
| { |
| "epoch": 6.218487394957983, |
| "grad_norm": 0.6729261276809203, |
| "learning_rate": 1.50391986653871e-06, |
| "loss": 0.1476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1368652582168579, |
| "step": 5920, |
| "valid_targets_mean": 3169.6, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 6.223739495798319, |
| "grad_norm": 0.7965190893498632, |
| "learning_rate": 1.4840533776013954e-06, |
| "loss": 0.1552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1640886664390564, |
| "step": 5925, |
| "valid_targets_mean": 2498.8, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 6.2289915966386555, |
| "grad_norm": 0.7757965453046244, |
| "learning_rate": 1.4643139218904035e-06, |
| "loss": 0.152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14865760505199432, |
| "step": 5930, |
| "valid_targets_mean": 2731.4, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 6.234243697478991, |
| "grad_norm": 0.7962903371122022, |
| "learning_rate": 1.4447016348331477e-06, |
| "loss": 0.1482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13591375946998596, |
| "step": 5935, |
| "valid_targets_mean": 2047.8, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 6.239495798319328, |
| "grad_norm": 0.7557635968086313, |
| "learning_rate": 1.4252166509845777e-06, |
| "loss": 0.1585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15759332478046417, |
| "step": 5940, |
| "valid_targets_mean": 2775.9, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 6.244747899159663, |
| "grad_norm": 0.7204075261247243, |
| "learning_rate": 1.4058591040262259e-06, |
| "loss": 0.1481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14412742853164673, |
| "step": 5945, |
| "valid_targets_mean": 2885.9, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 6.25, |
| "grad_norm": 0.7821960625396808, |
| "learning_rate": 1.3866291267653309e-06, |
| "loss": 0.1514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15519963204860687, |
| "step": 5950, |
| "valid_targets_mean": 2386.9, |
| "valid_targets_min": 917 |
| }, |
| { |
| "epoch": 6.255252100840336, |
| "grad_norm": 0.7211652670433405, |
| "learning_rate": 1.3675268511339067e-06, |
| "loss": 0.1501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14521880447864532, |
| "step": 5955, |
| "valid_targets_mean": 2996.6, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 6.260504201680672, |
| "grad_norm": 0.8118712246185013, |
| "learning_rate": 1.3485524081878288e-06, |
| "loss": 0.1498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16166505217552185, |
| "step": 5960, |
| "valid_targets_mean": 2691.8, |
| "valid_targets_min": 937 |
| }, |
| { |
| "epoch": 6.265756302521009, |
| "grad_norm": 0.859100591202131, |
| "learning_rate": 1.3297059281059533e-06, |
| "loss": 0.1561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1694069802761078, |
| "step": 5965, |
| "valid_targets_mean": 2484.4, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 6.2710084033613445, |
| "grad_norm": 0.6880675870848753, |
| "learning_rate": 1.3109875401892146e-06, |
| "loss": 0.1491, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13731975853443146, |
| "step": 5970, |
| "valid_targets_mean": 3048.2, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 6.276260504201681, |
| "grad_norm": 0.78207546197356, |
| "learning_rate": 1.2923973728597373e-06, |
| "loss": 0.1425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13927319645881653, |
| "step": 5975, |
| "valid_targets_mean": 2147.8, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 6.281512605042017, |
| "grad_norm": 0.9014126476888846, |
| "learning_rate": 1.2739355536599508e-06, |
| "loss": 0.1429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1446988582611084, |
| "step": 5980, |
| "valid_targets_mean": 1929.1, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 6.286764705882353, |
| "grad_norm": 0.7420292923016639, |
| "learning_rate": 1.2556022092517362e-06, |
| "loss": 0.1521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14270836114883423, |
| "step": 5985, |
| "valid_targets_mean": 2397.7, |
| "valid_targets_min": 966 |
| }, |
| { |
| "epoch": 6.292016806722689, |
| "grad_norm": 0.7955077467970862, |
| "learning_rate": 1.237397465415524e-06, |
| "loss": 0.1453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1445448398590088, |
| "step": 5990, |
| "valid_targets_mean": 2025.7, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 6.2972689075630255, |
| "grad_norm": 0.8287126470993438, |
| "learning_rate": 1.2193214470494664e-06, |
| "loss": 0.1517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1324065625667572, |
| "step": 5995, |
| "valid_targets_mean": 1985.8, |
| "valid_targets_min": 867 |
| }, |
| { |
| "epoch": 6.302521008403361, |
| "grad_norm": 0.7561550704661556, |
| "learning_rate": 1.201374278168541e-06, |
| "loss": 0.1452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15818336606025696, |
| "step": 6000, |
| "valid_targets_mean": 2369.2, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 6.307773109243698, |
| "grad_norm": 0.7629710579022473, |
| "learning_rate": 1.1835560819037429e-06, |
| "loss": 0.1427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12634852528572083, |
| "step": 6005, |
| "valid_targets_mean": 2487.6, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 6.313025210084033, |
| "grad_norm": 0.8264383119430665, |
| "learning_rate": 1.1658669805012112e-06, |
| "loss": 0.144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14036674797534943, |
| "step": 6010, |
| "valid_targets_mean": 1953.5, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 6.31827731092437, |
| "grad_norm": 0.8768123841384081, |
| "learning_rate": 1.1483070953213904e-06, |
| "loss": 0.148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1594979465007782, |
| "step": 6015, |
| "valid_targets_mean": 2033.9, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 6.323529411764706, |
| "grad_norm": 0.8008028472783635, |
| "learning_rate": 1.130876546838211e-06, |
| "loss": 0.1592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16434642672538757, |
| "step": 6020, |
| "valid_targets_mean": 2647.7, |
| "valid_targets_min": 1279 |
| }, |
| { |
| "epoch": 6.328781512605042, |
| "grad_norm": 0.778716540961378, |
| "learning_rate": 1.1135754546382627e-06, |
| "loss": 0.1439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15541379153728485, |
| "step": 6025, |
| "valid_targets_mean": 2563.2, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 6.334033613445378, |
| "grad_norm": 0.7658767727670047, |
| "learning_rate": 1.0964039374199564e-06, |
| "loss": 0.1476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14019645750522614, |
| "step": 6030, |
| "valid_targets_mean": 2198.1, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 6.339285714285714, |
| "grad_norm": 0.7848881321896162, |
| "learning_rate": 1.07936211299273e-06, |
| "loss": 0.1504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15517699718475342, |
| "step": 6035, |
| "valid_targets_mean": 2547.2, |
| "valid_targets_min": 825 |
| }, |
| { |
| "epoch": 6.34453781512605, |
| "grad_norm": 1.1562955954823186, |
| "learning_rate": 1.0624500982762376e-06, |
| "loss": 0.1611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1641463041305542, |
| "step": 6040, |
| "valid_targets_mean": 2856.1, |
| "valid_targets_min": 933 |
| }, |
| { |
| "epoch": 6.349789915966387, |
| "grad_norm": 1.243869663850212, |
| "learning_rate": 1.045668009299523e-06, |
| "loss": 0.1615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1688794195652008, |
| "step": 6045, |
| "valid_targets_mean": 1660.8, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 6.355042016806722, |
| "grad_norm": 0.9029029473166272, |
| "learning_rate": 1.029015961200266e-06, |
| "loss": 0.1539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16218698024749756, |
| "step": 6050, |
| "valid_targets_mean": 1781.9, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 6.360294117647059, |
| "grad_norm": 0.839913681660097, |
| "learning_rate": 1.012494068223946e-06, |
| "loss": 0.1545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14709152281284332, |
| "step": 6055, |
| "valid_targets_mean": 1895.1, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 6.3655462184873945, |
| "grad_norm": 0.7974623565020086, |
| "learning_rate": 9.961024437230948e-07, |
| "loss": 0.1493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13561251759529114, |
| "step": 6060, |
| "valid_targets_mean": 2064.5, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 6.370798319327731, |
| "grad_norm": 0.709502267033278, |
| "learning_rate": 9.798412001565038e-07, |
| "loss": 0.1591, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16175958514213562, |
| "step": 6065, |
| "valid_targets_mean": 3175.9, |
| "valid_targets_min": 780 |
| }, |
| { |
| "epoch": 6.376050420168067, |
| "grad_norm": 0.9037744133249849, |
| "learning_rate": 9.63710449088453e-07, |
| "loss": 0.1499, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15407252311706543, |
| "step": 6070, |
| "valid_targets_mean": 1908.1, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 6.381302521008403, |
| "grad_norm": 0.797641245566909, |
| "learning_rate": 9.477103011879408e-07, |
| "loss": 0.1475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15560175478458405, |
| "step": 6075, |
| "valid_targets_mean": 2465.2, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 6.38655462184874, |
| "grad_norm": 0.7237125765315087, |
| "learning_rate": 9.318408662279399e-07, |
| "loss": 0.1527, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14476794004440308, |
| "step": 6080, |
| "valid_targets_mean": 2732.1, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 6.391806722689076, |
| "grad_norm": 0.7575017424625796, |
| "learning_rate": 9.161022530846253e-07, |
| "loss": 0.1525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13442182540893555, |
| "step": 6085, |
| "valid_targets_mean": 2915.2, |
| "valid_targets_min": 1127 |
| }, |
| { |
| "epoch": 6.397058823529412, |
| "grad_norm": 0.8267114749782785, |
| "learning_rate": 9.004945697366452e-07, |
| "loss": 0.1447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14276978373527527, |
| "step": 6090, |
| "valid_targets_mean": 2019.4, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 6.402310924369748, |
| "grad_norm": 0.7237677872215658, |
| "learning_rate": 8.850179232643641e-07, |
| "loss": 0.1501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14779332280158997, |
| "step": 6095, |
| "valid_targets_mean": 2826.4, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 6.407563025210084, |
| "grad_norm": 0.8400966461486415, |
| "learning_rate": 8.696724198491369e-07, |
| "loss": 0.1537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15353678166866302, |
| "step": 6100, |
| "valid_targets_mean": 2215.9, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 6.41281512605042, |
| "grad_norm": 0.7477003864167849, |
| "learning_rate": 8.544581647725825e-07, |
| "loss": 0.1461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1523742377758026, |
| "step": 6105, |
| "valid_targets_mean": 2844.5, |
| "valid_targets_min": 921 |
| }, |
| { |
| "epoch": 6.418067226890757, |
| "grad_norm": 0.8178307661739669, |
| "learning_rate": 8.393752624158603e-07, |
| "loss": 0.1498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14179328083992004, |
| "step": 6110, |
| "valid_targets_mean": 1932.0, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 6.423319327731092, |
| "grad_norm": 0.6634779755671151, |
| "learning_rate": 8.244238162589435e-07, |
| "loss": 0.148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14001640677452087, |
| "step": 6115, |
| "valid_targets_mean": 3367.4, |
| "valid_targets_min": 1289 |
| }, |
| { |
| "epoch": 6.428571428571429, |
| "grad_norm": 0.7620021165612041, |
| "learning_rate": 8.096039288799251e-07, |
| "loss": 0.1563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15005478262901306, |
| "step": 6120, |
| "valid_targets_mean": 2588.8, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 6.4338235294117645, |
| "grad_norm": 0.7934644918251871, |
| "learning_rate": 7.949157019543064e-07, |
| "loss": 0.1559, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17349065840244293, |
| "step": 6125, |
| "valid_targets_mean": 2498.0, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 6.439075630252101, |
| "grad_norm": 0.7690205077229771, |
| "learning_rate": 7.803592362542911e-07, |
| "loss": 0.1503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16106484830379486, |
| "step": 6130, |
| "valid_targets_mean": 2574.9, |
| "valid_targets_min": 1357 |
| }, |
| { |
| "epoch": 6.444327731092437, |
| "grad_norm": 0.8681115870866193, |
| "learning_rate": 7.659346316481086e-07, |
| "loss": 0.1505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14451289176940918, |
| "step": 6135, |
| "valid_targets_mean": 1931.4, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 6.449579831932773, |
| "grad_norm": 0.7601643918944068, |
| "learning_rate": 7.516419870993296e-07, |
| "loss": 0.1493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15384207665920258, |
| "step": 6140, |
| "valid_targets_mean": 2423.4, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 6.454831932773109, |
| "grad_norm": 0.7370958836376663, |
| "learning_rate": 7.374814006661667e-07, |
| "loss": 0.152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1404162049293518, |
| "step": 6145, |
| "valid_targets_mean": 2909.4, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 6.4600840336134455, |
| "grad_norm": 0.8042467319801916, |
| "learning_rate": 7.234529695008241e-07, |
| "loss": 0.1459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15728093683719635, |
| "step": 6150, |
| "valid_targets_mean": 2223.1, |
| "valid_targets_min": 979 |
| }, |
| { |
| "epoch": 6.465336134453781, |
| "grad_norm": 0.7816915471785587, |
| "learning_rate": 7.095567898488175e-07, |
| "loss": 0.156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16815775632858276, |
| "step": 6155, |
| "valid_targets_mean": 2402.7, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 6.470588235294118, |
| "grad_norm": 0.9016085189910406, |
| "learning_rate": 6.957929570483224e-07, |
| "loss": 0.1494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16057243943214417, |
| "step": 6160, |
| "valid_targets_mean": 2306.2, |
| "valid_targets_min": 640 |
| }, |
| { |
| "epoch": 6.475840336134453, |
| "grad_norm": 0.7983769298179959, |
| "learning_rate": 6.821615655295155e-07, |
| "loss": 0.1605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16977722942829132, |
| "step": 6165, |
| "valid_targets_mean": 2523.9, |
| "valid_targets_min": 604 |
| }, |
| { |
| "epoch": 6.48109243697479, |
| "grad_norm": 0.8711158720727042, |
| "learning_rate": 6.686627088139253e-07, |
| "loss": 0.1579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17021444439888, |
| "step": 6170, |
| "valid_targets_mean": 2276.9, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 6.486344537815126, |
| "grad_norm": 0.7653732434373907, |
| "learning_rate": 6.552964795137895e-07, |
| "loss": 0.1529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16731613874435425, |
| "step": 6175, |
| "valid_targets_mean": 2977.2, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 6.491596638655462, |
| "grad_norm": 0.7898921304427059, |
| "learning_rate": 6.420629693314317e-07, |
| "loss": 0.148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14303874969482422, |
| "step": 6180, |
| "valid_targets_mean": 2086.4, |
| "valid_targets_min": 722 |
| }, |
| { |
| "epoch": 6.496848739495798, |
| "grad_norm": 0.8022544168817034, |
| "learning_rate": 6.289622690586151e-07, |
| "loss": 0.1472, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15002703666687012, |
| "step": 6185, |
| "valid_targets_mean": 2577.0, |
| "valid_targets_min": 967 |
| }, |
| { |
| "epoch": 6.5021008403361344, |
| "grad_norm": 0.7765235327781467, |
| "learning_rate": 6.159944685759289e-07, |
| "loss": 0.1598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1665143221616745, |
| "step": 6190, |
| "valid_targets_mean": 2581.1, |
| "valid_targets_min": 1206 |
| }, |
| { |
| "epoch": 6.507352941176471, |
| "grad_norm": 0.6652766905185039, |
| "learning_rate": 6.031596568521792e-07, |
| "loss": 0.1481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15390489995479584, |
| "step": 6195, |
| "valid_targets_mean": 3575.8, |
| "valid_targets_min": 936 |
| }, |
| { |
| "epoch": 6.512605042016807, |
| "grad_norm": 0.823897053974955, |
| "learning_rate": 5.904579219437567e-07, |
| "loss": 0.1504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14515843987464905, |
| "step": 6200, |
| "valid_targets_mean": 2476.0, |
| "valid_targets_min": 897 |
| }, |
| { |
| "epoch": 6.517857142857143, |
| "grad_norm": 0.8693729158649441, |
| "learning_rate": 5.778893509940497e-07, |
| "loss": 0.1456, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14359763264656067, |
| "step": 6205, |
| "valid_targets_mean": 1601.5, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 6.523109243697479, |
| "grad_norm": 0.7360524356141547, |
| "learning_rate": 5.654540302328526e-07, |
| "loss": 0.1464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1544869840145111, |
| "step": 6210, |
| "valid_targets_mean": 3031.3, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 6.5283613445378155, |
| "grad_norm": 0.8214329921549752, |
| "learning_rate": 5.531520449757465e-07, |
| "loss": 0.1569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15624156594276428, |
| "step": 6215, |
| "valid_targets_mean": 2231.3, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 6.533613445378151, |
| "grad_norm": 0.7526069627643952, |
| "learning_rate": 5.409834796235447e-07, |
| "loss": 0.1503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14001137018203735, |
| "step": 6220, |
| "valid_targets_mean": 2640.0, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 6.538865546218488, |
| "grad_norm": 0.8221429966093985, |
| "learning_rate": 5.28948417661701e-07, |
| "loss": 0.153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1630651354789734, |
| "step": 6225, |
| "valid_targets_mean": 2143.7, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 6.544117647058823, |
| "grad_norm": 0.8173958277347929, |
| "learning_rate": 5.170469416597223e-07, |
| "loss": 0.1617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14818143844604492, |
| "step": 6230, |
| "valid_targets_mean": 2997.8, |
| "valid_targets_min": 1061 |
| }, |
| { |
| "epoch": 6.54936974789916, |
| "grad_norm": 0.7574217024984009, |
| "learning_rate": 5.05279133270633e-07, |
| "loss": 0.1438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1506175696849823, |
| "step": 6235, |
| "valid_targets_mean": 2813.8, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 6.554621848739496, |
| "grad_norm": 0.8789551921829356, |
| "learning_rate": 4.936450732303866e-07, |
| "loss": 0.1648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17505599558353424, |
| "step": 6240, |
| "valid_targets_mean": 2185.9, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 6.559873949579832, |
| "grad_norm": 0.7800209416470806, |
| "learning_rate": 4.821448413573237e-07, |
| "loss": 0.1542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1431932896375656, |
| "step": 6245, |
| "valid_targets_mean": 2216.9, |
| "valid_targets_min": 759 |
| }, |
| { |
| "epoch": 6.565126050420168, |
| "grad_norm": 0.7715463308797006, |
| "learning_rate": 4.70778516551631e-07, |
| "loss": 0.162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15793776512145996, |
| "step": 6250, |
| "valid_targets_mean": 2604.6, |
| "valid_targets_min": 873 |
| }, |
| { |
| "epoch": 6.570378151260504, |
| "grad_norm": 0.7929402427060284, |
| "learning_rate": 4.595461767947829e-07, |
| "loss": 0.1543, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17367711663246155, |
| "step": 6255, |
| "valid_targets_mean": 2793.5, |
| "valid_targets_min": 890 |
| }, |
| { |
| "epoch": 6.57563025210084, |
| "grad_norm": 0.7558379818924563, |
| "learning_rate": 4.484478991490249e-07, |
| "loss": 0.1504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1597421020269394, |
| "step": 6260, |
| "valid_targets_mean": 2706.1, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 6.580882352941177, |
| "grad_norm": 0.8203283121654529, |
| "learning_rate": 4.374837597568338e-07, |
| "loss": 0.1526, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13600069284439087, |
| "step": 6265, |
| "valid_targets_mean": 2013.9, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 6.586134453781512, |
| "grad_norm": 0.7685017317264076, |
| "learning_rate": 4.266538338403936e-07, |
| "loss": 0.147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1418771594762802, |
| "step": 6270, |
| "valid_targets_mean": 2087.0, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 6.591386554621849, |
| "grad_norm": 0.7689705022584826, |
| "learning_rate": 4.159581957010894e-07, |
| "loss": 0.149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15910068154335022, |
| "step": 6275, |
| "valid_targets_mean": 2749.8, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 6.5966386554621845, |
| "grad_norm": 0.8350274594286426, |
| "learning_rate": 4.0539691871898545e-07, |
| "loss": 0.1635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14839161932468414, |
| "step": 6280, |
| "valid_targets_mean": 2080.6, |
| "valid_targets_min": 941 |
| }, |
| { |
| "epoch": 6.601890756302521, |
| "grad_norm": 0.7123586297209112, |
| "learning_rate": 3.949700753523344e-07, |
| "loss": 0.1468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14631910622119904, |
| "step": 6285, |
| "valid_targets_mean": 2960.0, |
| "valid_targets_min": 763 |
| }, |
| { |
| "epoch": 6.607142857142857, |
| "grad_norm": 0.7608218792468966, |
| "learning_rate": 3.8467773713707134e-07, |
| "loss": 0.1494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14922720193862915, |
| "step": 6290, |
| "valid_targets_mean": 2525.2, |
| "valid_targets_min": 1231 |
| }, |
| { |
| "epoch": 6.612394957983193, |
| "grad_norm": 0.781295609634859, |
| "learning_rate": 3.7451997468632486e-07, |
| "loss": 0.142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1524946689605713, |
| "step": 6295, |
| "valid_targets_mean": 2446.9, |
| "valid_targets_min": 692 |
| }, |
| { |
| "epoch": 6.617647058823529, |
| "grad_norm": 1.3621692596047696, |
| "learning_rate": 3.6449685768993327e-07, |
| "loss": 0.1563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15170569717884064, |
| "step": 6300, |
| "valid_targets_mean": 2007.3, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 6.6228991596638656, |
| "grad_norm": 0.9081109225494257, |
| "learning_rate": 3.5460845491396944e-07, |
| "loss": 0.1547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.154941126704216, |
| "step": 6305, |
| "valid_targets_mean": 2046.6, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 6.628151260504202, |
| "grad_norm": 0.7545604154002317, |
| "learning_rate": 3.448548342002589e-07, |
| "loss": 0.1534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15161868929862976, |
| "step": 6310, |
| "valid_targets_mean": 2837.8, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 6.633403361344538, |
| "grad_norm": 0.8680496469961246, |
| "learning_rate": 3.352360624659312e-07, |
| "loss": 0.16, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1834527552127838, |
| "step": 6315, |
| "valid_targets_mean": 2255.1, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 6.6386554621848735, |
| "grad_norm": 0.7171097775844976, |
| "learning_rate": 3.2575220570294276e-07, |
| "loss": 0.1529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15503129363059998, |
| "step": 6320, |
| "valid_targets_mean": 2962.4, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 6.64390756302521, |
| "grad_norm": 0.6658600775544034, |
| "learning_rate": 3.164033289776369e-07, |
| "loss": 0.1423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12674590945243835, |
| "step": 6325, |
| "valid_targets_mean": 2999.2, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 6.649159663865547, |
| "grad_norm": 0.7748035457490327, |
| "learning_rate": 3.071894964302935e-07, |
| "loss": 0.1477, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16250720620155334, |
| "step": 6330, |
| "valid_targets_mean": 2583.9, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 6.654411764705882, |
| "grad_norm": 0.7894017447041788, |
| "learning_rate": 2.981107712746867e-07, |
| "loss": 0.1448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14615963399410248, |
| "step": 6335, |
| "valid_targets_mean": 2359.9, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 6.659663865546219, |
| "grad_norm": 0.7275796769976358, |
| "learning_rate": 2.891672157976522e-07, |
| "loss": 0.1389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1456836611032486, |
| "step": 6340, |
| "valid_targets_mean": 2687.1, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 6.6649159663865545, |
| "grad_norm": 0.7464610444598423, |
| "learning_rate": 2.803588913586608e-07, |
| "loss": 0.154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15692494809627533, |
| "step": 6345, |
| "valid_targets_mean": 2862.6, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 6.670168067226891, |
| "grad_norm": 0.7409587755798085, |
| "learning_rate": 2.716858583894033e-07, |
| "loss": 0.1586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14683926105499268, |
| "step": 6350, |
| "valid_targets_mean": 2565.6, |
| "valid_targets_min": 1187 |
| }, |
| { |
| "epoch": 6.675420168067227, |
| "grad_norm": 0.8489660086658728, |
| "learning_rate": 2.6314817639335964e-07, |
| "loss": 0.1486, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14783814549446106, |
| "step": 6355, |
| "valid_targets_mean": 2178.1, |
| "valid_targets_min": 1163 |
| }, |
| { |
| "epoch": 6.680672268907563, |
| "grad_norm": 0.7446724408854097, |
| "learning_rate": 2.547459039454103e-07, |
| "loss": 0.1542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13613933324813843, |
| "step": 6360, |
| "valid_targets_mean": 2619.4, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 6.685924369747899, |
| "grad_norm": 0.7468301149926823, |
| "learning_rate": 2.4647909869142117e-07, |
| "loss": 0.15, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15531302988529205, |
| "step": 6365, |
| "valid_targets_mean": 2749.7, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 6.6911764705882355, |
| "grad_norm": 0.8038823609900482, |
| "learning_rate": 2.3834781734784817e-07, |
| "loss": 0.1534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14846262335777283, |
| "step": 6370, |
| "valid_targets_mean": 2125.0, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 6.696428571428571, |
| "grad_norm": 0.7769587079233549, |
| "learning_rate": 2.3035211570135995e-07, |
| "loss": 0.1528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1341462880373001, |
| "step": 6375, |
| "valid_targets_mean": 1821.1, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 6.701680672268908, |
| "grad_norm": 0.7298168762864212, |
| "learning_rate": 2.224920486084403e-07, |
| "loss": 0.1586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15344950556755066, |
| "step": 6380, |
| "valid_targets_mean": 2839.2, |
| "valid_targets_min": 1147 |
| }, |
| { |
| "epoch": 6.706932773109243, |
| "grad_norm": 0.778338115342936, |
| "learning_rate": 2.1476766999502408e-07, |
| "loss": 0.1428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13469842076301575, |
| "step": 6385, |
| "valid_targets_mean": 2178.6, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 6.71218487394958, |
| "grad_norm": 0.816451492189734, |
| "learning_rate": 2.071790328561152e-07, |
| "loss": 0.1497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15425826609134674, |
| "step": 6390, |
| "valid_targets_mean": 2324.4, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 6.717436974789916, |
| "grad_norm": 0.8201419970370695, |
| "learning_rate": 1.997261892554403e-07, |
| "loss": 0.1563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15658767521381378, |
| "step": 6395, |
| "valid_targets_mean": 2310.4, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 6.722689075630252, |
| "grad_norm": 0.7500376618247141, |
| "learning_rate": 1.9240919032506688e-07, |
| "loss": 0.147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14455173909664154, |
| "step": 6400, |
| "valid_targets_mean": 2628.5, |
| "valid_targets_min": 474 |
| }, |
| { |
| "epoch": 6.727941176470588, |
| "grad_norm": 0.7584572682030627, |
| "learning_rate": 1.8522808626507683e-07, |
| "loss": 0.151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15599125623703003, |
| "step": 6405, |
| "valid_targets_mean": 2658.8, |
| "valid_targets_min": 420 |
| }, |
| { |
| "epoch": 6.733193277310924, |
| "grad_norm": 0.7357895023796207, |
| "learning_rate": 1.781829263432111e-07, |
| "loss": 0.1594, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14581039547920227, |
| "step": 6410, |
| "valid_targets_mean": 2959.5, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 6.73844537815126, |
| "grad_norm": 0.6891830564600709, |
| "learning_rate": 1.7127375889452569e-07, |
| "loss": 0.1528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13923324644565582, |
| "step": 6415, |
| "valid_targets_mean": 2834.0, |
| "valid_targets_min": 1194 |
| }, |
| { |
| "epoch": 6.743697478991597, |
| "grad_norm": 0.7199729752533398, |
| "learning_rate": 1.6450063132107396e-07, |
| "loss": 0.1479, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1373451054096222, |
| "step": 6420, |
| "valid_targets_mean": 2572.8, |
| "valid_targets_min": 626 |
| }, |
| { |
| "epoch": 6.748949579831933, |
| "grad_norm": 0.7647019920185888, |
| "learning_rate": 1.5786359009156928e-07, |
| "loss": 0.1433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15924891829490662, |
| "step": 6425, |
| "valid_targets_mean": 2990.7, |
| "valid_targets_min": 793 |
| }, |
| { |
| "epoch": 6.754201680672269, |
| "grad_norm": 0.8310727483362449, |
| "learning_rate": 1.5136268074107398e-07, |
| "loss": 0.157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1688929796218872, |
| "step": 6430, |
| "valid_targets_mean": 2370.5, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 6.759453781512605, |
| "grad_norm": 0.825061605955483, |
| "learning_rate": 1.44997947870682e-07, |
| "loss": 0.1639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16266357898712158, |
| "step": 6435, |
| "valid_targets_mean": 2281.9, |
| "valid_targets_min": 1074 |
| }, |
| { |
| "epoch": 6.764705882352941, |
| "grad_norm": 0.8533595418248784, |
| "learning_rate": 1.3876943514721465e-07, |
| "loss": 0.1525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16743487119674683, |
| "step": 6440, |
| "valid_targets_mean": 2262.5, |
| "valid_targets_min": 970 |
| }, |
| { |
| "epoch": 6.769957983193278, |
| "grad_norm": 0.7748683785377023, |
| "learning_rate": 1.3267718530292296e-07, |
| "loss": 0.1554, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14080220460891724, |
| "step": 6445, |
| "valid_targets_mean": 2343.4, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 6.775210084033613, |
| "grad_norm": 0.8320606022762239, |
| "learning_rate": 1.267212401351925e-07, |
| "loss": 0.16, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1550496518611908, |
| "step": 6450, |
| "valid_targets_mean": 2402.6, |
| "valid_targets_min": 857 |
| }, |
| { |
| "epoch": 6.78046218487395, |
| "grad_norm": 0.7474317684737926, |
| "learning_rate": 1.2090164050625907e-07, |
| "loss": 0.1736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16620126366615295, |
| "step": 6455, |
| "valid_targets_mean": 3082.7, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 6.785714285714286, |
| "grad_norm": 0.9565980511087515, |
| "learning_rate": 1.1521842634292013e-07, |
| "loss": 0.1559, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.160188689827919, |
| "step": 6460, |
| "valid_targets_mean": 1479.5, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 6.790966386554622, |
| "grad_norm": 0.8532947647691757, |
| "learning_rate": 1.0967163663627044e-07, |
| "loss": 0.15, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15419529378414154, |
| "step": 6465, |
| "valid_targets_mean": 2052.6, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 6.796218487394958, |
| "grad_norm": 0.8255781206219238, |
| "learning_rate": 1.0426130944143353e-07, |
| "loss": 0.151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14306730031967163, |
| "step": 6470, |
| "valid_targets_mean": 1963.2, |
| "valid_targets_min": 830 |
| }, |
| { |
| "epoch": 6.801470588235294, |
| "grad_norm": 0.8837049669576724, |
| "learning_rate": 9.898748187729513e-08, |
| "loss": 0.1549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15094450116157532, |
| "step": 6475, |
| "valid_targets_mean": 2181.6, |
| "valid_targets_min": 919 |
| }, |
| { |
| "epoch": 6.80672268907563, |
| "grad_norm": 0.7790666833598698, |
| "learning_rate": 9.385019012625007e-08, |
| "loss": 0.1469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14933770895004272, |
| "step": 6480, |
| "valid_targets_mean": 2469.9, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 6.811974789915967, |
| "grad_norm": 0.9087222050552412, |
| "learning_rate": 8.884946943395811e-08, |
| "loss": 0.1573, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16928185522556305, |
| "step": 6485, |
| "valid_targets_mean": 1823.7, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 6.817226890756302, |
| "grad_norm": 0.7419966743487549, |
| "learning_rate": 8.398535410910402e-08, |
| "loss": 0.161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16752246022224426, |
| "step": 6490, |
| "valid_targets_mean": 3067.3, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 6.822478991596639, |
| "grad_norm": 0.7768443736140654, |
| "learning_rate": 7.925787752314674e-08, |
| "loss": 0.1552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14006970822811127, |
| "step": 6495, |
| "valid_targets_mean": 2286.3, |
| "valid_targets_min": 837 |
| }, |
| { |
| "epoch": 6.8277310924369745, |
| "grad_norm": 0.7839422460590042, |
| "learning_rate": 7.466707211010838e-08, |
| "loss": 0.1526, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15227356553077698, |
| "step": 6500, |
| "valid_targets_mean": 2435.8, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 6.832983193277311, |
| "grad_norm": 0.8085913813487312, |
| "learning_rate": 7.02129693663478e-08, |
| "loss": 0.1468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14806930720806122, |
| "step": 6505, |
| "valid_targets_mean": 2763.4, |
| "valid_targets_min": 809 |
| }, |
| { |
| "epoch": 6.838235294117647, |
| "grad_norm": 0.830479023779582, |
| "learning_rate": 6.589559985033189e-08, |
| "loss": 0.1577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15857365727424622, |
| "step": 6510, |
| "valid_targets_mean": 2199.1, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 6.843487394957983, |
| "grad_norm": 0.7805037615428879, |
| "learning_rate": 6.171499318244234e-08, |
| "loss": 0.1557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1644633412361145, |
| "step": 6515, |
| "valid_targets_mean": 2826.9, |
| "valid_targets_min": 1091 |
| }, |
| { |
| "epoch": 6.848739495798319, |
| "grad_norm": 0.8243868421023237, |
| "learning_rate": 5.767117804476696e-08, |
| "loss": 0.1468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1619555652141571, |
| "step": 6520, |
| "valid_targets_mean": 2291.1, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 6.8539915966386555, |
| "grad_norm": 0.6718196143534856, |
| "learning_rate": 5.376418218089541e-08, |
| "loss": 0.1468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1486797034740448, |
| "step": 6525, |
| "valid_targets_mean": 3316.1, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 6.859243697478991, |
| "grad_norm": 0.7639600711267872, |
| "learning_rate": 4.99940323957393e-08, |
| "loss": 0.1506, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15114453434944153, |
| "step": 6530, |
| "valid_targets_mean": 2355.1, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 6.864495798319328, |
| "grad_norm": 0.7434040074285687, |
| "learning_rate": 4.63607545553435e-08, |
| "loss": 0.1491, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16190582513809204, |
| "step": 6535, |
| "valid_targets_mean": 2631.9, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 6.869747899159664, |
| "grad_norm": 0.7576726635038536, |
| "learning_rate": 4.2864373586706254e-08, |
| "loss": 0.1539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1667475700378418, |
| "step": 6540, |
| "valid_targets_mean": 3037.7, |
| "valid_targets_min": 1256 |
| }, |
| { |
| "epoch": 6.875, |
| "grad_norm": 0.7949042840267881, |
| "learning_rate": 3.950491347761487e-08, |
| "loss": 0.1534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15799729526042938, |
| "step": 6545, |
| "valid_targets_mean": 2813.3, |
| "valid_targets_min": 981 |
| }, |
| { |
| "epoch": 6.880252100840336, |
| "grad_norm": 0.7599470557620672, |
| "learning_rate": 3.628239727647254e-08, |
| "loss": 0.1517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14834260940551758, |
| "step": 6550, |
| "valid_targets_mean": 2786.1, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 6.885504201680672, |
| "grad_norm": 0.7438096344765326, |
| "learning_rate": 3.319684709215176e-08, |
| "loss": 0.1488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1484309434890747, |
| "step": 6555, |
| "valid_targets_mean": 2842.8, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 6.890756302521009, |
| "grad_norm": 0.8034592781374419, |
| "learning_rate": 3.024828409383007e-08, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1651192605495453, |
| "step": 6560, |
| "valid_targets_mean": 2401.8, |
| "valid_targets_min": 1118 |
| }, |
| { |
| "epoch": 6.8960084033613445, |
| "grad_norm": 0.7481979263488755, |
| "learning_rate": 2.743672851085233e-08, |
| "loss": 0.1447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13949503004550934, |
| "step": 6565, |
| "valid_targets_mean": 2675.6, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 6.901260504201681, |
| "grad_norm": 0.8092072610442079, |
| "learning_rate": 2.4762199632588634e-08, |
| "loss": 0.1466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17036761343479156, |
| "step": 6570, |
| "valid_targets_mean": 2485.1, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 6.906512605042017, |
| "grad_norm": 0.8049873065525076, |
| "learning_rate": 2.2224715808309983e-08, |
| "loss": 0.156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15256905555725098, |
| "step": 6575, |
| "valid_targets_mean": 2644.2, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 6.911764705882353, |
| "grad_norm": 0.8617962635473019, |
| "learning_rate": 1.9824294447043923e-08, |
| "loss": 0.1571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15142729878425598, |
| "step": 6580, |
| "valid_targets_mean": 2083.2, |
| "valid_targets_min": 512 |
| }, |
| { |
| "epoch": 6.917016806722689, |
| "grad_norm": 0.8008776691217604, |
| "learning_rate": 1.7560952017481313e-08, |
| "loss": 0.1515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1459037810564041, |
| "step": 6585, |
| "valid_targets_mean": 2554.2, |
| "valid_targets_min": 952 |
| }, |
| { |
| "epoch": 6.9222689075630255, |
| "grad_norm": 0.7191951703364022, |
| "learning_rate": 1.5434704047836424e-08, |
| "loss": 0.1475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.145742267370224, |
| "step": 6590, |
| "valid_targets_mean": 2792.4, |
| "valid_targets_min": 651 |
| }, |
| { |
| "epoch": 6.927521008403361, |
| "grad_norm": 0.7871859947545846, |
| "learning_rate": 1.344556512576256e-08, |
| "loss": 0.1575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1482214331626892, |
| "step": 6595, |
| "valid_targets_mean": 2457.0, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 6.932773109243698, |
| "grad_norm": 0.7643202727978451, |
| "learning_rate": 1.1593548898236606e-08, |
| "loss": 0.162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15590517222881317, |
| "step": 6600, |
| "valid_targets_mean": 2423.8, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 6.938025210084033, |
| "grad_norm": 0.8242802199893152, |
| "learning_rate": 9.878668071474639e-09, |
| "loss": 0.1556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1575925648212433, |
| "step": 6605, |
| "valid_targets_mean": 2134.1, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 6.94327731092437, |
| "grad_norm": 0.7939290019589629, |
| "learning_rate": 8.3009344108409e-09, |
| "loss": 0.1626, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1599077582359314, |
| "step": 6610, |
| "valid_targets_mean": 2462.1, |
| "valid_targets_min": 1122 |
| }, |
| { |
| "epoch": 6.948529411764706, |
| "grad_norm": 0.8359337734301073, |
| "learning_rate": 6.860358740763406e-09, |
| "loss": 0.1607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15786179900169373, |
| "step": 6615, |
| "valid_targets_mean": 2346.8, |
| "valid_targets_min": 628 |
| }, |
| { |
| "epoch": 6.953781512605042, |
| "grad_norm": 0.8230966514103626, |
| "learning_rate": 5.55695094467179e-09, |
| "loss": 0.1569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15767702460289001, |
| "step": 6620, |
| "valid_targets_mean": 2301.7, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 6.959033613445378, |
| "grad_norm": 0.8839955512653498, |
| "learning_rate": 4.3907199649151355e-09, |
| "loss": 0.1555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14466795325279236, |
| "step": 6625, |
| "valid_targets_mean": 1904.7, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 6.964285714285714, |
| "grad_norm": 0.7315947556803873, |
| "learning_rate": 3.361673802708687e-09, |
| "loss": 0.1543, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1519755721092224, |
| "step": 6630, |
| "valid_targets_mean": 2944.4, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 6.96953781512605, |
| "grad_norm": 0.9022304224894817, |
| "learning_rate": 2.469819518080563e-09, |
| "loss": 0.1613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1760965883731842, |
| "step": 6635, |
| "valid_targets_mean": 2122.0, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 6.974789915966387, |
| "grad_norm": 0.9761476002877811, |
| "learning_rate": 1.7151632298140209e-09, |
| "loss": 0.1531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14784833788871765, |
| "step": 6640, |
| "valid_targets_mean": 2816.7, |
| "valid_targets_min": 1127 |
| }, |
| { |
| "epoch": 6.980042016806722, |
| "grad_norm": 0.7716322233500594, |
| "learning_rate": 1.0977101154163727e-09, |
| "loss": 0.1524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.155085951089859, |
| "step": 6645, |
| "valid_targets_mean": 2472.3, |
| "valid_targets_min": 1348 |
| }, |
| { |
| "epoch": 6.985294117647059, |
| "grad_norm": 0.8463421638101505, |
| "learning_rate": 6.174644110767958e-10, |
| "loss": 0.1534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16529741883277893, |
| "step": 6650, |
| "valid_targets_mean": 2150.7, |
| "valid_targets_min": 842 |
| }, |
| { |
| "epoch": 6.990546218487395, |
| "grad_norm": 0.7405547503921337, |
| "learning_rate": 2.744294116419077e-10, |
| "loss": 0.146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13631612062454224, |
| "step": 6655, |
| "valid_targets_mean": 2381.4, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 6.995798319327731, |
| "grad_norm": 0.8184309324867913, |
| "learning_rate": 6.860747058468064e-11, |
| "loss": 0.1481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15874159336090088, |
| "step": 6660, |
| "valid_targets_mean": 2120.4, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1511024534702301, |
| "step": 6664, |
| "total_flos": 1189037529694208.0, |
| "train_loss": 0.22791378844041926, |
| "train_runtime": 28576.9639, |
| "train_samples_per_second": 3.731, |
| "train_steps_per_second": 0.233, |
| "valid_targets_mean": 3122.5, |
| "valid_targets_min": 647 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 6664, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 200, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 1189037529694208.0, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|