| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 4368, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.008012820512820512, |
| "grad_norm": 8.40942474050559, |
| "learning_rate": 3.661327231121282e-07, |
| "loss": 0.8612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4234336018562317, |
| "step": 5, |
| "valid_targets_mean": 2232.1, |
| "valid_targets_min": 951 |
| }, |
| { |
| "epoch": 0.016025641025641024, |
| "grad_norm": 8.48364139790815, |
| "learning_rate": 8.237986270022884e-07, |
| "loss": 0.8812, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4549936056137085, |
| "step": 10, |
| "valid_targets_mean": 2954.6, |
| "valid_targets_min": 2024 |
| }, |
| { |
| "epoch": 0.02403846153846154, |
| "grad_norm": 8.720393584369761, |
| "learning_rate": 1.2814645308924487e-06, |
| "loss": 0.9171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4603043496608734, |
| "step": 15, |
| "valid_targets_mean": 2330.5, |
| "valid_targets_min": 1188 |
| }, |
| { |
| "epoch": 0.03205128205128205, |
| "grad_norm": 6.401065214818598, |
| "learning_rate": 1.7391304347826088e-06, |
| "loss": 0.8352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3336380124092102, |
| "step": 20, |
| "valid_targets_mean": 1985.0, |
| "valid_targets_min": 455 |
| }, |
| { |
| "epoch": 0.04006410256410257, |
| "grad_norm": 4.816552094508015, |
| "learning_rate": 2.196796338672769e-06, |
| "loss": 0.8584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40010353922843933, |
| "step": 25, |
| "valid_targets_mean": 2756.9, |
| "valid_targets_min": 929 |
| }, |
| { |
| "epoch": 0.04807692307692308, |
| "grad_norm": 4.335386813313282, |
| "learning_rate": 2.654462242562929e-06, |
| "loss": 0.7732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4342009425163269, |
| "step": 30, |
| "valid_targets_mean": 2161.2, |
| "valid_targets_min": 1193 |
| }, |
| { |
| "epoch": 0.05608974358974359, |
| "grad_norm": 3.177645784938531, |
| "learning_rate": 3.1121281464530894e-06, |
| "loss": 0.748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3209277391433716, |
| "step": 35, |
| "valid_targets_mean": 2150.0, |
| "valid_targets_min": 1202 |
| }, |
| { |
| "epoch": 0.0641025641025641, |
| "grad_norm": 2.628557761103501, |
| "learning_rate": 3.56979405034325e-06, |
| "loss": 0.7037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3309406638145447, |
| "step": 40, |
| "valid_targets_mean": 2116.4, |
| "valid_targets_min": 475 |
| }, |
| { |
| "epoch": 0.07211538461538461, |
| "grad_norm": 1.7033923530978847, |
| "learning_rate": 4.0274599542334094e-06, |
| "loss": 0.679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24123963713645935, |
| "step": 45, |
| "valid_targets_mean": 1675.2, |
| "valid_targets_min": 435 |
| }, |
| { |
| "epoch": 0.08012820512820513, |
| "grad_norm": 1.4563809782956156, |
| "learning_rate": 4.48512585812357e-06, |
| "loss": 0.6983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31092941761016846, |
| "step": 50, |
| "valid_targets_mean": 2253.2, |
| "valid_targets_min": 1095 |
| }, |
| { |
| "epoch": 0.08814102564102565, |
| "grad_norm": 1.205430924212798, |
| "learning_rate": 4.94279176201373e-06, |
| "loss": 0.6497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3203188180923462, |
| "step": 55, |
| "valid_targets_mean": 2870.5, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 0.09615384615384616, |
| "grad_norm": 1.1392627369044308, |
| "learning_rate": 5.400457665903891e-06, |
| "loss": 0.6527, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30013489723205566, |
| "step": 60, |
| "valid_targets_mean": 2388.1, |
| "valid_targets_min": 1013 |
| }, |
| { |
| "epoch": 0.10416666666666667, |
| "grad_norm": 1.1352639246979592, |
| "learning_rate": 5.858123569794051e-06, |
| "loss": 0.5812, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.349726140499115, |
| "step": 65, |
| "valid_targets_mean": 2654.9, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 0.11217948717948718, |
| "grad_norm": 0.9808130025882383, |
| "learning_rate": 6.31578947368421e-06, |
| "loss": 0.5923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3157884478569031, |
| "step": 70, |
| "valid_targets_mean": 2987.8, |
| "valid_targets_min": 1489 |
| }, |
| { |
| "epoch": 0.1201923076923077, |
| "grad_norm": 0.9209470326055519, |
| "learning_rate": 6.773455377574372e-06, |
| "loss": 0.6071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3476266860961914, |
| "step": 75, |
| "valid_targets_mean": 2909.8, |
| "valid_targets_min": 1067 |
| }, |
| { |
| "epoch": 0.1282051282051282, |
| "grad_norm": 0.9674711198015653, |
| "learning_rate": 7.231121281464531e-06, |
| "loss": 0.5622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25228625535964966, |
| "step": 80, |
| "valid_targets_mean": 2015.8, |
| "valid_targets_min": 1036 |
| }, |
| { |
| "epoch": 0.1362179487179487, |
| "grad_norm": 0.9614682889742122, |
| "learning_rate": 7.688787185354691e-06, |
| "loss": 0.5662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23659241199493408, |
| "step": 85, |
| "valid_targets_mean": 1919.0, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 0.14423076923076922, |
| "grad_norm": 0.9793609220779523, |
| "learning_rate": 8.146453089244852e-06, |
| "loss": 0.5578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2640606164932251, |
| "step": 90, |
| "valid_targets_mean": 1888.8, |
| "valid_targets_min": 1484 |
| }, |
| { |
| "epoch": 0.15224358974358973, |
| "grad_norm": 0.7747222745750588, |
| "learning_rate": 8.604118993135013e-06, |
| "loss": 0.5403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20079509913921356, |
| "step": 95, |
| "valid_targets_mean": 2408.2, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 0.16025641025641027, |
| "grad_norm": 0.8968672399440782, |
| "learning_rate": 9.061784897025172e-06, |
| "loss": 0.5561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2350616157054901, |
| "step": 100, |
| "valid_targets_mean": 2021.5, |
| "valid_targets_min": 1011 |
| }, |
| { |
| "epoch": 0.16826923076923078, |
| "grad_norm": 0.8578003953330227, |
| "learning_rate": 9.519450800915333e-06, |
| "loss": 0.546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32088974118232727, |
| "step": 105, |
| "valid_targets_mean": 3198.9, |
| "valid_targets_min": 1398 |
| }, |
| { |
| "epoch": 0.1762820512820513, |
| "grad_norm": 0.9775604038641746, |
| "learning_rate": 9.977116704805492e-06, |
| "loss": 0.5408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2899416387081146, |
| "step": 110, |
| "valid_targets_mean": 1989.8, |
| "valid_targets_min": 1233 |
| }, |
| { |
| "epoch": 0.1842948717948718, |
| "grad_norm": 0.9484746064620678, |
| "learning_rate": 1.0434782608695653e-05, |
| "loss": 0.5271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30604788661003113, |
| "step": 115, |
| "valid_targets_mean": 2266.0, |
| "valid_targets_min": 1375 |
| }, |
| { |
| "epoch": 0.19230769230769232, |
| "grad_norm": 0.746255880008432, |
| "learning_rate": 1.0892448512585814e-05, |
| "loss": 0.4977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20729142427444458, |
| "step": 120, |
| "valid_targets_mean": 2384.1, |
| "valid_targets_min": 218 |
| }, |
| { |
| "epoch": 0.20032051282051283, |
| "grad_norm": 0.7438833264963527, |
| "learning_rate": 1.1350114416475973e-05, |
| "loss": 0.5253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22926843166351318, |
| "step": 125, |
| "valid_targets_mean": 2618.1, |
| "valid_targets_min": 1108 |
| }, |
| { |
| "epoch": 0.20833333333333334, |
| "grad_norm": 0.8570205673450283, |
| "learning_rate": 1.1807780320366134e-05, |
| "loss": 0.5036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24288621544837952, |
| "step": 130, |
| "valid_targets_mean": 1906.1, |
| "valid_targets_min": 944 |
| }, |
| { |
| "epoch": 0.21634615384615385, |
| "grad_norm": 0.9417163414734101, |
| "learning_rate": 1.2265446224256295e-05, |
| "loss": 0.5166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2769995927810669, |
| "step": 135, |
| "valid_targets_mean": 2436.2, |
| "valid_targets_min": 1533 |
| }, |
| { |
| "epoch": 0.22435897435897437, |
| "grad_norm": 0.9860064049785607, |
| "learning_rate": 1.2723112128146454e-05, |
| "loss": 0.5362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32120639085769653, |
| "step": 140, |
| "valid_targets_mean": 2255.4, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 0.23237179487179488, |
| "grad_norm": 0.7640125489075233, |
| "learning_rate": 1.3180778032036615e-05, |
| "loss": 0.5095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2866376042366028, |
| "step": 145, |
| "valid_targets_mean": 3077.4, |
| "valid_targets_min": 1777 |
| }, |
| { |
| "epoch": 0.2403846153846154, |
| "grad_norm": 1.0242816861010413, |
| "learning_rate": 1.3638443935926776e-05, |
| "loss": 0.5142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3341456651687622, |
| "step": 150, |
| "valid_targets_mean": 2355.0, |
| "valid_targets_min": 1100 |
| }, |
| { |
| "epoch": 0.2483974358974359, |
| "grad_norm": 0.642501178965298, |
| "learning_rate": 1.4096109839816933e-05, |
| "loss": 0.4688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22167231142520905, |
| "step": 155, |
| "valid_targets_mean": 3613.2, |
| "valid_targets_min": 1137 |
| }, |
| { |
| "epoch": 0.2564102564102564, |
| "grad_norm": 0.9373104786339153, |
| "learning_rate": 1.4553775743707096e-05, |
| "loss": 0.5145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24051184952259064, |
| "step": 160, |
| "valid_targets_mean": 2034.8, |
| "valid_targets_min": 1050 |
| }, |
| { |
| "epoch": 0.2644230769230769, |
| "grad_norm": 0.9417451887793393, |
| "learning_rate": 1.5011441647597256e-05, |
| "loss": 0.5141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25027361512184143, |
| "step": 165, |
| "valid_targets_mean": 1953.4, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 0.2724358974358974, |
| "grad_norm": 0.794295403588529, |
| "learning_rate": 1.5469107551487414e-05, |
| "loss": 0.4797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2761167287826538, |
| "step": 170, |
| "valid_targets_mean": 2741.1, |
| "valid_targets_min": 778 |
| }, |
| { |
| "epoch": 0.28044871794871795, |
| "grad_norm": 1.041873213895435, |
| "learning_rate": 1.5926773455377575e-05, |
| "loss": 0.5241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23646000027656555, |
| "step": 175, |
| "valid_targets_mean": 1639.4, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 0.28846153846153844, |
| "grad_norm": 0.7688575732221453, |
| "learning_rate": 1.6384439359267736e-05, |
| "loss": 0.4861, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2567122280597687, |
| "step": 180, |
| "valid_targets_mean": 2919.0, |
| "valid_targets_min": 1857 |
| }, |
| { |
| "epoch": 0.296474358974359, |
| "grad_norm": 0.7996959350311494, |
| "learning_rate": 1.6842105263157896e-05, |
| "loss": 0.5048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23176565766334534, |
| "step": 185, |
| "valid_targets_mean": 2770.1, |
| "valid_targets_min": 1156 |
| }, |
| { |
| "epoch": 0.30448717948717946, |
| "grad_norm": 0.9438242229304544, |
| "learning_rate": 1.7299771167048057e-05, |
| "loss": 0.4708, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22697538137435913, |
| "step": 190, |
| "valid_targets_mean": 2171.6, |
| "valid_targets_min": 498 |
| }, |
| { |
| "epoch": 0.3125, |
| "grad_norm": 0.7852768168325834, |
| "learning_rate": 1.7757437070938218e-05, |
| "loss": 0.4839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16673338413238525, |
| "step": 195, |
| "valid_targets_mean": 2226.2, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 0.32051282051282054, |
| "grad_norm": 0.8328845202469579, |
| "learning_rate": 1.8215102974828376e-05, |
| "loss": 0.4659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20564012229442596, |
| "step": 200, |
| "valid_targets_mean": 1902.9, |
| "valid_targets_min": 1076 |
| }, |
| { |
| "epoch": 0.328525641025641, |
| "grad_norm": 0.9107558293954876, |
| "learning_rate": 1.8672768878718537e-05, |
| "loss": 0.4652, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26834234595298767, |
| "step": 205, |
| "valid_targets_mean": 2476.9, |
| "valid_targets_min": 1814 |
| }, |
| { |
| "epoch": 0.33653846153846156, |
| "grad_norm": 1.040043168249784, |
| "learning_rate": 1.9130434782608697e-05, |
| "loss": 0.4763, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26306286454200745, |
| "step": 210, |
| "valid_targets_mean": 2041.9, |
| "valid_targets_min": 787 |
| }, |
| { |
| "epoch": 0.34455128205128205, |
| "grad_norm": 0.9252302157522805, |
| "learning_rate": 1.9588100686498858e-05, |
| "loss": 0.4575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2265125960111618, |
| "step": 215, |
| "valid_targets_mean": 2354.1, |
| "valid_targets_min": 1473 |
| }, |
| { |
| "epoch": 0.3525641025641026, |
| "grad_norm": 0.887453457764969, |
| "learning_rate": 2.004576659038902e-05, |
| "loss": 0.4856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22299125790596008, |
| "step": 220, |
| "valid_targets_mean": 2139.2, |
| "valid_targets_min": 1048 |
| }, |
| { |
| "epoch": 0.3605769230769231, |
| "grad_norm": 0.9059800139169017, |
| "learning_rate": 2.050343249427918e-05, |
| "loss": 0.4845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20266111195087433, |
| "step": 225, |
| "valid_targets_mean": 1946.6, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 0.3685897435897436, |
| "grad_norm": 0.7607704862440865, |
| "learning_rate": 2.0961098398169337e-05, |
| "loss": 0.449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26493844389915466, |
| "step": 230, |
| "valid_targets_mean": 3166.2, |
| "valid_targets_min": 1272 |
| }, |
| { |
| "epoch": 0.3766025641025641, |
| "grad_norm": 0.6967071079872735, |
| "learning_rate": 2.14187643020595e-05, |
| "loss": 0.4398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15973234176635742, |
| "step": 235, |
| "valid_targets_mean": 2076.8, |
| "valid_targets_min": 1075 |
| }, |
| { |
| "epoch": 0.38461538461538464, |
| "grad_norm": 0.9150501001631774, |
| "learning_rate": 2.187643020594966e-05, |
| "loss": 0.4443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2183428257703781, |
| "step": 240, |
| "valid_targets_mean": 2056.5, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 0.3926282051282051, |
| "grad_norm": 0.8206357901155347, |
| "learning_rate": 2.2334096109839817e-05, |
| "loss": 0.4821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24904729425907135, |
| "step": 245, |
| "valid_targets_mean": 2744.9, |
| "valid_targets_min": 1021 |
| }, |
| { |
| "epoch": 0.40064102564102566, |
| "grad_norm": 0.8526548730570999, |
| "learning_rate": 2.279176201372998e-05, |
| "loss": 0.4571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23037180304527283, |
| "step": 250, |
| "valid_targets_mean": 2357.2, |
| "valid_targets_min": 1310 |
| }, |
| { |
| "epoch": 0.40865384615384615, |
| "grad_norm": 0.7860731322180793, |
| "learning_rate": 2.3249427917620138e-05, |
| "loss": 0.462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2327589988708496, |
| "step": 255, |
| "valid_targets_mean": 2966.1, |
| "valid_targets_min": 1291 |
| }, |
| { |
| "epoch": 0.4166666666666667, |
| "grad_norm": 0.8509400671372361, |
| "learning_rate": 2.37070938215103e-05, |
| "loss": 0.4554, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25431883335113525, |
| "step": 260, |
| "valid_targets_mean": 2701.1, |
| "valid_targets_min": 2043 |
| }, |
| { |
| "epoch": 0.42467948717948717, |
| "grad_norm": 0.8864607945642146, |
| "learning_rate": 2.4164759725400463e-05, |
| "loss": 0.4772, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28384217619895935, |
| "step": 265, |
| "valid_targets_mean": 2266.1, |
| "valid_targets_min": 1127 |
| }, |
| { |
| "epoch": 0.4326923076923077, |
| "grad_norm": 0.9413869835853772, |
| "learning_rate": 2.462242562929062e-05, |
| "loss": 0.4575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19929912686347961, |
| "step": 270, |
| "valid_targets_mean": 1698.9, |
| "valid_targets_min": 428 |
| }, |
| { |
| "epoch": 0.4407051282051282, |
| "grad_norm": 0.744625538834592, |
| "learning_rate": 2.508009153318078e-05, |
| "loss": 0.4557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25119954347610474, |
| "step": 275, |
| "valid_targets_mean": 3835.0, |
| "valid_targets_min": 1842 |
| }, |
| { |
| "epoch": 0.44871794871794873, |
| "grad_norm": 0.7738314413345992, |
| "learning_rate": 2.5537757437070943e-05, |
| "loss": 0.4397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1962563693523407, |
| "step": 280, |
| "valid_targets_mean": 2279.1, |
| "valid_targets_min": 1198 |
| }, |
| { |
| "epoch": 0.4567307692307692, |
| "grad_norm": 2.4382247977127856, |
| "learning_rate": 2.59954233409611e-05, |
| "loss": 0.4564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21939444541931152, |
| "step": 285, |
| "valid_targets_mean": 2666.8, |
| "valid_targets_min": 743 |
| }, |
| { |
| "epoch": 0.46474358974358976, |
| "grad_norm": 0.8606788715900447, |
| "learning_rate": 2.645308924485126e-05, |
| "loss": 0.4799, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41101521253585815, |
| "step": 290, |
| "valid_targets_mean": 3653.4, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 0.47275641025641024, |
| "grad_norm": 0.838922125549497, |
| "learning_rate": 2.6910755148741422e-05, |
| "loss": 0.4761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2805629074573517, |
| "step": 295, |
| "valid_targets_mean": 2203.1, |
| "valid_targets_min": 1108 |
| }, |
| { |
| "epoch": 0.4807692307692308, |
| "grad_norm": 0.7860048976376676, |
| "learning_rate": 2.7368421052631583e-05, |
| "loss": 0.4227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1744893491268158, |
| "step": 300, |
| "valid_targets_mean": 2218.8, |
| "valid_targets_min": 1246 |
| }, |
| { |
| "epoch": 0.48878205128205127, |
| "grad_norm": 0.8718270447419633, |
| "learning_rate": 2.782608695652174e-05, |
| "loss": 0.4686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2293800711631775, |
| "step": 305, |
| "valid_targets_mean": 2349.2, |
| "valid_targets_min": 1010 |
| }, |
| { |
| "epoch": 0.4967948717948718, |
| "grad_norm": 0.809574476298245, |
| "learning_rate": 2.8283752860411904e-05, |
| "loss": 0.4505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.286695659160614, |
| "step": 310, |
| "valid_targets_mean": 2928.5, |
| "valid_targets_min": 1451 |
| }, |
| { |
| "epoch": 0.5048076923076923, |
| "grad_norm": 0.8560435039918013, |
| "learning_rate": 2.8741418764302062e-05, |
| "loss": 0.467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2741186320781708, |
| "step": 315, |
| "valid_targets_mean": 2153.1, |
| "valid_targets_min": 1418 |
| }, |
| { |
| "epoch": 0.5128205128205128, |
| "grad_norm": 0.8443849165623637, |
| "learning_rate": 2.9199084668192223e-05, |
| "loss": 0.513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18281307816505432, |
| "step": 320, |
| "valid_targets_mean": 1734.6, |
| "valid_targets_min": 416 |
| }, |
| { |
| "epoch": 0.5208333333333334, |
| "grad_norm": 0.8696802631590136, |
| "learning_rate": 2.9656750572082384e-05, |
| "loss": 0.4516, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18471366167068481, |
| "step": 325, |
| "valid_targets_mean": 1614.6, |
| "valid_targets_min": 990 |
| }, |
| { |
| "epoch": 0.5288461538461539, |
| "grad_norm": 0.8651062420057943, |
| "learning_rate": 3.0114416475972544e-05, |
| "loss": 0.468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2343977391719818, |
| "step": 330, |
| "valid_targets_mean": 2271.1, |
| "valid_targets_min": 1220 |
| }, |
| { |
| "epoch": 0.5368589743589743, |
| "grad_norm": 0.8409126784718626, |
| "learning_rate": 3.05720823798627e-05, |
| "loss": 0.4375, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2919655740261078, |
| "step": 335, |
| "valid_targets_mean": 3131.4, |
| "valid_targets_min": 1089 |
| }, |
| { |
| "epoch": 0.5448717948717948, |
| "grad_norm": 0.8010512826037681, |
| "learning_rate": 3.102974828375286e-05, |
| "loss": 0.4293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23436668515205383, |
| "step": 340, |
| "valid_targets_mean": 2680.4, |
| "valid_targets_min": 1639 |
| }, |
| { |
| "epoch": 0.5528846153846154, |
| "grad_norm": 0.7821405770402137, |
| "learning_rate": 3.1487414187643024e-05, |
| "loss": 0.4769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20524126291275024, |
| "step": 345, |
| "valid_targets_mean": 2733.0, |
| "valid_targets_min": 1029 |
| }, |
| { |
| "epoch": 0.5608974358974359, |
| "grad_norm": 0.7147060886685118, |
| "learning_rate": 3.1945080091533184e-05, |
| "loss": 0.4614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2542196810245514, |
| "step": 350, |
| "valid_targets_mean": 3058.1, |
| "valid_targets_min": 1283 |
| }, |
| { |
| "epoch": 0.5689102564102564, |
| "grad_norm": 0.7484160202180531, |
| "learning_rate": 3.240274599542334e-05, |
| "loss": 0.4498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13721662759780884, |
| "step": 355, |
| "valid_targets_mean": 1732.4, |
| "valid_targets_min": 327 |
| }, |
| { |
| "epoch": 0.5769230769230769, |
| "grad_norm": 0.9659130418383086, |
| "learning_rate": 3.2860411899313506e-05, |
| "loss": 0.4619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26037678122520447, |
| "step": 360, |
| "valid_targets_mean": 1845.2, |
| "valid_targets_min": 1478 |
| }, |
| { |
| "epoch": 0.5849358974358975, |
| "grad_norm": 1.148809792440573, |
| "learning_rate": 3.331807780320366e-05, |
| "loss": 0.4811, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24160519242286682, |
| "step": 365, |
| "valid_targets_mean": 2128.8, |
| "valid_targets_min": 1155 |
| }, |
| { |
| "epoch": 0.592948717948718, |
| "grad_norm": 0.7019051186772777, |
| "learning_rate": 3.377574370709382e-05, |
| "loss": 0.4261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25113967061042786, |
| "step": 370, |
| "valid_targets_mean": 3612.8, |
| "valid_targets_min": 1206 |
| }, |
| { |
| "epoch": 0.6009615384615384, |
| "grad_norm": 0.9679216066114925, |
| "learning_rate": 3.423340961098399e-05, |
| "loss": 0.4148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2699517607688904, |
| "step": 375, |
| "valid_targets_mean": 3150.4, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 0.6089743589743589, |
| "grad_norm": 0.7848117406315669, |
| "learning_rate": 3.469107551487414e-05, |
| "loss": 0.4402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20744790136814117, |
| "step": 380, |
| "valid_targets_mean": 2178.5, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 0.6169871794871795, |
| "grad_norm": 0.7080944591453242, |
| "learning_rate": 3.5148741418764304e-05, |
| "loss": 0.417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22987905144691467, |
| "step": 385, |
| "valid_targets_mean": 3240.8, |
| "valid_targets_min": 966 |
| }, |
| { |
| "epoch": 0.625, |
| "grad_norm": 0.8894368633337273, |
| "learning_rate": 3.5606407322654464e-05, |
| "loss": 0.4532, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20276543498039246, |
| "step": 390, |
| "valid_targets_mean": 1739.2, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 0.6330128205128205, |
| "grad_norm": 0.8437346929099193, |
| "learning_rate": 3.6064073226544625e-05, |
| "loss": 0.4301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2156563401222229, |
| "step": 395, |
| "valid_targets_mean": 2161.9, |
| "valid_targets_min": 1131 |
| }, |
| { |
| "epoch": 0.6410256410256411, |
| "grad_norm": 0.845119808027601, |
| "learning_rate": 3.6521739130434786e-05, |
| "loss": 0.4362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23626503348350525, |
| "step": 400, |
| "valid_targets_mean": 2326.6, |
| "valid_targets_min": 1025 |
| }, |
| { |
| "epoch": 0.6490384615384616, |
| "grad_norm": 0.8230495030251933, |
| "learning_rate": 3.697940503432495e-05, |
| "loss": 0.4493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21271054446697235, |
| "step": 405, |
| "valid_targets_mean": 2119.8, |
| "valid_targets_min": 1356 |
| }, |
| { |
| "epoch": 0.657051282051282, |
| "grad_norm": 0.7566270241967507, |
| "learning_rate": 3.743707093821511e-05, |
| "loss": 0.4543, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2143326699733734, |
| "step": 410, |
| "valid_targets_mean": 2758.8, |
| "valid_targets_min": 1504 |
| }, |
| { |
| "epoch": 0.6650641025641025, |
| "grad_norm": 0.8891093819684329, |
| "learning_rate": 3.789473684210526e-05, |
| "loss": 0.4541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21579736471176147, |
| "step": 415, |
| "valid_targets_mean": 2091.5, |
| "valid_targets_min": 1118 |
| }, |
| { |
| "epoch": 0.6730769230769231, |
| "grad_norm": 0.7308770194117645, |
| "learning_rate": 3.835240274599543e-05, |
| "loss": 0.422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18271571397781372, |
| "step": 420, |
| "valid_targets_mean": 2216.1, |
| "valid_targets_min": 1241 |
| }, |
| { |
| "epoch": 0.6810897435897436, |
| "grad_norm": 0.6733014520665108, |
| "learning_rate": 3.8810068649885584e-05, |
| "loss": 0.4426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1795242726802826, |
| "step": 425, |
| "valid_targets_mean": 2813.6, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 0.6891025641025641, |
| "grad_norm": 0.9209305153321826, |
| "learning_rate": 3.9267734553775745e-05, |
| "loss": 0.4429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22252072393894196, |
| "step": 430, |
| "valid_targets_mean": 1781.4, |
| "valid_targets_min": 1204 |
| }, |
| { |
| "epoch": 0.6971153846153846, |
| "grad_norm": 0.7008996722806253, |
| "learning_rate": 3.9725400457665905e-05, |
| "loss": 0.4391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22679556906223297, |
| "step": 435, |
| "valid_targets_mean": 3189.6, |
| "valid_targets_min": 1315 |
| }, |
| { |
| "epoch": 0.7051282051282052, |
| "grad_norm": 0.7933102403594852, |
| "learning_rate": 3.999997445219712e-05, |
| "loss": 0.4132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21799099445343018, |
| "step": 440, |
| "valid_targets_mean": 2205.4, |
| "valid_targets_min": 1392 |
| }, |
| { |
| "epoch": 0.7131410256410257, |
| "grad_norm": 0.71765578245187, |
| "learning_rate": 3.999968704016428e-05, |
| "loss": 0.4366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14643388986587524, |
| "step": 445, |
| "valid_targets_mean": 1829.5, |
| "valid_targets_min": 1227 |
| }, |
| { |
| "epoch": 0.7211538461538461, |
| "grad_norm": 0.7680275744504215, |
| "learning_rate": 3.9999080285949514e-05, |
| "loss": 0.4545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28415074944496155, |
| "step": 450, |
| "valid_targets_mean": 3113.9, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 0.7291666666666666, |
| "grad_norm": 0.7819836110236925, |
| "learning_rate": 3.999815419924108e-05, |
| "loss": 0.4581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2930494546890259, |
| "step": 455, |
| "valid_targets_mean": 4082.2, |
| "valid_targets_min": 1368 |
| }, |
| { |
| "epoch": 0.7371794871794872, |
| "grad_norm": 0.7156988765066394, |
| "learning_rate": 3.999690879482614e-05, |
| "loss": 0.4458, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22275188565254211, |
| "step": 460, |
| "valid_targets_mean": 2527.4, |
| "valid_targets_min": 1210 |
| }, |
| { |
| "epoch": 0.7451923076923077, |
| "grad_norm": 0.7545107849171728, |
| "learning_rate": 3.9995344092590506e-05, |
| "loss": 0.4569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17759068310260773, |
| "step": 465, |
| "valid_targets_mean": 2044.2, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 0.7532051282051282, |
| "grad_norm": 0.85883814352422, |
| "learning_rate": 3.999346011751835e-05, |
| "loss": 0.4462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21038851141929626, |
| "step": 470, |
| "valid_targets_mean": 1835.1, |
| "valid_targets_min": 1147 |
| }, |
| { |
| "epoch": 0.7612179487179487, |
| "grad_norm": 0.8410031574243461, |
| "learning_rate": 3.999125689969176e-05, |
| "loss": 0.4415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17614567279815674, |
| "step": 475, |
| "valid_targets_mean": 1721.4, |
| "valid_targets_min": 1041 |
| }, |
| { |
| "epoch": 0.7692307692307693, |
| "grad_norm": 0.8789804427446964, |
| "learning_rate": 3.9988734474290324e-05, |
| "loss": 0.4357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21839639544487, |
| "step": 480, |
| "valid_targets_mean": 2227.9, |
| "valid_targets_min": 948 |
| }, |
| { |
| "epoch": 0.7772435897435898, |
| "grad_norm": 0.7384347806573924, |
| "learning_rate": 3.9985892881590513e-05, |
| "loss": 0.4596, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15238994359970093, |
| "step": 485, |
| "valid_targets_mean": 2098.8, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 0.7852564102564102, |
| "grad_norm": 0.8037359267266503, |
| "learning_rate": 3.9982732166965054e-05, |
| "loss": 0.4343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23122987151145935, |
| "step": 490, |
| "valid_targets_mean": 2579.4, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 0.7932692307692307, |
| "grad_norm": 0.7584123950011441, |
| "learning_rate": 3.997925238088221e-05, |
| "loss": 0.4363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2352125495672226, |
| "step": 495, |
| "valid_targets_mean": 3186.1, |
| "valid_targets_min": 948 |
| }, |
| { |
| "epoch": 0.8012820512820513, |
| "grad_norm": 0.8416323300874318, |
| "learning_rate": 3.9975453578904975e-05, |
| "loss": 0.4351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2356817126274109, |
| "step": 500, |
| "valid_targets_mean": 1878.6, |
| "valid_targets_min": 472 |
| }, |
| { |
| "epoch": 0.8092948717948718, |
| "grad_norm": 0.7515584047530944, |
| "learning_rate": 3.997133582169018e-05, |
| "loss": 0.4142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19595301151275635, |
| "step": 505, |
| "valid_targets_mean": 2488.8, |
| "valid_targets_min": 1123 |
| }, |
| { |
| "epoch": 0.8173076923076923, |
| "grad_norm": 0.6570619580965038, |
| "learning_rate": 3.996689917498754e-05, |
| "loss": 0.4321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1813373565673828, |
| "step": 510, |
| "valid_targets_mean": 2813.6, |
| "valid_targets_min": 1393 |
| }, |
| { |
| "epoch": 0.8253205128205128, |
| "grad_norm": 0.7003686384566153, |
| "learning_rate": 3.9962143709638585e-05, |
| "loss": 0.4255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18100909888744354, |
| "step": 515, |
| "valid_targets_mean": 2194.2, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 0.8333333333333334, |
| "grad_norm": 0.8533422308466821, |
| "learning_rate": 3.995706950157554e-05, |
| "loss": 0.4638, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17890852689743042, |
| "step": 520, |
| "valid_targets_mean": 1537.5, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 0.8413461538461539, |
| "grad_norm": 0.8025876920924326, |
| "learning_rate": 3.995167663182008e-05, |
| "loss": 0.415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2482287734746933, |
| "step": 525, |
| "valid_targets_mean": 2890.6, |
| "valid_targets_min": 500 |
| }, |
| { |
| "epoch": 0.8493589743589743, |
| "grad_norm": 0.817318210827593, |
| "learning_rate": 3.994596518648214e-05, |
| "loss": 0.437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18256166577339172, |
| "step": 530, |
| "valid_targets_mean": 2419.2, |
| "valid_targets_min": 1024 |
| }, |
| { |
| "epoch": 0.8573717948717948, |
| "grad_norm": 0.6865410812285857, |
| "learning_rate": 3.993993525675838e-05, |
| "loss": 0.4527, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18624117970466614, |
| "step": 535, |
| "valid_targets_mean": 2568.6, |
| "valid_targets_min": 1364 |
| }, |
| { |
| "epoch": 0.8653846153846154, |
| "grad_norm": 0.8488382487153298, |
| "learning_rate": 3.993358693893086e-05, |
| "loss": 0.4254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2426677644252777, |
| "step": 540, |
| "valid_targets_mean": 1998.9, |
| "valid_targets_min": 1078 |
| }, |
| { |
| "epoch": 0.8733974358974359, |
| "grad_norm": 0.8652381079639015, |
| "learning_rate": 3.9926920334365457e-05, |
| "loss": 0.4183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.238864004611969, |
| "step": 545, |
| "valid_targets_mean": 2650.5, |
| "valid_targets_min": 359 |
| }, |
| { |
| "epoch": 0.8814102564102564, |
| "grad_norm": 0.7839796519999491, |
| "learning_rate": 3.991993554951023e-05, |
| "loss": 0.4423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22148996591567993, |
| "step": 550, |
| "valid_targets_mean": 2023.8, |
| "valid_targets_min": 1128 |
| }, |
| { |
| "epoch": 0.8894230769230769, |
| "grad_norm": 0.7542817185661378, |
| "learning_rate": 3.991263269589376e-05, |
| "loss": 0.4718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18125128746032715, |
| "step": 555, |
| "valid_targets_mean": 2083.8, |
| "valid_targets_min": 1150 |
| }, |
| { |
| "epoch": 0.8974358974358975, |
| "grad_norm": 0.741947108861436, |
| "learning_rate": 3.990501189012332e-05, |
| "loss": 0.4307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22753050923347473, |
| "step": 560, |
| "valid_targets_mean": 3070.9, |
| "valid_targets_min": 1628 |
| }, |
| { |
| "epoch": 0.905448717948718, |
| "grad_norm": 0.8420106848026391, |
| "learning_rate": 3.989707325388305e-05, |
| "loss": 0.4149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21152499318122864, |
| "step": 565, |
| "valid_targets_mean": 2034.4, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 0.9134615384615384, |
| "grad_norm": 0.725218798545047, |
| "learning_rate": 3.9888816913932016e-05, |
| "loss": 0.427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2168159782886505, |
| "step": 570, |
| "valid_targets_mean": 2498.5, |
| "valid_targets_min": 314 |
| }, |
| { |
| "epoch": 0.9214743589743589, |
| "grad_norm": 0.7551268498727862, |
| "learning_rate": 3.988024300210215e-05, |
| "loss": 0.4173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23235228657722473, |
| "step": 575, |
| "valid_targets_mean": 3109.9, |
| "valid_targets_min": 1392 |
| }, |
| { |
| "epoch": 0.9294871794871795, |
| "grad_norm": 0.8917469963673748, |
| "learning_rate": 3.987135165529618e-05, |
| "loss": 0.4279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2358158975839615, |
| "step": 580, |
| "valid_targets_mean": 2129.4, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 0.9375, |
| "grad_norm": 0.7621556301152937, |
| "learning_rate": 3.9862143015485446e-05, |
| "loss": 0.4266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2662770450115204, |
| "step": 585, |
| "valid_targets_mean": 3289.5, |
| "valid_targets_min": 1743 |
| }, |
| { |
| "epoch": 0.9455128205128205, |
| "grad_norm": 0.700543068896193, |
| "learning_rate": 3.985261722970759e-05, |
| "loss": 0.4128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16867512464523315, |
| "step": 590, |
| "valid_targets_mean": 2218.5, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 0.9535256410256411, |
| "grad_norm": 0.815970901264772, |
| "learning_rate": 3.984277445006426e-05, |
| "loss": 0.4353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22275325655937195, |
| "step": 595, |
| "valid_targets_mean": 1926.8, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 0.9615384615384616, |
| "grad_norm": 0.8361593918244778, |
| "learning_rate": 3.9832614833718654e-05, |
| "loss": 0.4177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18687403202056885, |
| "step": 600, |
| "valid_targets_mean": 2228.1, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 0.969551282051282, |
| "grad_norm": 0.7613367304322403, |
| "learning_rate": 3.9822138542893005e-05, |
| "loss": 0.3947, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23270726203918457, |
| "step": 605, |
| "valid_targets_mean": 2532.5, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 0.9775641025641025, |
| "grad_norm": 0.8051775177601395, |
| "learning_rate": 3.9811345744866014e-05, |
| "loss": 0.4378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21936899423599243, |
| "step": 610, |
| "valid_targets_mean": 2139.5, |
| "valid_targets_min": 1092 |
| }, |
| { |
| "epoch": 0.9855769230769231, |
| "grad_norm": 0.9820300582408891, |
| "learning_rate": 3.980023661197016e-05, |
| "loss": 0.4396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2305496335029602, |
| "step": 615, |
| "valid_targets_mean": 1676.1, |
| "valid_targets_min": 1009 |
| }, |
| { |
| "epoch": 0.9935897435897436, |
| "grad_norm": 0.7251745500664333, |
| "learning_rate": 3.978881132158896e-05, |
| "loss": 0.4072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22141022980213165, |
| "step": 620, |
| "valid_targets_mean": 2821.9, |
| "valid_targets_min": 857 |
| }, |
| { |
| "epoch": 1.001602564102564, |
| "grad_norm": 0.7465984644079928, |
| "learning_rate": 3.9777070056154124e-05, |
| "loss": 0.4273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20381376147270203, |
| "step": 625, |
| "valid_targets_mean": 2395.4, |
| "valid_targets_min": 993 |
| }, |
| { |
| "epoch": 1.0096153846153846, |
| "grad_norm": 0.6090997256218228, |
| "learning_rate": 3.976501300314264e-05, |
| "loss": 0.3996, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19216665625572205, |
| "step": 630, |
| "valid_targets_mean": 3795.2, |
| "valid_targets_min": 1148 |
| }, |
| { |
| "epoch": 1.017628205128205, |
| "grad_norm": 0.9887537640031723, |
| "learning_rate": 3.9752640355073825e-05, |
| "loss": 0.3934, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19999739527702332, |
| "step": 635, |
| "valid_targets_mean": 2683.5, |
| "valid_targets_min": 1874 |
| }, |
| { |
| "epoch": 1.0256410256410255, |
| "grad_norm": 0.7712631721878844, |
| "learning_rate": 3.9739952309506175e-05, |
| "loss": 0.4294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1707819700241089, |
| "step": 640, |
| "valid_targets_mean": 2182.8, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 1.0336538461538463, |
| "grad_norm": 0.7915294225622618, |
| "learning_rate": 3.972694906903427e-05, |
| "loss": 0.4052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1669417917728424, |
| "step": 645, |
| "valid_targets_mean": 2294.2, |
| "valid_targets_min": 1128 |
| }, |
| { |
| "epoch": 1.0416666666666667, |
| "grad_norm": 0.7030915254920559, |
| "learning_rate": 3.971363084128552e-05, |
| "loss": 0.3957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2009146809577942, |
| "step": 650, |
| "valid_targets_mean": 3490.4, |
| "valid_targets_min": 260 |
| }, |
| { |
| "epoch": 1.0496794871794872, |
| "grad_norm": 0.8227935946585014, |
| "learning_rate": 3.969999783891685e-05, |
| "loss": 0.4199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2600316107273102, |
| "step": 655, |
| "valid_targets_mean": 2552.5, |
| "valid_targets_min": 1095 |
| }, |
| { |
| "epoch": 1.0576923076923077, |
| "grad_norm": 0.819150924957127, |
| "learning_rate": 3.96860502796113e-05, |
| "loss": 0.4009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22930988669395447, |
| "step": 660, |
| "valid_targets_mean": 2559.0, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 1.0657051282051282, |
| "grad_norm": 0.8189973867037402, |
| "learning_rate": 3.967178838607456e-05, |
| "loss": 0.4129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15020707249641418, |
| "step": 665, |
| "valid_targets_mean": 1769.4, |
| "valid_targets_min": 1131 |
| }, |
| { |
| "epoch": 1.0737179487179487, |
| "grad_norm": 0.6455047256028397, |
| "learning_rate": 3.965721238603139e-05, |
| "loss": 0.3861, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17924004793167114, |
| "step": 670, |
| "valid_targets_mean": 2953.0, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 1.0817307692307692, |
| "grad_norm": 0.9974279650169392, |
| "learning_rate": 3.964232251222203e-05, |
| "loss": 0.4186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20407584309577942, |
| "step": 675, |
| "valid_targets_mean": 2472.5, |
| "valid_targets_min": 1522 |
| }, |
| { |
| "epoch": 1.0897435897435896, |
| "grad_norm": 0.6570532885048896, |
| "learning_rate": 3.962711900239844e-05, |
| "loss": 0.3995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2124699354171753, |
| "step": 680, |
| "valid_targets_mean": 3709.4, |
| "valid_targets_min": 1239 |
| }, |
| { |
| "epoch": 1.0977564102564104, |
| "grad_norm": 0.7966806502459381, |
| "learning_rate": 3.961160209932051e-05, |
| "loss": 0.3707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16343654692173004, |
| "step": 685, |
| "valid_targets_mean": 1613.4, |
| "valid_targets_min": 435 |
| }, |
| { |
| "epoch": 1.1057692307692308, |
| "grad_norm": 0.8141799386192287, |
| "learning_rate": 3.95957720507522e-05, |
| "loss": 0.3784, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21225258708000183, |
| "step": 690, |
| "valid_targets_mean": 3180.0, |
| "valid_targets_min": 475 |
| }, |
| { |
| "epoch": 1.1137820512820513, |
| "grad_norm": 0.7663834307163272, |
| "learning_rate": 3.957962910945759e-05, |
| "loss": 0.3945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1471199244260788, |
| "step": 695, |
| "valid_targets_mean": 2677.8, |
| "valid_targets_min": 902 |
| }, |
| { |
| "epoch": 1.1217948717948718, |
| "grad_norm": 0.735440023679953, |
| "learning_rate": 3.9563173533196805e-05, |
| "loss": 0.4039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1359565705060959, |
| "step": 700, |
| "valid_targets_mean": 1893.1, |
| "valid_targets_min": 822 |
| }, |
| { |
| "epoch": 1.1298076923076923, |
| "grad_norm": 0.7634365465235168, |
| "learning_rate": 3.954640558472195e-05, |
| "loss": 0.4141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1666882336139679, |
| "step": 705, |
| "valid_targets_mean": 2108.0, |
| "valid_targets_min": 1599 |
| }, |
| { |
| "epoch": 1.1378205128205128, |
| "grad_norm": 0.7962658670444661, |
| "learning_rate": 3.952932553177287e-05, |
| "loss": 0.377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22097454965114594, |
| "step": 710, |
| "valid_targets_mean": 2968.0, |
| "valid_targets_min": 1200 |
| }, |
| { |
| "epoch": 1.1458333333333333, |
| "grad_norm": 0.9117502451013554, |
| "learning_rate": 3.95119336470729e-05, |
| "loss": 0.4146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22754886746406555, |
| "step": 715, |
| "valid_targets_mean": 1757.2, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 1.1538461538461537, |
| "grad_norm": 0.8083486713374696, |
| "learning_rate": 3.949423020832451e-05, |
| "loss": 0.414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17627468705177307, |
| "step": 720, |
| "valid_targets_mean": 1481.2, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 1.1618589743589745, |
| "grad_norm": 0.7333098847473878, |
| "learning_rate": 3.947621549820485e-05, |
| "loss": 0.3805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18278644979000092, |
| "step": 725, |
| "valid_targets_mean": 2522.1, |
| "valid_targets_min": 1157 |
| }, |
| { |
| "epoch": 1.169871794871795, |
| "grad_norm": 0.7401713642953307, |
| "learning_rate": 3.945788980436129e-05, |
| "loss": 0.389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20542725920677185, |
| "step": 730, |
| "valid_targets_mean": 2958.4, |
| "valid_targets_min": 1348 |
| }, |
| { |
| "epoch": 1.1778846153846154, |
| "grad_norm": 0.8633291622977045, |
| "learning_rate": 3.943925341940673e-05, |
| "loss": 0.4114, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16674403846263885, |
| "step": 735, |
| "valid_targets_mean": 1984.1, |
| "valid_targets_min": 315 |
| }, |
| { |
| "epoch": 1.185897435897436, |
| "grad_norm": 0.6862290281154118, |
| "learning_rate": 3.942030664091503e-05, |
| "loss": 0.3787, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1515948474407196, |
| "step": 740, |
| "valid_targets_mean": 2081.1, |
| "valid_targets_min": 1404 |
| }, |
| { |
| "epoch": 1.1939102564102564, |
| "grad_norm": 0.7517010622113833, |
| "learning_rate": 3.9401049771416214e-05, |
| "loss": 0.397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20460815727710724, |
| "step": 745, |
| "valid_targets_mean": 2555.0, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 1.2019230769230769, |
| "grad_norm": 0.7701867921629503, |
| "learning_rate": 3.938148311839162e-05, |
| "loss": 0.4257, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24021926522254944, |
| "step": 750, |
| "valid_targets_mean": 2868.4, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 1.2099358974358974, |
| "grad_norm": 0.8053323182482374, |
| "learning_rate": 3.9361606994269014e-05, |
| "loss": 0.407, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1931108832359314, |
| "step": 755, |
| "valid_targets_mean": 2227.1, |
| "valid_targets_min": 1148 |
| }, |
| { |
| "epoch": 1.217948717948718, |
| "grad_norm": 0.6874024005644546, |
| "learning_rate": 3.934142171641763e-05, |
| "loss": 0.3773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21617969870567322, |
| "step": 760, |
| "valid_targets_mean": 3691.2, |
| "valid_targets_min": 1327 |
| }, |
| { |
| "epoch": 1.2259615384615385, |
| "grad_norm": 0.803368730894559, |
| "learning_rate": 3.9320927607143003e-05, |
| "loss": 0.3977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23498323559761047, |
| "step": 765, |
| "valid_targets_mean": 2918.5, |
| "valid_targets_min": 1543 |
| }, |
| { |
| "epoch": 1.233974358974359, |
| "grad_norm": 0.6761209321682878, |
| "learning_rate": 3.9300124993681976e-05, |
| "loss": 0.4127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20131105184555054, |
| "step": 770, |
| "valid_targets_mean": 3544.6, |
| "valid_targets_min": 1438 |
| }, |
| { |
| "epoch": 1.2419871794871795, |
| "grad_norm": 0.8140029717837052, |
| "learning_rate": 3.9279014208197317e-05, |
| "loss": 0.3932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19266082346439362, |
| "step": 775, |
| "valid_targets_mean": 2522.5, |
| "valid_targets_min": 1147 |
| }, |
| { |
| "epoch": 1.25, |
| "grad_norm": 0.7819556286960125, |
| "learning_rate": 3.925759558777252e-05, |
| "loss": 0.3876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2085326910018921, |
| "step": 780, |
| "valid_targets_mean": 2123.0, |
| "valid_targets_min": 984 |
| }, |
| { |
| "epoch": 1.2580128205128205, |
| "grad_norm": 0.7378325645590994, |
| "learning_rate": 3.923586947440639e-05, |
| "loss": 0.4051, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24526703357696533, |
| "step": 785, |
| "valid_targets_mean": 3333.6, |
| "valid_targets_min": 1216 |
| }, |
| { |
| "epoch": 1.266025641025641, |
| "grad_norm": 0.7617824513828749, |
| "learning_rate": 3.921383621500758e-05, |
| "loss": 0.3929, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25414544343948364, |
| "step": 790, |
| "valid_targets_mean": 3125.8, |
| "valid_targets_min": 1466 |
| }, |
| { |
| "epoch": 1.2740384615384617, |
| "grad_norm": 0.827506556223389, |
| "learning_rate": 3.919149616138906e-05, |
| "loss": 0.4056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1815040558576584, |
| "step": 795, |
| "valid_targets_mean": 2285.4, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 1.282051282051282, |
| "grad_norm": 0.8523188451016964, |
| "learning_rate": 3.916884967026246e-05, |
| "loss": 0.3955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19575875997543335, |
| "step": 800, |
| "valid_targets_mean": 2627.0, |
| "valid_targets_min": 1235 |
| }, |
| { |
| "epoch": 1.2900641025641026, |
| "grad_norm": 0.8602226407777478, |
| "learning_rate": 3.914589710323245e-05, |
| "loss": 0.3981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22027531266212463, |
| "step": 805, |
| "valid_targets_mean": 2483.4, |
| "valid_targets_min": 1320 |
| }, |
| { |
| "epoch": 1.2980769230769231, |
| "grad_norm": 0.7192846478140936, |
| "learning_rate": 3.912263882679091e-05, |
| "loss": 0.3709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12481571733951569, |
| "step": 810, |
| "valid_targets_mean": 1910.9, |
| "valid_targets_min": 737 |
| }, |
| { |
| "epoch": 1.3060897435897436, |
| "grad_norm": 0.7463244398063339, |
| "learning_rate": 3.9099075212311076e-05, |
| "loss": 0.3779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19425347447395325, |
| "step": 815, |
| "valid_targets_mean": 2349.6, |
| "valid_targets_min": 925 |
| }, |
| { |
| "epoch": 1.314102564102564, |
| "grad_norm": 0.7798070432766532, |
| "learning_rate": 3.9075206636041646e-05, |
| "loss": 0.3889, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16809885203838348, |
| "step": 820, |
| "valid_targets_mean": 2378.0, |
| "valid_targets_min": 1186 |
| }, |
| { |
| "epoch": 1.3221153846153846, |
| "grad_norm": 0.7353506089603916, |
| "learning_rate": 3.905103347910075e-05, |
| "loss": 0.3846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14414098858833313, |
| "step": 825, |
| "valid_targets_mean": 1964.6, |
| "valid_targets_min": 984 |
| }, |
| { |
| "epoch": 1.330128205128205, |
| "grad_norm": 0.7469626524872656, |
| "learning_rate": 3.902655612746985e-05, |
| "loss": 0.3986, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20464842021465302, |
| "step": 830, |
| "valid_targets_mean": 2803.6, |
| "valid_targets_min": 1178 |
| }, |
| { |
| "epoch": 1.3381410256410255, |
| "grad_norm": 0.8086127489461551, |
| "learning_rate": 3.900177497198761e-05, |
| "loss": 0.4059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2263430953025818, |
| "step": 835, |
| "valid_targets_mean": 2755.0, |
| "valid_targets_min": 1021 |
| }, |
| { |
| "epoch": 1.3461538461538463, |
| "grad_norm": 0.6460008366891428, |
| "learning_rate": 3.8976690408343635e-05, |
| "loss": 0.3958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16660919785499573, |
| "step": 840, |
| "valid_targets_mean": 3076.5, |
| "valid_targets_min": 1058 |
| }, |
| { |
| "epoch": 1.3541666666666667, |
| "grad_norm": 0.8460991987261154, |
| "learning_rate": 3.8951302837072165e-05, |
| "loss": 0.408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2518458068370819, |
| "step": 845, |
| "valid_targets_mean": 2448.0, |
| "valid_targets_min": 1097 |
| }, |
| { |
| "epoch": 1.3621794871794872, |
| "grad_norm": 0.821233295005827, |
| "learning_rate": 3.892561266354566e-05, |
| "loss": 0.4159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18111786246299744, |
| "step": 850, |
| "valid_targets_mean": 2694.5, |
| "valid_targets_min": 1012 |
| }, |
| { |
| "epoch": 1.3701923076923077, |
| "grad_norm": 0.7296441292083241, |
| "learning_rate": 3.889962029796833e-05, |
| "loss": 0.3896, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17838101089000702, |
| "step": 855, |
| "valid_targets_mean": 2373.2, |
| "valid_targets_min": 1162 |
| }, |
| { |
| "epoch": 1.3782051282051282, |
| "grad_norm": 0.7026610730862972, |
| "learning_rate": 3.887332615536962e-05, |
| "loss": 0.4075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21002928912639618, |
| "step": 860, |
| "valid_targets_mean": 3131.4, |
| "valid_targets_min": 1406 |
| }, |
| { |
| "epoch": 1.3862179487179487, |
| "grad_norm": 1.0977711950424043, |
| "learning_rate": 3.8846730655597535e-05, |
| "loss": 0.4108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2301381528377533, |
| "step": 865, |
| "valid_targets_mean": 2209.1, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 1.3942307692307692, |
| "grad_norm": 1.0677689487035835, |
| "learning_rate": 3.881983422331198e-05, |
| "loss": 0.405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22443720698356628, |
| "step": 870, |
| "valid_targets_mean": 1953.8, |
| "valid_targets_min": 1342 |
| }, |
| { |
| "epoch": 1.4022435897435899, |
| "grad_norm": 0.7984589627995452, |
| "learning_rate": 3.879263728797792e-05, |
| "loss": 0.3901, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19039490818977356, |
| "step": 875, |
| "valid_targets_mean": 2250.5, |
| "valid_targets_min": 984 |
| }, |
| { |
| "epoch": 1.4102564102564101, |
| "grad_norm": 0.7610997708344249, |
| "learning_rate": 3.876514028385861e-05, |
| "loss": 0.3793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18667712807655334, |
| "step": 880, |
| "valid_targets_mean": 2457.6, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 1.4182692307692308, |
| "grad_norm": 0.7660744650444555, |
| "learning_rate": 3.873734365000857e-05, |
| "loss": 0.3793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19710713624954224, |
| "step": 885, |
| "valid_targets_mean": 2400.2, |
| "valid_targets_min": 1439 |
| }, |
| { |
| "epoch": 1.4262820512820513, |
| "grad_norm": 0.9027867349808698, |
| "learning_rate": 3.870924783026663e-05, |
| "loss": 0.4044, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25323033332824707, |
| "step": 890, |
| "valid_targets_mean": 2769.5, |
| "valid_targets_min": 1285 |
| }, |
| { |
| "epoch": 1.4342948717948718, |
| "grad_norm": 0.6655726580543196, |
| "learning_rate": 3.8680853273248826e-05, |
| "loss": 0.4161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24514815211296082, |
| "step": 895, |
| "valid_targets_mean": 3499.0, |
| "valid_targets_min": 994 |
| }, |
| { |
| "epoch": 1.4423076923076923, |
| "grad_norm": 0.7581770160173827, |
| "learning_rate": 3.865216043234126e-05, |
| "loss": 0.3768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21933013200759888, |
| "step": 900, |
| "valid_targets_mean": 3721.2, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 1.4503205128205128, |
| "grad_norm": 0.7738042590711245, |
| "learning_rate": 3.862316976569281e-05, |
| "loss": 0.4284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30224043130874634, |
| "step": 905, |
| "valid_targets_mean": 3316.0, |
| "valid_targets_min": 1100 |
| }, |
| { |
| "epoch": 1.4583333333333333, |
| "grad_norm": 0.6155745043657496, |
| "learning_rate": 3.859388173620785e-05, |
| "loss": 0.3978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2257455587387085, |
| "step": 910, |
| "valid_targets_mean": 4074.5, |
| "valid_targets_min": 1359 |
| }, |
| { |
| "epoch": 1.4663461538461537, |
| "grad_norm": 0.6817808713104984, |
| "learning_rate": 3.8564296811538874e-05, |
| "loss": 0.4026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2565431594848633, |
| "step": 915, |
| "valid_targets_mean": 3401.1, |
| "valid_targets_min": 1271 |
| }, |
| { |
| "epoch": 1.4743589743589745, |
| "grad_norm": 0.7173177986914446, |
| "learning_rate": 3.853441546407898e-05, |
| "loss": 0.3924, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24881017208099365, |
| "step": 920, |
| "valid_targets_mean": 3510.5, |
| "valid_targets_min": 994 |
| }, |
| { |
| "epoch": 1.482371794871795, |
| "grad_norm": 0.7945715980200994, |
| "learning_rate": 3.850423817095438e-05, |
| "loss": 0.3963, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15524527430534363, |
| "step": 925, |
| "valid_targets_mean": 1850.6, |
| "valid_targets_min": 1284 |
| }, |
| { |
| "epoch": 1.4903846153846154, |
| "grad_norm": 0.7598949103076834, |
| "learning_rate": 3.847376541401674e-05, |
| "loss": 0.3804, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16828379034996033, |
| "step": 930, |
| "valid_targets_mean": 1823.9, |
| "valid_targets_min": 1016 |
| }, |
| { |
| "epoch": 1.498397435897436, |
| "grad_norm": 0.7977097435862016, |
| "learning_rate": 3.844299767983551e-05, |
| "loss": 0.3995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20539097487926483, |
| "step": 935, |
| "valid_targets_mean": 2585.9, |
| "valid_targets_min": 447 |
| }, |
| { |
| "epoch": 1.5064102564102564, |
| "grad_norm": 0.7796806378947536, |
| "learning_rate": 3.841193545969015e-05, |
| "loss": 0.372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21690428256988525, |
| "step": 940, |
| "valid_targets_mean": 3070.1, |
| "valid_targets_min": 1298 |
| }, |
| { |
| "epoch": 1.5144230769230769, |
| "grad_norm": 0.795763049986929, |
| "learning_rate": 3.8380579249562265e-05, |
| "loss": 0.3871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21313318610191345, |
| "step": 945, |
| "valid_targets_mean": 2357.9, |
| "valid_targets_min": 1087 |
| }, |
| { |
| "epoch": 1.5224358974358974, |
| "grad_norm": 0.7856865708709738, |
| "learning_rate": 3.8348929550127734e-05, |
| "loss": 0.3934, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21079853177070618, |
| "step": 950, |
| "valid_targets_mean": 2205.2, |
| "valid_targets_min": 1438 |
| }, |
| { |
| "epoch": 1.530448717948718, |
| "grad_norm": 0.7102354357674125, |
| "learning_rate": 3.831698686674866e-05, |
| "loss": 0.3864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1579192876815796, |
| "step": 955, |
| "valid_targets_mean": 2220.9, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 1.5384615384615383, |
| "grad_norm": 0.7397064308922544, |
| "learning_rate": 3.828475170946534e-05, |
| "loss": 0.4017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21521735191345215, |
| "step": 960, |
| "valid_targets_mean": 2871.2, |
| "valid_targets_min": 1032 |
| }, |
| { |
| "epoch": 1.546474358974359, |
| "grad_norm": 0.9957473984975943, |
| "learning_rate": 3.8252224592988087e-05, |
| "loss": 0.4178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19509410858154297, |
| "step": 965, |
| "valid_targets_mean": 1405.8, |
| "valid_targets_min": 972 |
| }, |
| { |
| "epoch": 1.5544871794871795, |
| "grad_norm": 0.804754542638096, |
| "learning_rate": 3.821940603668906e-05, |
| "loss": 0.3824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16173695027828217, |
| "step": 970, |
| "valid_targets_mean": 1865.6, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 1.5625, |
| "grad_norm": 0.7298059783039583, |
| "learning_rate": 3.8186296564593924e-05, |
| "loss": 0.3954, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22694705426692963, |
| "step": 975, |
| "valid_targets_mean": 3259.4, |
| "valid_targets_min": 1155 |
| }, |
| { |
| "epoch": 1.5705128205128205, |
| "grad_norm": 0.7890833541271126, |
| "learning_rate": 3.815289670537351e-05, |
| "loss": 0.372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19712330400943756, |
| "step": 980, |
| "valid_targets_mean": 2654.9, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 1.578525641025641, |
| "grad_norm": 0.7721134490148664, |
| "learning_rate": 3.811920699233535e-05, |
| "loss": 0.3662, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16013117134571075, |
| "step": 985, |
| "valid_targets_mean": 2404.1, |
| "valid_targets_min": 1045 |
| }, |
| { |
| "epoch": 1.5865384615384617, |
| "grad_norm": 0.7771772844437951, |
| "learning_rate": 3.8085227963415186e-05, |
| "loss": 0.3862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18366935849189758, |
| "step": 990, |
| "valid_targets_mean": 2047.1, |
| "valid_targets_min": 1234 |
| }, |
| { |
| "epoch": 1.594551282051282, |
| "grad_norm": 0.7263474584644822, |
| "learning_rate": 3.805096016116838e-05, |
| "loss": 0.4002, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23366929590702057, |
| "step": 995, |
| "valid_targets_mean": 3505.8, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 1.6025641025641026, |
| "grad_norm": 0.7734401430489013, |
| "learning_rate": 3.801640413276121e-05, |
| "loss": 0.3876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18875086307525635, |
| "step": 1000, |
| "valid_targets_mean": 2440.6, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 1.6105769230769231, |
| "grad_norm": 1.0978052948369825, |
| "learning_rate": 3.7981560429962204e-05, |
| "loss": 0.3848, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19252219796180725, |
| "step": 1005, |
| "valid_targets_mean": 2162.2, |
| "valid_targets_min": 1507 |
| }, |
| { |
| "epoch": 1.6185897435897436, |
| "grad_norm": 0.8249891646453199, |
| "learning_rate": 3.7946429609133274e-05, |
| "loss": 0.3908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2153560221195221, |
| "step": 1010, |
| "valid_targets_mean": 1905.8, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 1.626602564102564, |
| "grad_norm": 0.7433162943053611, |
| "learning_rate": 3.791101223122084e-05, |
| "loss": 0.3959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1687787026166916, |
| "step": 1015, |
| "valid_targets_mean": 1962.5, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 1.6346153846153846, |
| "grad_norm": 0.7062532227721724, |
| "learning_rate": 3.787530886174688e-05, |
| "loss": 0.3808, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14789080619812012, |
| "step": 1020, |
| "valid_targets_mean": 2009.1, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 1.6426282051282053, |
| "grad_norm": 0.7284286934878477, |
| "learning_rate": 3.783932007079992e-05, |
| "loss": 0.3724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1761750727891922, |
| "step": 1025, |
| "valid_targets_mean": 2278.1, |
| "valid_targets_min": 1055 |
| }, |
| { |
| "epoch": 1.6506410256410255, |
| "grad_norm": 0.6724344397247881, |
| "learning_rate": 3.7803046433025905e-05, |
| "loss": 0.3876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19518470764160156, |
| "step": 1030, |
| "valid_targets_mean": 2953.0, |
| "valid_targets_min": 1636 |
| }, |
| { |
| "epoch": 1.6586538461538463, |
| "grad_norm": 0.7306814326324378, |
| "learning_rate": 3.7766488527619024e-05, |
| "loss": 0.3828, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2070809304714203, |
| "step": 1035, |
| "valid_targets_mean": 2797.0, |
| "valid_targets_min": 956 |
| }, |
| { |
| "epoch": 1.6666666666666665, |
| "grad_norm": 0.6966329661882152, |
| "learning_rate": 3.772964693831247e-05, |
| "loss": 0.3898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1665840744972229, |
| "step": 1040, |
| "valid_targets_mean": 2359.0, |
| "valid_targets_min": 1252 |
| }, |
| { |
| "epoch": 1.6746794871794872, |
| "grad_norm": 0.8183363093585437, |
| "learning_rate": 3.7692522253369136e-05, |
| "loss": 0.3856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20456507802009583, |
| "step": 1045, |
| "valid_targets_mean": 2110.2, |
| "valid_targets_min": 1108 |
| }, |
| { |
| "epoch": 1.6826923076923077, |
| "grad_norm": 0.7326066646720534, |
| "learning_rate": 3.7655115065572194e-05, |
| "loss": 0.3792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1852574348449707, |
| "step": 1050, |
| "valid_targets_mean": 2510.5, |
| "valid_targets_min": 1361 |
| }, |
| { |
| "epoch": 1.6907051282051282, |
| "grad_norm": 0.8179852635285826, |
| "learning_rate": 3.7617425972215626e-05, |
| "loss": 0.3651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18398068845272064, |
| "step": 1055, |
| "valid_targets_mean": 2575.1, |
| "valid_targets_min": 1176 |
| }, |
| { |
| "epoch": 1.6987179487179487, |
| "grad_norm": 0.7594138822240342, |
| "learning_rate": 3.757945557509472e-05, |
| "loss": 0.3976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2564973831176758, |
| "step": 1060, |
| "valid_targets_mean": 3293.5, |
| "valid_targets_min": 1092 |
| }, |
| { |
| "epoch": 1.7067307692307692, |
| "grad_norm": 0.7744891981574005, |
| "learning_rate": 3.7541204480496444e-05, |
| "loss": 0.436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2867600917816162, |
| "step": 1065, |
| "valid_targets_mean": 2808.5, |
| "valid_targets_min": 1224 |
| }, |
| { |
| "epoch": 1.7147435897435899, |
| "grad_norm": 0.6569368962525489, |
| "learning_rate": 3.7502673299189745e-05, |
| "loss": 0.3927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20591554045677185, |
| "step": 1070, |
| "valid_targets_mean": 3459.0, |
| "valid_targets_min": 1088 |
| }, |
| { |
| "epoch": 1.7227564102564101, |
| "grad_norm": 0.731504718928724, |
| "learning_rate": 3.746386264641583e-05, |
| "loss": 0.3947, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18665257096290588, |
| "step": 1075, |
| "valid_targets_mean": 2337.9, |
| "valid_targets_min": 885 |
| }, |
| { |
| "epoch": 1.7307692307692308, |
| "grad_norm": 0.7677480742647473, |
| "learning_rate": 3.7424773141878324e-05, |
| "loss": 0.4064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18656907975673676, |
| "step": 1080, |
| "valid_targets_mean": 2099.4, |
| "valid_targets_min": 1228 |
| }, |
| { |
| "epoch": 1.7387820512820513, |
| "grad_norm": 0.7989982560887274, |
| "learning_rate": 3.738540540973338e-05, |
| "loss": 0.3992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1916476935148239, |
| "step": 1085, |
| "valid_targets_mean": 2387.1, |
| "valid_targets_min": 1355 |
| }, |
| { |
| "epoch": 1.7467948717948718, |
| "grad_norm": 0.7713226972032743, |
| "learning_rate": 3.7345760078579695e-05, |
| "loss": 0.382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1601388305425644, |
| "step": 1090, |
| "valid_targets_mean": 1695.2, |
| "valid_targets_min": 269 |
| }, |
| { |
| "epoch": 1.7548076923076923, |
| "grad_norm": 0.7153583276085919, |
| "learning_rate": 3.730583778144852e-05, |
| "loss": 0.3881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24518054723739624, |
| "step": 1095, |
| "valid_targets_mean": 3535.8, |
| "valid_targets_min": 988 |
| }, |
| { |
| "epoch": 1.7628205128205128, |
| "grad_norm": 0.7238652347725764, |
| "learning_rate": 3.7265639155793494e-05, |
| "loss": 0.3776, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15082888305187225, |
| "step": 1100, |
| "valid_targets_mean": 2375.6, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 1.7708333333333335, |
| "grad_norm": 0.7597119444096863, |
| "learning_rate": 3.7225164843480503e-05, |
| "loss": 0.4042, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18812818825244904, |
| "step": 1105, |
| "valid_targets_mean": 2196.5, |
| "valid_targets_min": 1162 |
| }, |
| { |
| "epoch": 1.7788461538461537, |
| "grad_norm": 0.8964624092632014, |
| "learning_rate": 3.7184415490777426e-05, |
| "loss": 0.372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.207992285490036, |
| "step": 1110, |
| "valid_targets_mean": 2188.0, |
| "valid_targets_min": 1124 |
| }, |
| { |
| "epoch": 1.7868589743589745, |
| "grad_norm": 0.6948514781192213, |
| "learning_rate": 3.714339174834379e-05, |
| "loss": 0.3726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18899385631084442, |
| "step": 1115, |
| "valid_targets_mean": 2110.8, |
| "valid_targets_min": 1174 |
| }, |
| { |
| "epoch": 1.7948717948717947, |
| "grad_norm": 0.7001908243752163, |
| "learning_rate": 3.710209427122044e-05, |
| "loss": 0.4312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19637015461921692, |
| "step": 1120, |
| "valid_targets_mean": 2747.2, |
| "valid_targets_min": 1109 |
| }, |
| { |
| "epoch": 1.8028846153846154, |
| "grad_norm": 0.6314682487629872, |
| "learning_rate": 3.7060523718819e-05, |
| "loss": 0.3815, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19258755445480347, |
| "step": 1125, |
| "valid_targets_mean": 3663.5, |
| "valid_targets_min": 1600 |
| }, |
| { |
| "epoch": 1.810897435897436, |
| "grad_norm": 0.8124805310376293, |
| "learning_rate": 3.701868075491139e-05, |
| "loss": 0.4002, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18830403685569763, |
| "step": 1130, |
| "valid_targets_mean": 2149.4, |
| "valid_targets_min": 1127 |
| }, |
| { |
| "epoch": 1.8189102564102564, |
| "grad_norm": 0.7453037484756837, |
| "learning_rate": 3.697656604761926e-05, |
| "loss": 0.3497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17239141464233398, |
| "step": 1135, |
| "valid_targets_mean": 2228.2, |
| "valid_targets_min": 1263 |
| }, |
| { |
| "epoch": 1.8269230769230769, |
| "grad_norm": 0.7597851188699107, |
| "learning_rate": 3.693418026940325e-05, |
| "loss": 0.3694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1435607373714447, |
| "step": 1140, |
| "valid_targets_mean": 1410.1, |
| "valid_targets_min": 446 |
| }, |
| { |
| "epoch": 1.8349358974358974, |
| "grad_norm": 0.6747261559800963, |
| "learning_rate": 3.689152409705229e-05, |
| "loss": 0.3834, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1624498814344406, |
| "step": 1145, |
| "valid_targets_mean": 2713.1, |
| "valid_targets_min": 1090 |
| }, |
| { |
| "epoch": 1.842948717948718, |
| "grad_norm": 0.7735869483528329, |
| "learning_rate": 3.6848598211672794e-05, |
| "loss": 0.3872, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2225751131772995, |
| "step": 1150, |
| "valid_targets_mean": 2196.0, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 1.8509615384615383, |
| "grad_norm": 0.8104590197423858, |
| "learning_rate": 3.6805403298677797e-05, |
| "loss": 0.4101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1646331250667572, |
| "step": 1155, |
| "valid_targets_mean": 1976.8, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 1.858974358974359, |
| "grad_norm": 0.6609774232707526, |
| "learning_rate": 3.6761940047775966e-05, |
| "loss": 0.3791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1530018448829651, |
| "step": 1160, |
| "valid_targets_mean": 2702.2, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 1.8669871794871795, |
| "grad_norm": 0.8716057992411466, |
| "learning_rate": 3.671820915296063e-05, |
| "loss": 0.3935, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22766408324241638, |
| "step": 1165, |
| "valid_targets_mean": 2449.6, |
| "valid_targets_min": 1228 |
| }, |
| { |
| "epoch": 1.875, |
| "grad_norm": 0.8210753368155098, |
| "learning_rate": 3.667421131249869e-05, |
| "loss": 0.4034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19551564753055573, |
| "step": 1170, |
| "valid_targets_mean": 1927.8, |
| "valid_targets_min": 1021 |
| }, |
| { |
| "epoch": 1.8830128205128205, |
| "grad_norm": 0.8627779649045554, |
| "learning_rate": 3.662994722891946e-05, |
| "loss": 0.3899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18560561537742615, |
| "step": 1175, |
| "valid_targets_mean": 1790.8, |
| "valid_targets_min": 1279 |
| }, |
| { |
| "epoch": 1.891025641025641, |
| "grad_norm": 0.6827904826786426, |
| "learning_rate": 3.658541760900344e-05, |
| "loss": 0.3562, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19983141124248505, |
| "step": 1180, |
| "valid_targets_mean": 2813.4, |
| "valid_targets_min": 1533 |
| }, |
| { |
| "epoch": 1.8990384615384617, |
| "grad_norm": 0.6841910626255084, |
| "learning_rate": 3.654062316377106e-05, |
| "loss": 0.3845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17266666889190674, |
| "step": 1185, |
| "valid_targets_mean": 2745.6, |
| "valid_targets_min": 303 |
| }, |
| { |
| "epoch": 1.907051282051282, |
| "grad_norm": 0.8254813972995194, |
| "learning_rate": 3.649556460847131e-05, |
| "loss": 0.3928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15996776521205902, |
| "step": 1190, |
| "valid_targets_mean": 1754.0, |
| "valid_targets_min": 894 |
| }, |
| { |
| "epoch": 1.9150641025641026, |
| "grad_norm": 0.7291405879871701, |
| "learning_rate": 3.6450242662570314e-05, |
| "loss": 0.387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.192326158285141, |
| "step": 1195, |
| "valid_targets_mean": 2522.0, |
| "valid_targets_min": 1364 |
| }, |
| { |
| "epoch": 1.9230769230769231, |
| "grad_norm": 0.6684747033924835, |
| "learning_rate": 3.6404658049739854e-05, |
| "loss": 0.3701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12845301628112793, |
| "step": 1200, |
| "valid_targets_mean": 2355.8, |
| "valid_targets_min": 1434 |
| }, |
| { |
| "epoch": 1.9310897435897436, |
| "grad_norm": 0.7501902469595525, |
| "learning_rate": 3.63588114978458e-05, |
| "loss": 0.3906, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20027633011341095, |
| "step": 1205, |
| "valid_targets_mean": 2796.9, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 1.939102564102564, |
| "grad_norm": 0.8787778878398708, |
| "learning_rate": 3.6312703738936504e-05, |
| "loss": 0.3808, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17389872670173645, |
| "step": 1210, |
| "valid_targets_mean": 1681.4, |
| "valid_targets_min": 1167 |
| }, |
| { |
| "epoch": 1.9471153846153846, |
| "grad_norm": 0.7032222031644281, |
| "learning_rate": 3.626633550923111e-05, |
| "loss": 0.3797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14461690187454224, |
| "step": 1215, |
| "valid_targets_mean": 1986.5, |
| "valid_targets_min": 977 |
| }, |
| { |
| "epoch": 1.9551282051282053, |
| "grad_norm": 0.7669477034061776, |
| "learning_rate": 3.621970754910778e-05, |
| "loss": 0.3969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.158382385969162, |
| "step": 1220, |
| "valid_targets_mean": 2008.5, |
| "valid_targets_min": 1022 |
| }, |
| { |
| "epoch": 1.9631410256410255, |
| "grad_norm": 0.7419304317666434, |
| "learning_rate": 3.6172820603091885e-05, |
| "loss": 0.3972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2039494663476944, |
| "step": 1225, |
| "valid_targets_mean": 2516.6, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 1.9711538461538463, |
| "grad_norm": 0.6889071670417813, |
| "learning_rate": 3.612567541984413e-05, |
| "loss": 0.3967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14030852913856506, |
| "step": 1230, |
| "valid_targets_mean": 1680.6, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 1.9791666666666665, |
| "grad_norm": 0.7401744379682911, |
| "learning_rate": 3.6078272752148574e-05, |
| "loss": 0.3848, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20165783166885376, |
| "step": 1235, |
| "valid_targets_mean": 2676.4, |
| "valid_targets_min": 1282 |
| }, |
| { |
| "epoch": 1.9871794871794872, |
| "grad_norm": 0.7127292270502633, |
| "learning_rate": 3.6030613356900635e-05, |
| "loss": 0.3778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2067841738462448, |
| "step": 1240, |
| "valid_targets_mean": 2912.0, |
| "valid_targets_min": 1089 |
| }, |
| { |
| "epoch": 1.9951923076923077, |
| "grad_norm": 0.6696204116089755, |
| "learning_rate": 3.598269799509498e-05, |
| "loss": 0.3925, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.133599191904068, |
| "step": 1245, |
| "valid_targets_mean": 2193.4, |
| "valid_targets_min": 830 |
| }, |
| { |
| "epoch": 2.003205128205128, |
| "grad_norm": 0.7309611863815216, |
| "learning_rate": 3.5934527431813385e-05, |
| "loss": 0.3699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1557263731956482, |
| "step": 1250, |
| "valid_targets_mean": 2589.4, |
| "valid_targets_min": 1535 |
| }, |
| { |
| "epoch": 2.011217948717949, |
| "grad_norm": 0.7184249082256497, |
| "learning_rate": 3.5886102436212536e-05, |
| "loss": 0.3362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2098970264196396, |
| "step": 1255, |
| "valid_targets_mean": 3387.4, |
| "valid_targets_min": 1266 |
| }, |
| { |
| "epoch": 2.019230769230769, |
| "grad_norm": 0.818316424675812, |
| "learning_rate": 3.583742378151171e-05, |
| "loss": 0.3529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20294536650180817, |
| "step": 1260, |
| "valid_targets_mean": 2087.0, |
| "valid_targets_min": 1378 |
| }, |
| { |
| "epoch": 2.02724358974359, |
| "grad_norm": 0.8278234776817402, |
| "learning_rate": 3.5788492244980464e-05, |
| "loss": 0.3806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12976673245429993, |
| "step": 1265, |
| "valid_targets_mean": 1713.8, |
| "valid_targets_min": 1291 |
| }, |
| { |
| "epoch": 2.03525641025641, |
| "grad_norm": 0.6959655858741635, |
| "learning_rate": 3.573930860792621e-05, |
| "loss": 0.3472, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15088346600532532, |
| "step": 1270, |
| "valid_targets_mean": 2264.1, |
| "valid_targets_min": 833 |
| }, |
| { |
| "epoch": 2.043269230769231, |
| "grad_norm": 0.7359135223433384, |
| "learning_rate": 3.568987365568173e-05, |
| "loss": 0.3635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21914812922477722, |
| "step": 1275, |
| "valid_targets_mean": 2839.2, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 2.051282051282051, |
| "grad_norm": 0.7969244476786354, |
| "learning_rate": 3.564018817759266e-05, |
| "loss": 0.3536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17785009741783142, |
| "step": 1280, |
| "valid_targets_mean": 2738.1, |
| "valid_targets_min": 1117 |
| }, |
| { |
| "epoch": 2.059294871794872, |
| "grad_norm": 0.7000366520475035, |
| "learning_rate": 3.559025296700484e-05, |
| "loss": 0.3509, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1585804522037506, |
| "step": 1285, |
| "valid_targets_mean": 2884.6, |
| "valid_targets_min": 1399 |
| }, |
| { |
| "epoch": 2.0673076923076925, |
| "grad_norm": 0.8302999135088763, |
| "learning_rate": 3.554006882125173e-05, |
| "loss": 0.346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1665937602519989, |
| "step": 1290, |
| "valid_targets_mean": 2208.9, |
| "valid_targets_min": 1027 |
| }, |
| { |
| "epoch": 2.0753205128205128, |
| "grad_norm": 0.6867619519062099, |
| "learning_rate": 3.5489636541641586e-05, |
| "loss": 0.3343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1533121019601822, |
| "step": 1295, |
| "valid_targets_mean": 2485.8, |
| "valid_targets_min": 1319 |
| }, |
| { |
| "epoch": 2.0833333333333335, |
| "grad_norm": 0.7660992574595947, |
| "learning_rate": 3.543895693344472e-05, |
| "loss": 0.3459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2186858355998993, |
| "step": 1300, |
| "valid_targets_mean": 3234.2, |
| "valid_targets_min": 1875 |
| }, |
| { |
| "epoch": 2.0913461538461537, |
| "grad_norm": 0.7111187839614682, |
| "learning_rate": 3.538803080588063e-05, |
| "loss": 0.3338, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1263820230960846, |
| "step": 1305, |
| "valid_targets_mean": 2168.0, |
| "valid_targets_min": 557 |
| }, |
| { |
| "epoch": 2.0993589743589745, |
| "grad_norm": 0.8189330742251553, |
| "learning_rate": 3.5336858972105076e-05, |
| "loss": 0.3724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17902137339115143, |
| "step": 1310, |
| "valid_targets_mean": 2206.6, |
| "valid_targets_min": 389 |
| }, |
| { |
| "epoch": 2.1073717948717947, |
| "grad_norm": 0.6791884046018158, |
| "learning_rate": 3.528544224919708e-05, |
| "loss": 0.3539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2036716639995575, |
| "step": 1315, |
| "valid_targets_mean": 3792.5, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 2.1153846153846154, |
| "grad_norm": 0.7284182583266996, |
| "learning_rate": 3.5233781458145934e-05, |
| "loss": 0.3485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20440541207790375, |
| "step": 1320, |
| "valid_targets_mean": 3414.0, |
| "valid_targets_min": 989 |
| }, |
| { |
| "epoch": 2.123397435897436, |
| "grad_norm": 0.8141069191193862, |
| "learning_rate": 3.5181877423838034e-05, |
| "loss": 0.3478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12585687637329102, |
| "step": 1325, |
| "valid_targets_mean": 1891.8, |
| "valid_targets_min": 329 |
| }, |
| { |
| "epoch": 2.1314102564102564, |
| "grad_norm": 0.7779645588888344, |
| "learning_rate": 3.512973097504371e-05, |
| "loss": 0.348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19460856914520264, |
| "step": 1330, |
| "valid_targets_mean": 2242.0, |
| "valid_targets_min": 1178 |
| }, |
| { |
| "epoch": 2.139423076923077, |
| "grad_norm": 0.7927049005753485, |
| "learning_rate": 3.507734294440403e-05, |
| "loss": 0.3607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14881053566932678, |
| "step": 1335, |
| "valid_targets_mean": 1846.4, |
| "valid_targets_min": 1157 |
| }, |
| { |
| "epoch": 2.1474358974358974, |
| "grad_norm": 1.2475102978708894, |
| "learning_rate": 3.50247141684175e-05, |
| "loss": 0.344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17731156945228577, |
| "step": 1340, |
| "valid_targets_mean": 1948.9, |
| "valid_targets_min": 811 |
| }, |
| { |
| "epoch": 2.155448717948718, |
| "grad_norm": 0.8006723258352239, |
| "learning_rate": 3.497184548742667e-05, |
| "loss": 0.3328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14808142185211182, |
| "step": 1345, |
| "valid_targets_mean": 2546.2, |
| "valid_targets_min": 1636 |
| }, |
| { |
| "epoch": 2.1634615384615383, |
| "grad_norm": 0.7877170951828761, |
| "learning_rate": 3.491873774560473e-05, |
| "loss": 0.3593, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15312331914901733, |
| "step": 1350, |
| "valid_targets_mean": 2226.0, |
| "valid_targets_min": 1151 |
| }, |
| { |
| "epoch": 2.171474358974359, |
| "grad_norm": 0.7625814945603144, |
| "learning_rate": 3.486539179094208e-05, |
| "loss": 0.3636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1644267737865448, |
| "step": 1355, |
| "valid_targets_mean": 2441.2, |
| "valid_targets_min": 1147 |
| }, |
| { |
| "epoch": 2.1794871794871793, |
| "grad_norm": 0.7774543384531808, |
| "learning_rate": 3.481180847523272e-05, |
| "loss": 0.3601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20621232688426971, |
| "step": 1360, |
| "valid_targets_mean": 2525.8, |
| "valid_targets_min": 884 |
| }, |
| { |
| "epoch": 2.1875, |
| "grad_norm": 0.7288588923791031, |
| "learning_rate": 3.4757988654060684e-05, |
| "loss": 0.341, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20766200125217438, |
| "step": 1365, |
| "valid_targets_mean": 3249.2, |
| "valid_targets_min": 1425 |
| }, |
| { |
| "epoch": 2.1955128205128207, |
| "grad_norm": 0.8803087140032898, |
| "learning_rate": 3.470393318678637e-05, |
| "loss": 0.3466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18664687871932983, |
| "step": 1370, |
| "valid_targets_mean": 1891.2, |
| "valid_targets_min": 1214 |
| }, |
| { |
| "epoch": 2.203525641025641, |
| "grad_norm": 0.9072383303435303, |
| "learning_rate": 3.4649642936532836e-05, |
| "loss": 0.339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16699038445949554, |
| "step": 1375, |
| "valid_targets_mean": 2271.9, |
| "valid_targets_min": 1252 |
| }, |
| { |
| "epoch": 2.2115384615384617, |
| "grad_norm": 0.8374276049391025, |
| "learning_rate": 3.4595118770171984e-05, |
| "loss": 0.338, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19499821960926056, |
| "step": 1380, |
| "valid_targets_mean": 2261.1, |
| "valid_targets_min": 921 |
| }, |
| { |
| "epoch": 2.219551282051282, |
| "grad_norm": 0.7110224511296612, |
| "learning_rate": 3.454036155831077e-05, |
| "loss": 0.3402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16453278064727783, |
| "step": 1385, |
| "valid_targets_mean": 3003.4, |
| "valid_targets_min": 984 |
| }, |
| { |
| "epoch": 2.2275641025641026, |
| "grad_norm": 0.8034598679262911, |
| "learning_rate": 3.4485372175277236e-05, |
| "loss": 0.339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21522057056427002, |
| "step": 1390, |
| "valid_targets_mean": 2669.6, |
| "valid_targets_min": 1629 |
| }, |
| { |
| "epoch": 2.235576923076923, |
| "grad_norm": 0.936818141069857, |
| "learning_rate": 3.44301514991066e-05, |
| "loss": 0.3514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18182526528835297, |
| "step": 1395, |
| "valid_targets_mean": 1872.4, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 2.2435897435897436, |
| "grad_norm": 1.0145081834032068, |
| "learning_rate": 3.4374700411527225e-05, |
| "loss": 0.3338, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18463921546936035, |
| "step": 1400, |
| "valid_targets_mean": 2367.8, |
| "valid_targets_min": 1028 |
| }, |
| { |
| "epoch": 2.251602564102564, |
| "grad_norm": 0.8485161257861278, |
| "learning_rate": 3.431901979794653e-05, |
| "loss": 0.3413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22386862337589264, |
| "step": 1405, |
| "valid_targets_mean": 2464.2, |
| "valid_targets_min": 1088 |
| }, |
| { |
| "epoch": 2.2596153846153846, |
| "grad_norm": 0.6648536661400917, |
| "learning_rate": 3.426311054743685e-05, |
| "loss": 0.3317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17803597450256348, |
| "step": 1410, |
| "valid_targets_mean": 2665.6, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 2.2676282051282053, |
| "grad_norm": 0.8127131589772357, |
| "learning_rate": 3.420697355272127e-05, |
| "loss": 0.3681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18442665040493011, |
| "step": 1415, |
| "valid_targets_mean": 2133.6, |
| "valid_targets_min": 1183 |
| }, |
| { |
| "epoch": 2.2756410256410255, |
| "grad_norm": 0.7669669977387416, |
| "learning_rate": 3.415060971015933e-05, |
| "loss": 0.3398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14786052703857422, |
| "step": 1420, |
| "valid_targets_mean": 2188.1, |
| "valid_targets_min": 1065 |
| }, |
| { |
| "epoch": 2.2836538461538463, |
| "grad_norm": 0.6858864773705935, |
| "learning_rate": 3.4094019919732736e-05, |
| "loss": 0.3458, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18889179825782776, |
| "step": 1425, |
| "valid_targets_mean": 3692.6, |
| "valid_targets_min": 1097 |
| }, |
| { |
| "epoch": 2.2916666666666665, |
| "grad_norm": 0.7713618046589539, |
| "learning_rate": 3.403720508503098e-05, |
| "loss": 0.3686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15971162915229797, |
| "step": 1430, |
| "valid_targets_mean": 2336.1, |
| "valid_targets_min": 416 |
| }, |
| { |
| "epoch": 2.2996794871794872, |
| "grad_norm": 0.929199437687356, |
| "learning_rate": 3.398016611323693e-05, |
| "loss": 0.3483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20525173842906952, |
| "step": 1435, |
| "valid_targets_mean": 2049.9, |
| "valid_targets_min": 1188 |
| }, |
| { |
| "epoch": 2.3076923076923075, |
| "grad_norm": 0.7351797681344957, |
| "learning_rate": 3.392290391511232e-05, |
| "loss": 0.362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19388672709465027, |
| "step": 1440, |
| "valid_targets_mean": 2718.4, |
| "valid_targets_min": 1272 |
| }, |
| { |
| "epoch": 2.315705128205128, |
| "grad_norm": 0.7830095585397322, |
| "learning_rate": 3.386541940498322e-05, |
| "loss": 0.3424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.200042262673378, |
| "step": 1445, |
| "valid_targets_mean": 2492.6, |
| "valid_targets_min": 1031 |
| }, |
| { |
| "epoch": 2.323717948717949, |
| "grad_norm": 0.7260002191823239, |
| "learning_rate": 3.380771350072543e-05, |
| "loss": 0.3463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20473235845565796, |
| "step": 1450, |
| "valid_targets_mean": 3114.0, |
| "valid_targets_min": 1678 |
| }, |
| { |
| "epoch": 2.331730769230769, |
| "grad_norm": 0.7003366188583651, |
| "learning_rate": 3.374978712374986e-05, |
| "loss": 0.3536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1109727993607521, |
| "step": 1455, |
| "valid_targets_mean": 1764.2, |
| "valid_targets_min": 853 |
| }, |
| { |
| "epoch": 2.33974358974359, |
| "grad_norm": 0.7556951896666148, |
| "learning_rate": 3.369164119898774e-05, |
| "loss": 0.3393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17174313962459564, |
| "step": 1460, |
| "valid_targets_mean": 2113.0, |
| "valid_targets_min": 1189 |
| }, |
| { |
| "epoch": 2.34775641025641, |
| "grad_norm": 0.8200928309772625, |
| "learning_rate": 3.363327665487593e-05, |
| "loss": 0.3544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15979711711406708, |
| "step": 1465, |
| "valid_targets_mean": 2258.0, |
| "valid_targets_min": 1672 |
| }, |
| { |
| "epoch": 2.355769230769231, |
| "grad_norm": 0.8309370694493936, |
| "learning_rate": 3.357469442334206e-05, |
| "loss": 0.3346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14197608828544617, |
| "step": 1470, |
| "valid_targets_mean": 1783.0, |
| "valid_targets_min": 1057 |
| }, |
| { |
| "epoch": 2.363782051282051, |
| "grad_norm": 0.7797104980045181, |
| "learning_rate": 3.351589543978965e-05, |
| "loss": 0.3431, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17039065062999725, |
| "step": 1475, |
| "valid_targets_mean": 2508.9, |
| "valid_targets_min": 1190 |
| }, |
| { |
| "epoch": 2.371794871794872, |
| "grad_norm": 0.7814917434524874, |
| "learning_rate": 3.345688064308317e-05, |
| "loss": 0.3274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15709833800792694, |
| "step": 1480, |
| "valid_targets_mean": 1788.9, |
| "valid_targets_min": 242 |
| }, |
| { |
| "epoch": 2.3798076923076925, |
| "grad_norm": 0.8902647624043396, |
| "learning_rate": 3.339765097553307e-05, |
| "loss": 0.376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1867244690656662, |
| "step": 1485, |
| "valid_targets_mean": 1679.9, |
| "valid_targets_min": 387 |
| }, |
| { |
| "epoch": 2.3878205128205128, |
| "grad_norm": 0.7346094387599812, |
| "learning_rate": 3.33382073828807e-05, |
| "loss": 0.3471, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13888698816299438, |
| "step": 1490, |
| "valid_targets_mean": 2292.5, |
| "valid_targets_min": 1131 |
| }, |
| { |
| "epoch": 2.3958333333333335, |
| "grad_norm": 0.9446299732229079, |
| "learning_rate": 3.327855081428326e-05, |
| "loss": 0.3449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18648427724838257, |
| "step": 1495, |
| "valid_targets_mean": 2009.9, |
| "valid_targets_min": 953 |
| }, |
| { |
| "epoch": 2.4038461538461537, |
| "grad_norm": 0.9536703972245442, |
| "learning_rate": 3.3218682222298584e-05, |
| "loss": 0.354, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1705888956785202, |
| "step": 1500, |
| "valid_targets_mean": 2930.1, |
| "valid_targets_min": 1317 |
| }, |
| { |
| "epoch": 2.4118589743589745, |
| "grad_norm": 0.7903036062618911, |
| "learning_rate": 3.315860256286996e-05, |
| "loss": 0.3293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13649359345436096, |
| "step": 1505, |
| "valid_targets_mean": 1522.0, |
| "valid_targets_min": 971 |
| }, |
| { |
| "epoch": 2.4198717948717947, |
| "grad_norm": 0.9511143375417098, |
| "learning_rate": 3.3098312795310894e-05, |
| "loss": 0.3604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16688911616802216, |
| "step": 1510, |
| "valid_targets_mean": 1994.0, |
| "valid_targets_min": 1433 |
| }, |
| { |
| "epoch": 2.4278846153846154, |
| "grad_norm": 0.7414997447826995, |
| "learning_rate": 3.303781388228974e-05, |
| "loss": 0.3339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19089877605438232, |
| "step": 1515, |
| "valid_targets_mean": 2811.2, |
| "valid_targets_min": 1503 |
| }, |
| { |
| "epoch": 2.435897435897436, |
| "grad_norm": 0.767828117255108, |
| "learning_rate": 3.297710678981435e-05, |
| "loss": 0.3574, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14534533023834229, |
| "step": 1520, |
| "valid_targets_mean": 2010.8, |
| "valid_targets_min": 1053 |
| }, |
| { |
| "epoch": 2.4439102564102564, |
| "grad_norm": 0.7887402243405925, |
| "learning_rate": 3.291619248721667e-05, |
| "loss": 0.3573, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18452662229537964, |
| "step": 1525, |
| "valid_targets_mean": 2406.5, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 2.451923076923077, |
| "grad_norm": 0.8651403875034883, |
| "learning_rate": 3.285507194713724e-05, |
| "loss": 0.3432, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21715617179870605, |
| "step": 1530, |
| "valid_targets_mean": 2057.1, |
| "valid_targets_min": 249 |
| }, |
| { |
| "epoch": 2.4599358974358974, |
| "grad_norm": 0.9068357442847398, |
| "learning_rate": 3.279374614550966e-05, |
| "loss": 0.3353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1632959544658661, |
| "step": 1535, |
| "valid_targets_mean": 1864.1, |
| "valid_targets_min": 500 |
| }, |
| { |
| "epoch": 2.467948717948718, |
| "grad_norm": 0.745269665162631, |
| "learning_rate": 3.2732216061545e-05, |
| "loss": 0.342, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1703471690416336, |
| "step": 1540, |
| "valid_targets_mean": 2952.0, |
| "valid_targets_min": 508 |
| }, |
| { |
| "epoch": 2.4759615384615383, |
| "grad_norm": 0.7463621637326882, |
| "learning_rate": 3.2670482677716214e-05, |
| "loss": 0.3561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12429662048816681, |
| "step": 1545, |
| "valid_targets_mean": 1754.8, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 2.483974358974359, |
| "grad_norm": 0.6632562787335162, |
| "learning_rate": 3.2608546979742394e-05, |
| "loss": 0.3604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.142435684800148, |
| "step": 1550, |
| "valid_targets_mean": 2705.5, |
| "valid_targets_min": 1315 |
| }, |
| { |
| "epoch": 2.4919871794871793, |
| "grad_norm": 1.0979260579943735, |
| "learning_rate": 3.254640995657307e-05, |
| "loss": 0.3423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17696614563465118, |
| "step": 1555, |
| "valid_targets_mean": 2757.8, |
| "valid_targets_min": 1335 |
| }, |
| { |
| "epoch": 2.5, |
| "grad_norm": 0.718451828389939, |
| "learning_rate": 3.248407260037239e-05, |
| "loss": 0.3522, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17623674869537354, |
| "step": 1560, |
| "valid_targets_mean": 3102.8, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 2.5080128205128203, |
| "grad_norm": 0.5714615297855816, |
| "learning_rate": 3.24215359065033e-05, |
| "loss": 0.3451, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11917003989219666, |
| "step": 1565, |
| "valid_targets_mean": 3913.8, |
| "valid_targets_min": 1852 |
| }, |
| { |
| "epoch": 2.516025641025641, |
| "grad_norm": 0.7253937767608349, |
| "learning_rate": 3.235880087351164e-05, |
| "loss": 0.3532, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13781258463859558, |
| "step": 1570, |
| "valid_targets_mean": 2443.8, |
| "valid_targets_min": 1277 |
| }, |
| { |
| "epoch": 2.5240384615384617, |
| "grad_norm": 0.7141718259882394, |
| "learning_rate": 3.2295868503110184e-05, |
| "loss": 0.336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1570618599653244, |
| "step": 1575, |
| "valid_targets_mean": 2712.8, |
| "valid_targets_min": 1092 |
| }, |
| { |
| "epoch": 2.532051282051282, |
| "grad_norm": 0.7370659727178314, |
| "learning_rate": 3.22327398001627e-05, |
| "loss": 0.3498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16354694962501526, |
| "step": 1580, |
| "valid_targets_mean": 2248.0, |
| "valid_targets_min": 1015 |
| }, |
| { |
| "epoch": 2.5400641025641026, |
| "grad_norm": 0.8429155440531665, |
| "learning_rate": 3.216941577266783e-05, |
| "loss": 0.3389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18911314010620117, |
| "step": 1585, |
| "valid_targets_mean": 1692.5, |
| "valid_targets_min": 473 |
| }, |
| { |
| "epoch": 2.5480769230769234, |
| "grad_norm": 0.8850080126831343, |
| "learning_rate": 3.210589743174308e-05, |
| "loss": 0.376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25558894872665405, |
| "step": 1590, |
| "valid_targets_mean": 2742.9, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 2.5560897435897436, |
| "grad_norm": 0.7791032617822178, |
| "learning_rate": 3.204218579160857e-05, |
| "loss": 0.3491, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1383132040500641, |
| "step": 1595, |
| "valid_targets_mean": 2072.0, |
| "valid_targets_min": 1294 |
| }, |
| { |
| "epoch": 2.564102564102564, |
| "grad_norm": 0.8381378811245371, |
| "learning_rate": 3.197828186957094e-05, |
| "loss": 0.344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18840298056602478, |
| "step": 1600, |
| "valid_targets_mean": 1596.6, |
| "valid_targets_min": 338 |
| }, |
| { |
| "epoch": 2.5721153846153846, |
| "grad_norm": 0.8590646227884097, |
| "learning_rate": 3.191418668600705e-05, |
| "loss": 0.3538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16716593503952026, |
| "step": 1605, |
| "valid_targets_mean": 1956.9, |
| "valid_targets_min": 1305 |
| }, |
| { |
| "epoch": 2.5801282051282053, |
| "grad_norm": 0.827636937072311, |
| "learning_rate": 3.184990126434771e-05, |
| "loss": 0.3496, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18711942434310913, |
| "step": 1610, |
| "valid_targets_mean": 2087.8, |
| "valid_targets_min": 941 |
| }, |
| { |
| "epoch": 2.5881410256410255, |
| "grad_norm": 0.7476429637498967, |
| "learning_rate": 3.178542663106131e-05, |
| "loss": 0.3452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1350896656513214, |
| "step": 1615, |
| "valid_targets_mean": 1842.0, |
| "valid_targets_min": 1224 |
| }, |
| { |
| "epoch": 2.5961538461538463, |
| "grad_norm": 0.6440604251073735, |
| "learning_rate": 3.172076381563748e-05, |
| "loss": 0.3368, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1780594140291214, |
| "step": 1620, |
| "valid_targets_mean": 3939.6, |
| "valid_targets_min": 1489 |
| }, |
| { |
| "epoch": 2.6041666666666665, |
| "grad_norm": 0.8225690775334342, |
| "learning_rate": 3.165591385057058e-05, |
| "loss": 0.3391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13189071416854858, |
| "step": 1625, |
| "valid_targets_mean": 1886.9, |
| "valid_targets_min": 895 |
| }, |
| { |
| "epoch": 2.6121794871794872, |
| "grad_norm": 0.7321770207000557, |
| "learning_rate": 3.1590877771343316e-05, |
| "loss": 0.3349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2012443244457245, |
| "step": 1630, |
| "valid_targets_mean": 3346.5, |
| "valid_targets_min": 1084 |
| }, |
| { |
| "epoch": 2.6201923076923075, |
| "grad_norm": 0.7457391847366335, |
| "learning_rate": 3.152565661641008e-05, |
| "loss": 0.3506, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17787332832813263, |
| "step": 1635, |
| "valid_targets_mean": 2177.1, |
| "valid_targets_min": 934 |
| }, |
| { |
| "epoch": 2.628205128205128, |
| "grad_norm": 0.7502464415879065, |
| "learning_rate": 3.1460251427180474e-05, |
| "loss": 0.3503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16391557455062866, |
| "step": 1640, |
| "valid_targets_mean": 2989.6, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 2.636217948717949, |
| "grad_norm": 0.9095546327940534, |
| "learning_rate": 3.139466324800263e-05, |
| "loss": 0.3692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1844089925289154, |
| "step": 1645, |
| "valid_targets_mean": 1437.8, |
| "valid_targets_min": 792 |
| }, |
| { |
| "epoch": 2.644230769230769, |
| "grad_norm": 0.7167811943459642, |
| "learning_rate": 3.132889312614655e-05, |
| "loss": 0.325, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1620154082775116, |
| "step": 1650, |
| "valid_targets_mean": 2718.0, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 2.65224358974359, |
| "grad_norm": 0.7082837484361146, |
| "learning_rate": 3.126294211178737e-05, |
| "loss": 0.3712, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22598208487033844, |
| "step": 1655, |
| "valid_targets_mean": 3451.8, |
| "valid_targets_min": 959 |
| }, |
| { |
| "epoch": 2.66025641025641, |
| "grad_norm": 0.7905440205287989, |
| "learning_rate": 3.1196811257988634e-05, |
| "loss": 0.3238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.166299968957901, |
| "step": 1660, |
| "valid_targets_mean": 2094.1, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 2.668269230769231, |
| "grad_norm": 0.7476779090208169, |
| "learning_rate": 3.1130501620685394e-05, |
| "loss": 0.3436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13155703246593475, |
| "step": 1665, |
| "valid_targets_mean": 2074.2, |
| "valid_targets_min": 1097 |
| }, |
| { |
| "epoch": 2.676282051282051, |
| "grad_norm": 0.614252113316522, |
| "learning_rate": 3.106401425866745e-05, |
| "loss": 0.3477, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11827291548252106, |
| "step": 1670, |
| "valid_targets_mean": 2858.2, |
| "valid_targets_min": 912 |
| }, |
| { |
| "epoch": 2.684294871794872, |
| "grad_norm": 0.8246290440439452, |
| "learning_rate": 3.099735023356236e-05, |
| "loss": 0.347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21760646998882294, |
| "step": 1675, |
| "valid_targets_mean": 2478.5, |
| "valid_targets_min": 1126 |
| }, |
| { |
| "epoch": 2.6923076923076925, |
| "grad_norm": 0.8477067106504065, |
| "learning_rate": 3.0930510609818564e-05, |
| "loss": 0.3248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18377399444580078, |
| "step": 1680, |
| "valid_targets_mean": 2193.5, |
| "valid_targets_min": 1098 |
| }, |
| { |
| "epoch": 2.7003205128205128, |
| "grad_norm": 0.743871662197125, |
| "learning_rate": 3.086349645468831e-05, |
| "loss": 0.3422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16777920722961426, |
| "step": 1685, |
| "valid_targets_mean": 2257.5, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 2.7083333333333335, |
| "grad_norm": 0.8446130888099646, |
| "learning_rate": 3.079630883821067e-05, |
| "loss": 0.3332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1785382628440857, |
| "step": 1690, |
| "valid_targets_mean": 2225.0, |
| "valid_targets_min": 1133 |
| }, |
| { |
| "epoch": 2.7163461538461537, |
| "grad_norm": 0.7190320385340914, |
| "learning_rate": 3.0728948833194436e-05, |
| "loss": 0.3663, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1873319000005722, |
| "step": 1695, |
| "valid_targets_mean": 3258.6, |
| "valid_targets_min": 1604 |
| }, |
| { |
| "epoch": 2.7243589743589745, |
| "grad_norm": 0.7955833242225298, |
| "learning_rate": 3.066141751520099e-05, |
| "loss": 0.3468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16164278984069824, |
| "step": 1700, |
| "valid_targets_mean": 2220.6, |
| "valid_targets_min": 948 |
| }, |
| { |
| "epoch": 2.7323717948717947, |
| "grad_norm": 0.8727727023841495, |
| "learning_rate": 3.059371596252712e-05, |
| "loss": 0.3399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1807830035686493, |
| "step": 1705, |
| "valid_targets_mean": 2360.4, |
| "valid_targets_min": 1186 |
| }, |
| { |
| "epoch": 2.7403846153846154, |
| "grad_norm": 0.8285434490328112, |
| "learning_rate": 3.0525845256187834e-05, |
| "loss": 0.3647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19549046456813812, |
| "step": 1710, |
| "valid_targets_mean": 2300.2, |
| "valid_targets_min": 1139 |
| }, |
| { |
| "epoch": 2.748397435897436, |
| "grad_norm": 0.6665940354235458, |
| "learning_rate": 3.0457806479899044e-05, |
| "loss": 0.3145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1639786660671234, |
| "step": 1715, |
| "valid_targets_mean": 3070.1, |
| "valid_targets_min": 1047 |
| }, |
| { |
| "epoch": 2.7564102564102564, |
| "grad_norm": 0.7400644302712954, |
| "learning_rate": 3.0389600720060318e-05, |
| "loss": 0.344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15920796990394592, |
| "step": 1720, |
| "valid_targets_mean": 2484.5, |
| "valid_targets_min": 1521 |
| }, |
| { |
| "epoch": 2.7644230769230766, |
| "grad_norm": 0.6529233923053657, |
| "learning_rate": 3.0321229065737522e-05, |
| "loss": 0.3434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15723413228988647, |
| "step": 1725, |
| "valid_targets_mean": 2664.8, |
| "valid_targets_min": 1180 |
| }, |
| { |
| "epoch": 2.7724358974358974, |
| "grad_norm": 0.9818917911509216, |
| "learning_rate": 3.0252692608645384e-05, |
| "loss": 0.3592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18439249694347382, |
| "step": 1730, |
| "valid_targets_mean": 1599.9, |
| "valid_targets_min": 931 |
| }, |
| { |
| "epoch": 2.780448717948718, |
| "grad_norm": 0.7429322400334534, |
| "learning_rate": 3.0183992443130127e-05, |
| "loss": 0.3221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1347109079360962, |
| "step": 1735, |
| "valid_targets_mean": 2627.2, |
| "valid_targets_min": 1023 |
| }, |
| { |
| "epoch": 2.7884615384615383, |
| "grad_norm": 0.825330415012023, |
| "learning_rate": 3.011512966615195e-05, |
| "loss": 0.3568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1733407974243164, |
| "step": 1740, |
| "valid_targets_mean": 2149.0, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 2.796474358974359, |
| "grad_norm": 0.7695789184189072, |
| "learning_rate": 3.0046105377267523e-05, |
| "loss": 0.3452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13556677103042603, |
| "step": 1745, |
| "valid_targets_mean": 2014.4, |
| "valid_targets_min": 1220 |
| }, |
| { |
| "epoch": 2.8044871794871797, |
| "grad_norm": 0.7365188240450388, |
| "learning_rate": 2.9976920678612456e-05, |
| "loss": 0.3379, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19936934113502502, |
| "step": 1750, |
| "valid_targets_mean": 3110.4, |
| "valid_targets_min": 1290 |
| }, |
| { |
| "epoch": 2.8125, |
| "grad_norm": 0.7010220729446671, |
| "learning_rate": 2.9907576674883664e-05, |
| "loss": 0.3527, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14287908375263214, |
| "step": 1755, |
| "valid_targets_mean": 2108.6, |
| "valid_targets_min": 1171 |
| }, |
| { |
| "epoch": 2.8205128205128203, |
| "grad_norm": 1.0422014811559845, |
| "learning_rate": 2.983807447332174e-05, |
| "loss": 0.3366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19687989354133606, |
| "step": 1760, |
| "valid_targets_mean": 2476.4, |
| "valid_targets_min": 828 |
| }, |
| { |
| "epoch": 2.828525641025641, |
| "grad_norm": 0.7770747301590775, |
| "learning_rate": 2.9768415183693293e-05, |
| "loss": 0.3622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19372722506523132, |
| "step": 1765, |
| "valid_targets_mean": 2394.9, |
| "valid_targets_min": 577 |
| }, |
| { |
| "epoch": 2.8365384615384617, |
| "grad_norm": 0.7422438539405928, |
| "learning_rate": 2.9698599918273197e-05, |
| "loss": 0.3448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1415659487247467, |
| "step": 1770, |
| "valid_targets_mean": 1877.5, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 2.844551282051282, |
| "grad_norm": 0.8216346096786719, |
| "learning_rate": 2.962862979182686e-05, |
| "loss": 0.3372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17512428760528564, |
| "step": 1775, |
| "valid_targets_mean": 2119.5, |
| "valid_targets_min": 1289 |
| }, |
| { |
| "epoch": 2.8525641025641026, |
| "grad_norm": 0.6864990682783045, |
| "learning_rate": 2.95585059215924e-05, |
| "loss": 0.3494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14896155893802643, |
| "step": 1780, |
| "valid_targets_mean": 2570.9, |
| "valid_targets_min": 1166 |
| }, |
| { |
| "epoch": 2.8605769230769234, |
| "grad_norm": 0.7673674716714654, |
| "learning_rate": 2.948822942726284e-05, |
| "loss": 0.3436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1696726679801941, |
| "step": 1785, |
| "valid_targets_mean": 2115.2, |
| "valid_targets_min": 1126 |
| }, |
| { |
| "epoch": 2.8685897435897436, |
| "grad_norm": 0.787999238286826, |
| "learning_rate": 2.941780143096817e-05, |
| "loss": 0.3485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23070955276489258, |
| "step": 1790, |
| "valid_targets_mean": 2714.6, |
| "valid_targets_min": 1237 |
| }, |
| { |
| "epoch": 2.876602564102564, |
| "grad_norm": 0.6927465574387711, |
| "learning_rate": 2.9347223057257505e-05, |
| "loss": 0.3081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15984871983528137, |
| "step": 1795, |
| "valid_targets_mean": 2840.6, |
| "valid_targets_min": 1456 |
| }, |
| { |
| "epoch": 2.8846153846153846, |
| "grad_norm": 0.7229524925061765, |
| "learning_rate": 2.927649543308106e-05, |
| "loss": 0.3195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1824902594089508, |
| "step": 1800, |
| "valid_targets_mean": 2636.5, |
| "valid_targets_min": 1155 |
| }, |
| { |
| "epoch": 2.8926282051282053, |
| "grad_norm": 0.9207234756930798, |
| "learning_rate": 2.9205619687772212e-05, |
| "loss": 0.3468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.194568932056427, |
| "step": 1805, |
| "valid_targets_mean": 2309.9, |
| "valid_targets_min": 1418 |
| }, |
| { |
| "epoch": 2.9006410256410255, |
| "grad_norm": 0.8484173433057807, |
| "learning_rate": 2.9134596953029413e-05, |
| "loss": 0.3508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18519386649131775, |
| "step": 1810, |
| "valid_targets_mean": 1788.4, |
| "valid_targets_min": 1265 |
| }, |
| { |
| "epoch": 2.9086538461538463, |
| "grad_norm": 0.8106235389071998, |
| "learning_rate": 2.9063428362898168e-05, |
| "loss": 0.3538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18934476375579834, |
| "step": 1815, |
| "valid_targets_mean": 2666.2, |
| "valid_targets_min": 1363 |
| }, |
| { |
| "epoch": 2.9166666666666665, |
| "grad_norm": 0.8083685538552774, |
| "learning_rate": 2.8992115053752905e-05, |
| "loss": 0.336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21094626188278198, |
| "step": 1820, |
| "valid_targets_mean": 2983.9, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 2.9246794871794872, |
| "grad_norm": 0.683223511020343, |
| "learning_rate": 2.8920658164278816e-05, |
| "loss": 0.3449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19165866076946259, |
| "step": 1825, |
| "valid_targets_mean": 3494.6, |
| "valid_targets_min": 1391 |
| }, |
| { |
| "epoch": 2.9326923076923075, |
| "grad_norm": 0.7022396849802295, |
| "learning_rate": 2.884905883545373e-05, |
| "loss": 0.3389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1804656982421875, |
| "step": 1830, |
| "valid_targets_mean": 2772.4, |
| "valid_targets_min": 1289 |
| }, |
| { |
| "epoch": 2.940705128205128, |
| "grad_norm": 0.699550022589993, |
| "learning_rate": 2.877731821052981e-05, |
| "loss": 0.3475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15796631574630737, |
| "step": 1835, |
| "valid_targets_mean": 2599.6, |
| "valid_targets_min": 985 |
| }, |
| { |
| "epoch": 2.948717948717949, |
| "grad_norm": 0.7457851430690988, |
| "learning_rate": 2.8705437435015375e-05, |
| "loss": 0.3592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1569703370332718, |
| "step": 1840, |
| "valid_targets_mean": 2262.1, |
| "valid_targets_min": 1235 |
| }, |
| { |
| "epoch": 2.956730769230769, |
| "grad_norm": 0.8448740229638224, |
| "learning_rate": 2.8633417656656566e-05, |
| "loss": 0.3345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19404947757720947, |
| "step": 1845, |
| "valid_targets_mean": 1978.1, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 2.96474358974359, |
| "grad_norm": 0.8042048534440943, |
| "learning_rate": 2.8561260025419036e-05, |
| "loss": 0.3377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18623505532741547, |
| "step": 1850, |
| "valid_targets_mean": 2426.5, |
| "valid_targets_min": 980 |
| }, |
| { |
| "epoch": 2.97275641025641, |
| "grad_norm": 0.7147551803870944, |
| "learning_rate": 2.8488965693469583e-05, |
| "loss": 0.328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19029518961906433, |
| "step": 1855, |
| "valid_targets_mean": 2745.0, |
| "valid_targets_min": 1748 |
| }, |
| { |
| "epoch": 2.980769230769231, |
| "grad_norm": 0.7361534209295404, |
| "learning_rate": 2.8416535815157763e-05, |
| "loss": 0.3141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1878901571035385, |
| "step": 1860, |
| "valid_targets_mean": 2995.4, |
| "valid_targets_min": 1033 |
| }, |
| { |
| "epoch": 2.988782051282051, |
| "grad_norm": 0.7658891299385264, |
| "learning_rate": 2.8343971546997434e-05, |
| "loss": 0.3467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16783340275287628, |
| "step": 1865, |
| "valid_targets_mean": 2798.8, |
| "valid_targets_min": 383 |
| }, |
| { |
| "epoch": 2.996794871794872, |
| "grad_norm": 0.7446832022601828, |
| "learning_rate": 2.827127404764831e-05, |
| "loss": 0.3496, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16190892457962036, |
| "step": 1870, |
| "valid_targets_mean": 2053.6, |
| "valid_targets_min": 895 |
| }, |
| { |
| "epoch": 3.0048076923076925, |
| "grad_norm": 0.7325957115374676, |
| "learning_rate": 2.8198444477897467e-05, |
| "loss": 0.3039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1726066768169403, |
| "step": 1875, |
| "valid_targets_mean": 2703.5, |
| "valid_targets_min": 321 |
| }, |
| { |
| "epoch": 3.0128205128205128, |
| "grad_norm": 0.8146787211464528, |
| "learning_rate": 2.8125484000640787e-05, |
| "loss": 0.2898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14417630434036255, |
| "step": 1880, |
| "valid_targets_mean": 2497.8, |
| "valid_targets_min": 1203 |
| }, |
| { |
| "epoch": 3.0208333333333335, |
| "grad_norm": 0.8406399733518674, |
| "learning_rate": 2.8052393780864394e-05, |
| "loss": 0.3054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1478326916694641, |
| "step": 1885, |
| "valid_targets_mean": 2281.6, |
| "valid_targets_min": 1267 |
| }, |
| { |
| "epoch": 3.0288461538461537, |
| "grad_norm": 0.7160031702370862, |
| "learning_rate": 2.797917498562607e-05, |
| "loss": 0.294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13371425867080688, |
| "step": 1890, |
| "valid_targets_mean": 3478.1, |
| "valid_targets_min": 2443 |
| }, |
| { |
| "epoch": 3.0368589743589745, |
| "grad_norm": 0.7856133018379108, |
| "learning_rate": 2.7905828784036596e-05, |
| "loss": 0.2932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19632607698440552, |
| "step": 1895, |
| "valid_targets_mean": 3087.1, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 3.0448717948717947, |
| "grad_norm": 0.947660312509705, |
| "learning_rate": 2.78323563472411e-05, |
| "loss": 0.3186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13372501730918884, |
| "step": 1900, |
| "valid_targets_mean": 1653.9, |
| "valid_targets_min": 1072 |
| }, |
| { |
| "epoch": 3.0528846153846154, |
| "grad_norm": 0.9400847917635448, |
| "learning_rate": 2.7758758848400354e-05, |
| "loss": 0.3086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1144673079252243, |
| "step": 1905, |
| "valid_targets_mean": 1697.1, |
| "valid_targets_min": 859 |
| }, |
| { |
| "epoch": 3.0608974358974357, |
| "grad_norm": 0.7027648710059686, |
| "learning_rate": 2.7685037462672043e-05, |
| "loss": 0.3216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10471771657466888, |
| "step": 1910, |
| "valid_targets_mean": 2158.2, |
| "valid_targets_min": 1249 |
| }, |
| { |
| "epoch": 3.0689102564102564, |
| "grad_norm": 0.9402109201312709, |
| "learning_rate": 2.7611193367191993e-05, |
| "loss": 0.3119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21580298244953156, |
| "step": 1915, |
| "valid_targets_mean": 2296.0, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 3.076923076923077, |
| "grad_norm": 0.9572841906462561, |
| "learning_rate": 2.7537227741055378e-05, |
| "loss": 0.3104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1641775518655777, |
| "step": 1920, |
| "valid_targets_mean": 1653.5, |
| "valid_targets_min": 1161 |
| }, |
| { |
| "epoch": 3.0849358974358974, |
| "grad_norm": 0.729963052156269, |
| "learning_rate": 2.746314176529791e-05, |
| "loss": 0.2922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14104565978050232, |
| "step": 1925, |
| "valid_targets_mean": 2807.6, |
| "valid_targets_min": 1764 |
| }, |
| { |
| "epoch": 3.092948717948718, |
| "grad_norm": 0.7748643309949854, |
| "learning_rate": 2.7388936622876957e-05, |
| "loss": 0.2911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1505746990442276, |
| "step": 1930, |
| "valid_targets_mean": 2144.5, |
| "valid_targets_min": 960 |
| }, |
| { |
| "epoch": 3.1009615384615383, |
| "grad_norm": 0.7762780237813749, |
| "learning_rate": 2.7314613498652663e-05, |
| "loss": 0.2857, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17231060564517975, |
| "step": 1935, |
| "valid_targets_mean": 3336.2, |
| "valid_targets_min": 1030 |
| }, |
| { |
| "epoch": 3.108974358974359, |
| "grad_norm": 0.6722190788058807, |
| "learning_rate": 2.7240173579369025e-05, |
| "loss": 0.2833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14252430200576782, |
| "step": 1940, |
| "valid_targets_mean": 3849.6, |
| "valid_targets_min": 1573 |
| }, |
| { |
| "epoch": 3.1169871794871793, |
| "grad_norm": 0.9430632446810732, |
| "learning_rate": 2.7165618053634962e-05, |
| "loss": 0.3255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1814703643321991, |
| "step": 1945, |
| "valid_targets_mean": 2009.1, |
| "valid_targets_min": 1026 |
| }, |
| { |
| "epoch": 3.125, |
| "grad_norm": 0.7277451337056141, |
| "learning_rate": 2.7090948111905304e-05, |
| "loss": 0.283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15981590747833252, |
| "step": 1950, |
| "valid_targets_mean": 3229.4, |
| "valid_targets_min": 979 |
| }, |
| { |
| "epoch": 3.1330128205128207, |
| "grad_norm": 0.8461152648042034, |
| "learning_rate": 2.701616494646183e-05, |
| "loss": 0.3036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1708703637123108, |
| "step": 1955, |
| "valid_targets_mean": 2370.4, |
| "valid_targets_min": 1092 |
| }, |
| { |
| "epoch": 3.141025641025641, |
| "grad_norm": 0.8759130229646693, |
| "learning_rate": 2.6941269751394174e-05, |
| "loss": 0.3199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1723184883594513, |
| "step": 1960, |
| "valid_targets_mean": 2504.0, |
| "valid_targets_min": 929 |
| }, |
| { |
| "epoch": 3.1490384615384617, |
| "grad_norm": 0.8760804346780584, |
| "learning_rate": 2.686626372258081e-05, |
| "loss": 0.3108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1883678436279297, |
| "step": 1965, |
| "valid_targets_mean": 2763.2, |
| "valid_targets_min": 1438 |
| }, |
| { |
| "epoch": 3.157051282051282, |
| "grad_norm": 0.7824998399362582, |
| "learning_rate": 2.6791148057669913e-05, |
| "loss": 0.3121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14598461985588074, |
| "step": 1970, |
| "valid_targets_mean": 1893.1, |
| "valid_targets_min": 811 |
| }, |
| { |
| "epoch": 3.1650641025641026, |
| "grad_norm": 0.7207162402545875, |
| "learning_rate": 2.671592395606027e-05, |
| "loss": 0.2963, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1699347198009491, |
| "step": 1975, |
| "valid_targets_mean": 3550.0, |
| "valid_targets_min": 1056 |
| }, |
| { |
| "epoch": 3.173076923076923, |
| "grad_norm": 0.8392526596294367, |
| "learning_rate": 2.6640592618882114e-05, |
| "loss": 0.2851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12137892842292786, |
| "step": 1980, |
| "valid_targets_mean": 2289.5, |
| "valid_targets_min": 1066 |
| }, |
| { |
| "epoch": 3.1810897435897436, |
| "grad_norm": 0.6882637569568384, |
| "learning_rate": 2.656515524897795e-05, |
| "loss": 0.317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19221651554107666, |
| "step": 1985, |
| "valid_targets_mean": 3759.4, |
| "valid_targets_min": 1478 |
| }, |
| { |
| "epoch": 3.189102564102564, |
| "grad_norm": 0.9801416336913753, |
| "learning_rate": 2.6489613050883343e-05, |
| "loss": 0.3079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15233540534973145, |
| "step": 1990, |
| "valid_targets_mean": 1970.0, |
| "valid_targets_min": 1294 |
| }, |
| { |
| "epoch": 3.1971153846153846, |
| "grad_norm": 0.7453903933538132, |
| "learning_rate": 2.6413967230807677e-05, |
| "loss": 0.2709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16587764024734497, |
| "step": 1995, |
| "valid_targets_mean": 3308.9, |
| "valid_targets_min": 1813 |
| }, |
| { |
| "epoch": 3.2051282051282053, |
| "grad_norm": 0.7841224659830258, |
| "learning_rate": 2.6338218996614924e-05, |
| "loss": 0.3102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12263019382953644, |
| "step": 2000, |
| "valid_targets_mean": 2472.6, |
| "valid_targets_min": 925 |
| }, |
| { |
| "epoch": 3.2131410256410255, |
| "grad_norm": 0.9039563479812038, |
| "learning_rate": 2.6262369557804325e-05, |
| "loss": 0.3313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1826220154762268, |
| "step": 2005, |
| "valid_targets_mean": 2237.0, |
| "valid_targets_min": 999 |
| }, |
| { |
| "epoch": 3.2211538461538463, |
| "grad_norm": 0.8416860751127145, |
| "learning_rate": 2.6186420125491094e-05, |
| "loss": 0.3029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1301402747631073, |
| "step": 2010, |
| "valid_targets_mean": 2353.5, |
| "valid_targets_min": 925 |
| }, |
| { |
| "epoch": 3.2291666666666665, |
| "grad_norm": 0.8526043964264228, |
| "learning_rate": 2.6110371912387083e-05, |
| "loss": 0.3157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14723050594329834, |
| "step": 2015, |
| "valid_targets_mean": 1859.8, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 3.2371794871794872, |
| "grad_norm": 0.7157138595622383, |
| "learning_rate": 2.6034226132781407e-05, |
| "loss": 0.2923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1483040452003479, |
| "step": 2020, |
| "valid_targets_mean": 3164.2, |
| "valid_targets_min": 1033 |
| }, |
| { |
| "epoch": 3.2451923076923075, |
| "grad_norm": 0.8354355862763577, |
| "learning_rate": 2.5957984002521066e-05, |
| "loss": 0.2997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.151239812374115, |
| "step": 2025, |
| "valid_targets_mean": 1905.2, |
| "valid_targets_min": 816 |
| }, |
| { |
| "epoch": 3.253205128205128, |
| "grad_norm": 0.8549380234850392, |
| "learning_rate": 2.588164673899151e-05, |
| "loss": 0.3203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14034335315227509, |
| "step": 2030, |
| "valid_targets_mean": 1982.0, |
| "valid_targets_min": 1465 |
| }, |
| { |
| "epoch": 3.261217948717949, |
| "grad_norm": 0.6918270014906354, |
| "learning_rate": 2.580521556109724e-05, |
| "loss": 0.3121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1363942176103592, |
| "step": 2035, |
| "valid_targets_mean": 2749.0, |
| "valid_targets_min": 1295 |
| }, |
| { |
| "epoch": 3.269230769230769, |
| "grad_norm": 1.0174666576501485, |
| "learning_rate": 2.57286916892423e-05, |
| "loss": 0.3029, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18560458719730377, |
| "step": 2040, |
| "valid_targets_mean": 1905.9, |
| "valid_targets_min": 1423 |
| }, |
| { |
| "epoch": 3.27724358974359, |
| "grad_norm": 0.9140763921901908, |
| "learning_rate": 2.5652076345310822e-05, |
| "loss": 0.3259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14916765689849854, |
| "step": 2045, |
| "valid_targets_mean": 1814.0, |
| "valid_targets_min": 1239 |
| }, |
| { |
| "epoch": 3.28525641025641, |
| "grad_norm": 0.6748799927803247, |
| "learning_rate": 2.5575370752647507e-05, |
| "loss": 0.2976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12936852872371674, |
| "step": 2050, |
| "valid_targets_mean": 2390.4, |
| "valid_targets_min": 1174 |
| }, |
| { |
| "epoch": 3.293269230769231, |
| "grad_norm": 0.7156103482993798, |
| "learning_rate": 2.5498576136038077e-05, |
| "loss": 0.32, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1080101728439331, |
| "step": 2055, |
| "valid_targets_mean": 1998.4, |
| "valid_targets_min": 1159 |
| }, |
| { |
| "epoch": 3.301282051282051, |
| "grad_norm": 0.703655239658459, |
| "learning_rate": 2.542169372168976e-05, |
| "loss": 0.3054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12107835710048676, |
| "step": 2060, |
| "valid_targets_mean": 2706.5, |
| "valid_targets_min": 653 |
| }, |
| { |
| "epoch": 3.309294871794872, |
| "grad_norm": 0.739225948183899, |
| "learning_rate": 2.5344724737211646e-05, |
| "loss": 0.3064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09956350922584534, |
| "step": 2065, |
| "valid_targets_mean": 1626.0, |
| "valid_targets_min": 1021 |
| }, |
| { |
| "epoch": 3.3173076923076925, |
| "grad_norm": 2.2757640724713064, |
| "learning_rate": 2.5267670411595152e-05, |
| "loss": 0.3038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1255197525024414, |
| "step": 2070, |
| "valid_targets_mean": 2971.5, |
| "valid_targets_min": 1132 |
| }, |
| { |
| "epoch": 3.3253205128205128, |
| "grad_norm": 0.7500910233878659, |
| "learning_rate": 2.5190531975194345e-05, |
| "loss": 0.3003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14343443512916565, |
| "step": 2075, |
| "valid_targets_mean": 3160.2, |
| "valid_targets_min": 1641 |
| }, |
| { |
| "epoch": 3.3333333333333335, |
| "grad_norm": 0.7428850119831736, |
| "learning_rate": 2.5113310659706322e-05, |
| "loss": 0.3057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1660858690738678, |
| "step": 2080, |
| "valid_targets_mean": 3558.9, |
| "valid_targets_min": 988 |
| }, |
| { |
| "epoch": 3.3413461538461537, |
| "grad_norm": 0.805327734018275, |
| "learning_rate": 2.5036007698151553e-05, |
| "loss": 0.2945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11538653075695038, |
| "step": 2085, |
| "valid_targets_mean": 2320.5, |
| "valid_targets_min": 990 |
| }, |
| { |
| "epoch": 3.3493589743589745, |
| "grad_norm": 0.8271835600858624, |
| "learning_rate": 2.4958624324854185e-05, |
| "loss": 0.3124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1344335377216339, |
| "step": 2090, |
| "valid_targets_mean": 1865.6, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 3.3573717948717947, |
| "grad_norm": 0.7768125076129313, |
| "learning_rate": 2.4881161775422303e-05, |
| "loss": 0.288, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16174614429473877, |
| "step": 2095, |
| "valid_targets_mean": 2769.1, |
| "valid_targets_min": 233 |
| }, |
| { |
| "epoch": 3.3653846153846154, |
| "grad_norm": 0.8892991278143192, |
| "learning_rate": 2.480362128672824e-05, |
| "loss": 0.3083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1573309600353241, |
| "step": 2100, |
| "valid_targets_mean": 2051.8, |
| "valid_targets_min": 878 |
| }, |
| { |
| "epoch": 3.373397435897436, |
| "grad_norm": 0.8378062536549976, |
| "learning_rate": 2.4726004096888817e-05, |
| "loss": 0.302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20106950402259827, |
| "step": 2105, |
| "valid_targets_mean": 3109.9, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 3.3814102564102564, |
| "grad_norm": 0.8230359694097013, |
| "learning_rate": 2.4648311445245558e-05, |
| "loss": 0.3226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2123335748910904, |
| "step": 2110, |
| "valid_targets_mean": 2667.5, |
| "valid_targets_min": 1020 |
| }, |
| { |
| "epoch": 3.389423076923077, |
| "grad_norm": 0.9290568558607065, |
| "learning_rate": 2.457054457234493e-05, |
| "loss": 0.3193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18395236134529114, |
| "step": 2115, |
| "valid_targets_mean": 2331.6, |
| "valid_targets_min": 281 |
| }, |
| { |
| "epoch": 3.3974358974358974, |
| "grad_norm": 0.7670991635073626, |
| "learning_rate": 2.4492704719918497e-05, |
| "loss": 0.3027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15496304631233215, |
| "step": 2120, |
| "valid_targets_mean": 2392.4, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 3.405448717948718, |
| "grad_norm": 0.782240421451244, |
| "learning_rate": 2.4414793130863134e-05, |
| "loss": 0.2938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18173784017562866, |
| "step": 2125, |
| "valid_targets_mean": 3618.1, |
| "valid_targets_min": 708 |
| }, |
| { |
| "epoch": 3.4134615384615383, |
| "grad_norm": 0.7322971407666778, |
| "learning_rate": 2.433681104922114e-05, |
| "loss": 0.3136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.117400161921978, |
| "step": 2130, |
| "valid_targets_mean": 2565.1, |
| "valid_targets_min": 1052 |
| }, |
| { |
| "epoch": 3.421474358974359, |
| "grad_norm": 0.6489435534494313, |
| "learning_rate": 2.4258759720160412e-05, |
| "loss": 0.3057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13403040170669556, |
| "step": 2135, |
| "valid_targets_mean": 3160.1, |
| "valid_targets_min": 1714 |
| }, |
| { |
| "epoch": 3.4294871794871793, |
| "grad_norm": 0.7779796344498587, |
| "learning_rate": 2.4180640389954534e-05, |
| "loss": 0.3, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15386280417442322, |
| "step": 2140, |
| "valid_targets_mean": 2593.6, |
| "valid_targets_min": 1072 |
| }, |
| { |
| "epoch": 3.4375, |
| "grad_norm": 0.8296585482152623, |
| "learning_rate": 2.4102454305962892e-05, |
| "loss": 0.3107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1341044306755066, |
| "step": 2145, |
| "valid_targets_mean": 1699.1, |
| "valid_targets_min": 361 |
| }, |
| { |
| "epoch": 3.4455128205128207, |
| "grad_norm": 0.7714401323308417, |
| "learning_rate": 2.402420271661076e-05, |
| "loss": 0.2962, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14644163846969604, |
| "step": 2150, |
| "valid_targets_mean": 3023.0, |
| "valid_targets_min": 942 |
| }, |
| { |
| "epoch": 3.453525641025641, |
| "grad_norm": 0.7696698896813144, |
| "learning_rate": 2.3945886871369338e-05, |
| "loss": 0.2974, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16718119382858276, |
| "step": 2155, |
| "valid_targets_mean": 3139.9, |
| "valid_targets_min": 1343 |
| }, |
| { |
| "epoch": 3.4615384615384617, |
| "grad_norm": 0.8050270640705677, |
| "learning_rate": 2.3867508020735865e-05, |
| "loss": 0.3004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13597774505615234, |
| "step": 2160, |
| "valid_targets_mean": 2135.0, |
| "valid_targets_min": 1281 |
| }, |
| { |
| "epoch": 3.469551282051282, |
| "grad_norm": 0.880792188264717, |
| "learning_rate": 2.3789067416213568e-05, |
| "loss": 0.2981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.134599506855011, |
| "step": 2165, |
| "valid_targets_mean": 2303.0, |
| "valid_targets_min": 1009 |
| }, |
| { |
| "epoch": 3.4775641025641026, |
| "grad_norm": 0.7868422040472738, |
| "learning_rate": 2.3710566310291733e-05, |
| "loss": 0.3001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13010697066783905, |
| "step": 2170, |
| "valid_targets_mean": 2357.6, |
| "valid_targets_min": 896 |
| }, |
| { |
| "epoch": 3.485576923076923, |
| "grad_norm": 0.8317296109067873, |
| "learning_rate": 2.36320059564257e-05, |
| "loss": 0.308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17702716588974, |
| "step": 2175, |
| "valid_targets_mean": 2804.6, |
| "valid_targets_min": 1479 |
| }, |
| { |
| "epoch": 3.4935897435897436, |
| "grad_norm": 0.7742404251072617, |
| "learning_rate": 2.3553387609016833e-05, |
| "loss": 0.2938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.146556094288826, |
| "step": 2180, |
| "valid_targets_mean": 2264.8, |
| "valid_targets_min": 1623 |
| }, |
| { |
| "epoch": 3.501602564102564, |
| "grad_norm": 0.8147300113930734, |
| "learning_rate": 2.347471252339252e-05, |
| "loss": 0.3077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1777869015932083, |
| "step": 2185, |
| "valid_targets_mean": 2804.1, |
| "valid_targets_min": 1277 |
| }, |
| { |
| "epoch": 3.5096153846153846, |
| "grad_norm": 0.848117651346152, |
| "learning_rate": 2.339598195578608e-05, |
| "loss": 0.3088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14068767428398132, |
| "step": 2190, |
| "valid_targets_mean": 1880.0, |
| "valid_targets_min": 895 |
| }, |
| { |
| "epoch": 3.5176282051282053, |
| "grad_norm": 0.7692448440855282, |
| "learning_rate": 2.3317197163316757e-05, |
| "loss": 0.3181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13899481296539307, |
| "step": 2195, |
| "valid_targets_mean": 2212.0, |
| "valid_targets_min": 853 |
| }, |
| { |
| "epoch": 3.5256410256410255, |
| "grad_norm": 0.8800744946825352, |
| "learning_rate": 2.3238359403969608e-05, |
| "loss": 0.3115, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16469797492027283, |
| "step": 2200, |
| "valid_targets_mean": 2316.8, |
| "valid_targets_min": 443 |
| }, |
| { |
| "epoch": 3.5336538461538463, |
| "grad_norm": 0.9037287807197032, |
| "learning_rate": 2.315946993657543e-05, |
| "loss": 0.3168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15300291776657104, |
| "step": 2205, |
| "valid_targets_mean": 1937.8, |
| "valid_targets_min": 1433 |
| }, |
| { |
| "epoch": 3.5416666666666665, |
| "grad_norm": 0.7352963329157969, |
| "learning_rate": 2.3080530020790673e-05, |
| "loss": 0.3352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12197897583246231, |
| "step": 2210, |
| "valid_targets_mean": 2205.6, |
| "valid_targets_min": 577 |
| }, |
| { |
| "epoch": 3.5496794871794872, |
| "grad_norm": 0.7829030632859258, |
| "learning_rate": 2.300154091707731e-05, |
| "loss": 0.299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14087346196174622, |
| "step": 2215, |
| "valid_targets_mean": 2687.8, |
| "valid_targets_min": 1060 |
| }, |
| { |
| "epoch": 3.5576923076923075, |
| "grad_norm": 0.6539140626498782, |
| "learning_rate": 2.2922503886682706e-05, |
| "loss": 0.3002, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12677669525146484, |
| "step": 2220, |
| "valid_targets_mean": 3135.9, |
| "valid_targets_min": 1455 |
| }, |
| { |
| "epoch": 3.565705128205128, |
| "grad_norm": 0.8014167728473969, |
| "learning_rate": 2.28434201916195e-05, |
| "loss": 0.3065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13969087600708008, |
| "step": 2225, |
| "valid_targets_mean": 2349.4, |
| "valid_targets_min": 1233 |
| }, |
| { |
| "epoch": 3.573717948717949, |
| "grad_norm": 0.6940618273966738, |
| "learning_rate": 2.2764291094645446e-05, |
| "loss": 0.3283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17305408418178558, |
| "step": 2230, |
| "valid_targets_mean": 2655.8, |
| "valid_targets_min": 1173 |
| }, |
| { |
| "epoch": 3.581730769230769, |
| "grad_norm": 0.8317185277984226, |
| "learning_rate": 2.2685117859243223e-05, |
| "loss": 0.312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1836153119802475, |
| "step": 2235, |
| "valid_targets_mean": 2955.6, |
| "valid_targets_min": 385 |
| }, |
| { |
| "epoch": 3.58974358974359, |
| "grad_norm": 0.9360794306661345, |
| "learning_rate": 2.2605901749600312e-05, |
| "loss": 0.2841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13323697447776794, |
| "step": 2240, |
| "valid_targets_mean": 1700.8, |
| "valid_targets_min": 1044 |
| }, |
| { |
| "epoch": 3.59775641025641, |
| "grad_norm": 0.9575442006291623, |
| "learning_rate": 2.2526644030588764e-05, |
| "loss": 0.3219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1550298035144806, |
| "step": 2245, |
| "valid_targets_mean": 1732.8, |
| "valid_targets_min": 830 |
| }, |
| { |
| "epoch": 3.605769230769231, |
| "grad_norm": 0.7439293011806408, |
| "learning_rate": 2.2447345967745036e-05, |
| "loss": 0.3063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18119588494300842, |
| "step": 2250, |
| "valid_targets_mean": 3019.4, |
| "valid_targets_min": 1185 |
| }, |
| { |
| "epoch": 3.613782051282051, |
| "grad_norm": 0.7521495969910179, |
| "learning_rate": 2.2368008827249756e-05, |
| "loss": 0.3091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16421186923980713, |
| "step": 2255, |
| "valid_targets_mean": 2975.4, |
| "valid_targets_min": 1097 |
| }, |
| { |
| "epoch": 3.621794871794872, |
| "grad_norm": 0.8618091844527409, |
| "learning_rate": 2.228863387590752e-05, |
| "loss": 0.3061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13043256103992462, |
| "step": 2260, |
| "valid_targets_mean": 1935.0, |
| "valid_targets_min": 1235 |
| }, |
| { |
| "epoch": 3.6298076923076925, |
| "grad_norm": 0.9418809259129349, |
| "learning_rate": 2.2209222381126687e-05, |
| "loss": 0.312, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18692129850387573, |
| "step": 2265, |
| "valid_targets_mean": 3238.5, |
| "valid_targets_min": 1272 |
| }, |
| { |
| "epoch": 3.6378205128205128, |
| "grad_norm": 1.2669863904356735, |
| "learning_rate": 2.212977561089908e-05, |
| "loss": 0.3086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11323244869709015, |
| "step": 2270, |
| "valid_targets_mean": 1818.8, |
| "valid_targets_min": 947 |
| }, |
| { |
| "epoch": 3.6458333333333335, |
| "grad_norm": 0.7178438925925271, |
| "learning_rate": 2.20502948337798e-05, |
| "loss": 0.3093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14442986249923706, |
| "step": 2275, |
| "valid_targets_mean": 2371.1, |
| "valid_targets_min": 1153 |
| }, |
| { |
| "epoch": 3.6538461538461537, |
| "grad_norm": 0.8569782259230551, |
| "learning_rate": 2.1970781318866953e-05, |
| "loss": 0.3256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19485518336296082, |
| "step": 2280, |
| "valid_targets_mean": 2588.1, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 3.6618589743589745, |
| "grad_norm": 2.112497526405271, |
| "learning_rate": 2.1891236335781363e-05, |
| "loss": 0.3152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12906664609909058, |
| "step": 2285, |
| "valid_targets_mean": 2045.6, |
| "valid_targets_min": 1078 |
| }, |
| { |
| "epoch": 3.6698717948717947, |
| "grad_norm": 1.2177253686979004, |
| "learning_rate": 2.1811661154646332e-05, |
| "loss": 0.3239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1536482274532318, |
| "step": 2290, |
| "valid_targets_mean": 1866.0, |
| "valid_targets_min": 1053 |
| }, |
| { |
| "epoch": 3.6778846153846154, |
| "grad_norm": 0.7181600618276615, |
| "learning_rate": 2.173205704606735e-05, |
| "loss": 0.3128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16137897968292236, |
| "step": 2295, |
| "valid_targets_mean": 3668.9, |
| "valid_targets_min": 1970 |
| }, |
| { |
| "epoch": 3.685897435897436, |
| "grad_norm": 0.7682172069784419, |
| "learning_rate": 2.1652425281111785e-05, |
| "loss": 0.2944, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11456585675477982, |
| "step": 2300, |
| "valid_targets_mean": 2416.9, |
| "valid_targets_min": 1804 |
| }, |
| { |
| "epoch": 3.6939102564102564, |
| "grad_norm": 0.894927579310415, |
| "learning_rate": 2.1572767131288607e-05, |
| "loss": 0.2982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12253161519765854, |
| "step": 2305, |
| "valid_targets_mean": 2175.1, |
| "valid_targets_min": 1301 |
| }, |
| { |
| "epoch": 3.7019230769230766, |
| "grad_norm": 0.9030443572331698, |
| "learning_rate": 2.1493083868528095e-05, |
| "loss": 0.3084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16637665033340454, |
| "step": 2310, |
| "valid_targets_mean": 1787.1, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 3.7099358974358974, |
| "grad_norm": 0.8709845006870474, |
| "learning_rate": 2.141337676516151e-05, |
| "loss": 0.292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14325791597366333, |
| "step": 2315, |
| "valid_targets_mean": 2471.1, |
| "valid_targets_min": 1252 |
| }, |
| { |
| "epoch": 3.717948717948718, |
| "grad_norm": 0.7117739613765913, |
| "learning_rate": 2.1333647093900772e-05, |
| "loss": 0.3006, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1770605444908142, |
| "step": 2320, |
| "valid_targets_mean": 3549.5, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 3.7259615384615383, |
| "grad_norm": 0.7878345355183604, |
| "learning_rate": 2.1253896127818175e-05, |
| "loss": 0.3084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0999627634882927, |
| "step": 2325, |
| "valid_targets_mean": 1936.6, |
| "valid_targets_min": 1035 |
| }, |
| { |
| "epoch": 3.733974358974359, |
| "grad_norm": 0.886615512563476, |
| "learning_rate": 2.1174125140326013e-05, |
| "loss": 0.2965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15225833654403687, |
| "step": 2330, |
| "valid_targets_mean": 2917.9, |
| "valid_targets_min": 902 |
| }, |
| { |
| "epoch": 3.7419871794871797, |
| "grad_norm": 0.7335716261401273, |
| "learning_rate": 2.1094335405156277e-05, |
| "loss": 0.3036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13625505566596985, |
| "step": 2335, |
| "valid_targets_mean": 2365.8, |
| "valid_targets_min": 1204 |
| }, |
| { |
| "epoch": 3.75, |
| "grad_norm": 0.8029433347399508, |
| "learning_rate": 2.1014528196340316e-05, |
| "loss": 0.3038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17654207348823547, |
| "step": 2340, |
| "valid_targets_mean": 3089.9, |
| "valid_targets_min": 1638 |
| }, |
| { |
| "epoch": 3.7580128205128203, |
| "grad_norm": 0.813979444044512, |
| "learning_rate": 2.093470478818847e-05, |
| "loss": 0.3084, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17776831984519958, |
| "step": 2345, |
| "valid_targets_mean": 2865.4, |
| "valid_targets_min": 1878 |
| }, |
| { |
| "epoch": 3.766025641025641, |
| "grad_norm": 1.0704643578025568, |
| "learning_rate": 2.0854866455269756e-05, |
| "loss": 0.2992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11565354466438293, |
| "step": 2350, |
| "valid_targets_mean": 2172.4, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 3.7740384615384617, |
| "grad_norm": 0.767664259998352, |
| "learning_rate": 2.0775014472391496e-05, |
| "loss": 0.2908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13974158465862274, |
| "step": 2355, |
| "valid_targets_mean": 2264.8, |
| "valid_targets_min": 383 |
| }, |
| { |
| "epoch": 3.782051282051282, |
| "grad_norm": 0.8116983946381069, |
| "learning_rate": 2.0695150114578958e-05, |
| "loss": 0.3101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17401279509067535, |
| "step": 2360, |
| "valid_targets_mean": 2502.2, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 3.7900641025641026, |
| "grad_norm": 0.838756392734306, |
| "learning_rate": 2.061527465705502e-05, |
| "loss": 0.3042, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1414027363061905, |
| "step": 2365, |
| "valid_targets_mean": 1893.6, |
| "valid_targets_min": 1012 |
| }, |
| { |
| "epoch": 3.7980769230769234, |
| "grad_norm": 0.8116104628684938, |
| "learning_rate": 2.0535389375219773e-05, |
| "loss": 0.2978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1255178451538086, |
| "step": 2370, |
| "valid_targets_mean": 1870.0, |
| "valid_targets_min": 1031 |
| }, |
| { |
| "epoch": 3.8060897435897436, |
| "grad_norm": 0.8119638624612898, |
| "learning_rate": 2.045549554463019e-05, |
| "loss": 0.3111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1506079137325287, |
| "step": 2375, |
| "valid_targets_mean": 2428.9, |
| "valid_targets_min": 868 |
| }, |
| { |
| "epoch": 3.814102564102564, |
| "grad_norm": 0.9284702930461602, |
| "learning_rate": 2.0375594440979744e-05, |
| "loss": 0.303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18719634413719177, |
| "step": 2380, |
| "valid_targets_mean": 2382.8, |
| "valid_targets_min": 1713 |
| }, |
| { |
| "epoch": 3.8221153846153846, |
| "grad_norm": 0.6769878780139562, |
| "learning_rate": 2.0295687340078037e-05, |
| "loss": 0.3036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14017589390277863, |
| "step": 2385, |
| "valid_targets_mean": 2623.1, |
| "valid_targets_min": 1183 |
| }, |
| { |
| "epoch": 3.8301282051282053, |
| "grad_norm": 0.7732324489152704, |
| "learning_rate": 2.0215775517830437e-05, |
| "loss": 0.3015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14514802396297455, |
| "step": 2390, |
| "valid_targets_mean": 2283.8, |
| "valid_targets_min": 1304 |
| }, |
| { |
| "epoch": 3.8381410256410255, |
| "grad_norm": 0.7064375534961691, |
| "learning_rate": 2.013586025021769e-05, |
| "loss": 0.3033, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11343707889318466, |
| "step": 2395, |
| "valid_targets_mean": 2805.6, |
| "valid_targets_min": 1879 |
| }, |
| { |
| "epoch": 3.8461538461538463, |
| "grad_norm": 0.8985980622999645, |
| "learning_rate": 2.0055942813275564e-05, |
| "loss": 0.3196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16325703263282776, |
| "step": 2400, |
| "valid_targets_mean": 2028.1, |
| "valid_targets_min": 975 |
| }, |
| { |
| "epoch": 3.8541666666666665, |
| "grad_norm": 0.794562051071232, |
| "learning_rate": 1.9976024483074456e-05, |
| "loss": 0.31, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.168821781873703, |
| "step": 2405, |
| "valid_targets_mean": 3017.8, |
| "valid_targets_min": 1367 |
| }, |
| { |
| "epoch": 3.8621794871794872, |
| "grad_norm": 0.7169752500616591, |
| "learning_rate": 1.9896106535699025e-05, |
| "loss": 0.3037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15249863266944885, |
| "step": 2410, |
| "valid_targets_mean": 3116.9, |
| "valid_targets_min": 1162 |
| }, |
| { |
| "epoch": 3.8701923076923075, |
| "grad_norm": 1.2976110140884907, |
| "learning_rate": 1.9816190247227834e-05, |
| "loss": 0.3032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1410829871892929, |
| "step": 2415, |
| "valid_targets_mean": 3285.1, |
| "valid_targets_min": 1013 |
| }, |
| { |
| "epoch": 3.878205128205128, |
| "grad_norm": 0.7918220393027592, |
| "learning_rate": 1.9736276893712954e-05, |
| "loss": 0.2845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17646968364715576, |
| "step": 2420, |
| "valid_targets_mean": 2813.5, |
| "valid_targets_min": 1461 |
| }, |
| { |
| "epoch": 3.886217948717949, |
| "grad_norm": 0.9353419692330223, |
| "learning_rate": 1.9656367751159565e-05, |
| "loss": 0.3385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12920579314231873, |
| "step": 2425, |
| "valid_targets_mean": 1474.0, |
| "valid_targets_min": 314 |
| }, |
| { |
| "epoch": 3.894230769230769, |
| "grad_norm": 0.8471014654076914, |
| "learning_rate": 1.957646409550565e-05, |
| "loss": 0.3067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16839198768138885, |
| "step": 2430, |
| "valid_targets_mean": 2648.2, |
| "valid_targets_min": 1082 |
| }, |
| { |
| "epoch": 3.90224358974359, |
| "grad_norm": 0.805711000015817, |
| "learning_rate": 1.9496567202601545e-05, |
| "loss": 0.3216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1253741979598999, |
| "step": 2435, |
| "valid_targets_mean": 1789.8, |
| "valid_targets_min": 1029 |
| }, |
| { |
| "epoch": 3.91025641025641, |
| "grad_norm": 0.7373986082126022, |
| "learning_rate": 1.9416678348189627e-05, |
| "loss": 0.2949, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10667409002780914, |
| "step": 2440, |
| "valid_targets_mean": 2386.0, |
| "valid_targets_min": 928 |
| }, |
| { |
| "epoch": 3.918269230769231, |
| "grad_norm": 0.7887849161507996, |
| "learning_rate": 1.9336798807883907e-05, |
| "loss": 0.3046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14934706687927246, |
| "step": 2445, |
| "valid_targets_mean": 2199.2, |
| "valid_targets_min": 315 |
| }, |
| { |
| "epoch": 3.926282051282051, |
| "grad_norm": 0.7530765328540372, |
| "learning_rate": 1.9256929857149686e-05, |
| "loss": 0.3012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12907078862190247, |
| "step": 2450, |
| "valid_targets_mean": 2505.1, |
| "valid_targets_min": 1049 |
| }, |
| { |
| "epoch": 3.934294871794872, |
| "grad_norm": 0.7605153269941574, |
| "learning_rate": 1.9177072771283167e-05, |
| "loss": 0.3209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18549108505249023, |
| "step": 2455, |
| "valid_targets_mean": 3427.1, |
| "valid_targets_min": 931 |
| }, |
| { |
| "epoch": 3.9423076923076925, |
| "grad_norm": 0.7187662676386029, |
| "learning_rate": 1.9097228825391087e-05, |
| "loss": 0.3087, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18586839735507965, |
| "step": 2460, |
| "valid_targets_mean": 3050.5, |
| "valid_targets_min": 1382 |
| }, |
| { |
| "epoch": 3.9503205128205128, |
| "grad_norm": 0.801030836461524, |
| "learning_rate": 1.9017399294370413e-05, |
| "loss": 0.3008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1393556445837021, |
| "step": 2465, |
| "valid_targets_mean": 2522.4, |
| "valid_targets_min": 1126 |
| }, |
| { |
| "epoch": 3.9583333333333335, |
| "grad_norm": 0.7125978880537887, |
| "learning_rate": 1.893758545288791e-05, |
| "loss": 0.3023, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12806084752082825, |
| "step": 2470, |
| "valid_targets_mean": 2649.1, |
| "valid_targets_min": 956 |
| }, |
| { |
| "epoch": 3.9663461538461537, |
| "grad_norm": 0.733573562499821, |
| "learning_rate": 1.8857788575359847e-05, |
| "loss": 0.3127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16902223229408264, |
| "step": 2475, |
| "valid_targets_mean": 2976.0, |
| "valid_targets_min": 1443 |
| }, |
| { |
| "epoch": 3.9743589743589745, |
| "grad_norm": 0.8286725638748283, |
| "learning_rate": 1.87780099359316e-05, |
| "loss": 0.3069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15555858612060547, |
| "step": 2480, |
| "valid_targets_mean": 2136.1, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 3.9823717948717947, |
| "grad_norm": 0.8013127483982946, |
| "learning_rate": 1.869825080845734e-05, |
| "loss": 0.3007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11979212611913681, |
| "step": 2485, |
| "valid_targets_mean": 1891.2, |
| "valid_targets_min": 1063 |
| }, |
| { |
| "epoch": 3.9903846153846154, |
| "grad_norm": 1.1755524488770757, |
| "learning_rate": 1.8618512466479686e-05, |
| "loss": 0.3176, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11900055408477783, |
| "step": 2490, |
| "valid_targets_mean": 1870.2, |
| "valid_targets_min": 879 |
| }, |
| { |
| "epoch": 3.998397435897436, |
| "grad_norm": 0.7228754958110429, |
| "learning_rate": 1.8538796183209373e-05, |
| "loss": 0.3068, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18811742961406708, |
| "step": 2495, |
| "valid_targets_mean": 3598.2, |
| "valid_targets_min": 2064 |
| }, |
| { |
| "epoch": 4.006410256410256, |
| "grad_norm": 0.8107216208175523, |
| "learning_rate": 1.845910323150491e-05, |
| "loss": 0.2849, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10420330613851547, |
| "step": 2500, |
| "valid_targets_mean": 1475.4, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 4.014423076923077, |
| "grad_norm": 0.7289801458879988, |
| "learning_rate": 1.8379434883852255e-05, |
| "loss": 0.2799, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1149950623512268, |
| "step": 2505, |
| "valid_targets_mean": 2478.2, |
| "valid_targets_min": 1065 |
| }, |
| { |
| "epoch": 4.022435897435898, |
| "grad_norm": 0.6172941964344577, |
| "learning_rate": 1.8299792412344524e-05, |
| "loss": 0.2635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09197504073381424, |
| "step": 2510, |
| "valid_targets_mean": 2993.5, |
| "valid_targets_min": 827 |
| }, |
| { |
| "epoch": 4.030448717948718, |
| "grad_norm": 0.924056863546892, |
| "learning_rate": 1.8220177088661635e-05, |
| "loss": 0.2846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11417260766029358, |
| "step": 2515, |
| "valid_targets_mean": 2422.9, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 4.038461538461538, |
| "grad_norm": 0.7599373898282045, |
| "learning_rate": 1.814059018405004e-05, |
| "loss": 0.267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1344180405139923, |
| "step": 2520, |
| "valid_targets_mean": 2648.2, |
| "valid_targets_min": 1827 |
| }, |
| { |
| "epoch": 4.046474358974359, |
| "grad_norm": 0.847954527866217, |
| "learning_rate": 1.806103296930243e-05, |
| "loss": 0.2749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16294752061367035, |
| "step": 2525, |
| "valid_targets_mean": 2578.5, |
| "valid_targets_min": 1032 |
| }, |
| { |
| "epoch": 4.05448717948718, |
| "grad_norm": 0.7840662540311333, |
| "learning_rate": 1.7981506714737392e-05, |
| "loss": 0.2809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1518925577402115, |
| "step": 2530, |
| "valid_targets_mean": 2867.4, |
| "valid_targets_min": 972 |
| }, |
| { |
| "epoch": 4.0625, |
| "grad_norm": 1.0308185743550442, |
| "learning_rate": 1.7902012690179188e-05, |
| "loss": 0.2912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14089523255825043, |
| "step": 2535, |
| "valid_targets_mean": 1825.4, |
| "valid_targets_min": 972 |
| }, |
| { |
| "epoch": 4.07051282051282, |
| "grad_norm": 1.0080791319366573, |
| "learning_rate": 1.7822552164937437e-05, |
| "loss": 0.2897, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15818694233894348, |
| "step": 2540, |
| "valid_targets_mean": 2121.5, |
| "valid_targets_min": 1100 |
| }, |
| { |
| "epoch": 4.078525641025641, |
| "grad_norm": 0.7700047605910827, |
| "learning_rate": 1.7743126407786873e-05, |
| "loss": 0.2431, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11398568749427795, |
| "step": 2545, |
| "valid_targets_mean": 2395.9, |
| "valid_targets_min": 877 |
| }, |
| { |
| "epoch": 4.086538461538462, |
| "grad_norm": 0.8996747224204145, |
| "learning_rate": 1.766373668694707e-05, |
| "loss": 0.2679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19166290760040283, |
| "step": 2550, |
| "valid_targets_mean": 2388.6, |
| "valid_targets_min": 358 |
| }, |
| { |
| "epoch": 4.094551282051282, |
| "grad_norm": 0.6926397629736457, |
| "learning_rate": 1.7584384270062195e-05, |
| "loss": 0.2503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14995482563972473, |
| "step": 2555, |
| "valid_targets_mean": 3620.6, |
| "valid_targets_min": 995 |
| }, |
| { |
| "epoch": 4.102564102564102, |
| "grad_norm": 0.9135167791555272, |
| "learning_rate": 1.7505070424180772e-05, |
| "loss": 0.2773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13266316056251526, |
| "step": 2560, |
| "valid_targets_mean": 1995.1, |
| "valid_targets_min": 399 |
| }, |
| { |
| "epoch": 4.110576923076923, |
| "grad_norm": 0.6987226388783631, |
| "learning_rate": 1.7425796415735454e-05, |
| "loss": 0.2579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14873361587524414, |
| "step": 2565, |
| "valid_targets_mean": 4161.2, |
| "valid_targets_min": 1467 |
| }, |
| { |
| "epoch": 4.118589743589744, |
| "grad_norm": 0.9300152796838081, |
| "learning_rate": 1.7346563510522783e-05, |
| "loss": 0.2666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14323440194129944, |
| "step": 2570, |
| "valid_targets_mean": 2504.5, |
| "valid_targets_min": 956 |
| }, |
| { |
| "epoch": 4.126602564102564, |
| "grad_norm": 0.9032919810067497, |
| "learning_rate": 1.7267372973682998e-05, |
| "loss": 0.2556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14378081262111664, |
| "step": 2575, |
| "valid_targets_mean": 1905.8, |
| "valid_targets_min": 1172 |
| }, |
| { |
| "epoch": 4.134615384615385, |
| "grad_norm": 0.738179906420384, |
| "learning_rate": 1.7188226069679834e-05, |
| "loss": 0.2651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16808360815048218, |
| "step": 2580, |
| "valid_targets_mean": 3544.9, |
| "valid_targets_min": 1459 |
| }, |
| { |
| "epoch": 4.142628205128205, |
| "grad_norm": 0.8642444098290127, |
| "learning_rate": 1.7109124062280307e-05, |
| "loss": 0.2668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13248826563358307, |
| "step": 2585, |
| "valid_targets_mean": 2062.6, |
| "valid_targets_min": 807 |
| }, |
| { |
| "epoch": 4.1506410256410255, |
| "grad_norm": 0.8868230221130139, |
| "learning_rate": 1.7030068214534567e-05, |
| "loss": 0.273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12323059141635895, |
| "step": 2590, |
| "valid_targets_mean": 2625.6, |
| "valid_targets_min": 1143 |
| }, |
| { |
| "epoch": 4.158653846153846, |
| "grad_norm": 0.8464117069340547, |
| "learning_rate": 1.695105978875572e-05, |
| "loss": 0.2783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1996307373046875, |
| "step": 2595, |
| "valid_targets_mean": 3468.2, |
| "valid_targets_min": 1515 |
| }, |
| { |
| "epoch": 4.166666666666667, |
| "grad_norm": 0.8256615333687891, |
| "learning_rate": 1.687210004649965e-05, |
| "loss": 0.272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13181278109550476, |
| "step": 2600, |
| "valid_targets_mean": 3212.9, |
| "valid_targets_min": 1089 |
| }, |
| { |
| "epoch": 4.174679487179487, |
| "grad_norm": 0.8870269434095935, |
| "learning_rate": 1.679319024854491e-05, |
| "loss": 0.2826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1275901198387146, |
| "step": 2605, |
| "valid_targets_mean": 1700.0, |
| "valid_targets_min": 840 |
| }, |
| { |
| "epoch": 4.1826923076923075, |
| "grad_norm": 0.7677929822500646, |
| "learning_rate": 1.6714331654872564e-05, |
| "loss": 0.2655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13212555646896362, |
| "step": 2610, |
| "valid_targets_mean": 3407.5, |
| "valid_targets_min": 1222 |
| }, |
| { |
| "epoch": 4.190705128205128, |
| "grad_norm": 0.903137572181981, |
| "learning_rate": 1.663552552464609e-05, |
| "loss": 0.2715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18511812388896942, |
| "step": 2615, |
| "valid_targets_mean": 2890.0, |
| "valid_targets_min": 430 |
| }, |
| { |
| "epoch": 4.198717948717949, |
| "grad_norm": 0.8198954378497408, |
| "learning_rate": 1.6556773116191257e-05, |
| "loss": 0.2644, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11871003359556198, |
| "step": 2620, |
| "valid_targets_mean": 2507.9, |
| "valid_targets_min": 1272 |
| }, |
| { |
| "epoch": 4.206730769230769, |
| "grad_norm": 0.8935891481944647, |
| "learning_rate": 1.647807568697603e-05, |
| "loss": 0.2895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1254265010356903, |
| "step": 2625, |
| "valid_targets_mean": 2132.4, |
| "valid_targets_min": 1236 |
| }, |
| { |
| "epoch": 4.214743589743589, |
| "grad_norm": 0.806136169949257, |
| "learning_rate": 1.6399434493590524e-05, |
| "loss": 0.2733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1111583337187767, |
| "step": 2630, |
| "valid_targets_mean": 2298.0, |
| "valid_targets_min": 455 |
| }, |
| { |
| "epoch": 4.222756410256411, |
| "grad_norm": 0.8129392813125258, |
| "learning_rate": 1.6320850791726884e-05, |
| "loss": 0.2888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11087336391210556, |
| "step": 2635, |
| "valid_targets_mean": 2346.0, |
| "valid_targets_min": 1047 |
| }, |
| { |
| "epoch": 4.230769230769231, |
| "grad_norm": 0.7954597693417139, |
| "learning_rate": 1.6242325836159304e-05, |
| "loss": 0.2696, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12124334275722504, |
| "step": 2640, |
| "valid_targets_mean": 2325.2, |
| "valid_targets_min": 1332 |
| }, |
| { |
| "epoch": 4.238782051282051, |
| "grad_norm": 0.7994370389318457, |
| "learning_rate": 1.6163860880723923e-05, |
| "loss": 0.2633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11619360744953156, |
| "step": 2645, |
| "valid_targets_mean": 2158.5, |
| "valid_targets_min": 993 |
| }, |
| { |
| "epoch": 4.246794871794872, |
| "grad_norm": 1.3081684100190851, |
| "learning_rate": 1.6085457178298866e-05, |
| "loss": 0.273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15662749111652374, |
| "step": 2650, |
| "valid_targets_mean": 2542.2, |
| "valid_targets_min": 1074 |
| }, |
| { |
| "epoch": 4.2548076923076925, |
| "grad_norm": 0.9133168019792289, |
| "learning_rate": 1.6007115980784182e-05, |
| "loss": 0.2696, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14592257142066956, |
| "step": 2655, |
| "valid_targets_mean": 2387.5, |
| "valid_targets_min": 896 |
| }, |
| { |
| "epoch": 4.262820512820513, |
| "grad_norm": 0.853360669593718, |
| "learning_rate": 1.592883853908188e-05, |
| "loss": 0.2869, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12176774442195892, |
| "step": 2660, |
| "valid_targets_mean": 2206.1, |
| "valid_targets_min": 328 |
| }, |
| { |
| "epoch": 4.270833333333333, |
| "grad_norm": 0.7599368635884864, |
| "learning_rate": 1.585062610307599e-05, |
| "loss": 0.2694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1838086098432541, |
| "step": 2665, |
| "valid_targets_mean": 3465.8, |
| "valid_targets_min": 1081 |
| }, |
| { |
| "epoch": 4.278846153846154, |
| "grad_norm": 0.8525433719634645, |
| "learning_rate": 1.5772479921612543e-05, |
| "loss": 0.2756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14185798168182373, |
| "step": 2670, |
| "valid_targets_mean": 2654.0, |
| "valid_targets_min": 1737 |
| }, |
| { |
| "epoch": 4.2868589743589745, |
| "grad_norm": 0.7462684034862797, |
| "learning_rate": 1.5694401242479677e-05, |
| "loss": 0.2653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14972269535064697, |
| "step": 2675, |
| "valid_targets_mean": 3185.0, |
| "valid_targets_min": 1101 |
| }, |
| { |
| "epoch": 4.294871794871795, |
| "grad_norm": 1.0578925215532613, |
| "learning_rate": 1.5616391312387683e-05, |
| "loss": 0.2805, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13549691438674927, |
| "step": 2680, |
| "valid_targets_mean": 2258.2, |
| "valid_targets_min": 1204 |
| }, |
| { |
| "epoch": 4.302884615384615, |
| "grad_norm": 0.8648608606389229, |
| "learning_rate": 1.5538451376949106e-05, |
| "loss": 0.2864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1298896223306656, |
| "step": 2685, |
| "valid_targets_mean": 2905.2, |
| "valid_targets_min": 1248 |
| }, |
| { |
| "epoch": 4.310897435897436, |
| "grad_norm": 0.8938045422851925, |
| "learning_rate": 1.5460582680658888e-05, |
| "loss": 0.287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16241608560085297, |
| "step": 2690, |
| "valid_targets_mean": 1907.6, |
| "valid_targets_min": 1285 |
| }, |
| { |
| "epoch": 4.318910256410256, |
| "grad_norm": 0.8098362846204934, |
| "learning_rate": 1.5382786466874446e-05, |
| "loss": 0.2712, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11088044941425323, |
| "step": 2695, |
| "valid_targets_mean": 2425.4, |
| "valid_targets_min": 1100 |
| }, |
| { |
| "epoch": 4.326923076923077, |
| "grad_norm": 0.7618680406015733, |
| "learning_rate": 1.5305063977795856e-05, |
| "loss": 0.2524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10798428952693939, |
| "step": 2700, |
| "valid_targets_mean": 2501.0, |
| "valid_targets_min": 1152 |
| }, |
| { |
| "epoch": 4.334935897435898, |
| "grad_norm": 0.8771021903966155, |
| "learning_rate": 1.5227416454445995e-05, |
| "loss": 0.2763, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12293270230293274, |
| "step": 2705, |
| "valid_targets_mean": 1854.9, |
| "valid_targets_min": 955 |
| }, |
| { |
| "epoch": 4.342948717948718, |
| "grad_norm": 0.8902232258682791, |
| "learning_rate": 1.5149845136650748e-05, |
| "loss": 0.2614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17401179671287537, |
| "step": 2710, |
| "valid_targets_mean": 2398.9, |
| "valid_targets_min": 1217 |
| }, |
| { |
| "epoch": 4.350961538461538, |
| "grad_norm": 0.7400416574631132, |
| "learning_rate": 1.5072351263019177e-05, |
| "loss": 0.2656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13317830860614777, |
| "step": 2715, |
| "valid_targets_mean": 2971.4, |
| "valid_targets_min": 367 |
| }, |
| { |
| "epoch": 4.358974358974359, |
| "grad_norm": 0.8323847921657985, |
| "learning_rate": 1.4994936070923784e-05, |
| "loss": 0.2649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11686371266841888, |
| "step": 2720, |
| "valid_targets_mean": 2373.9, |
| "valid_targets_min": 1433 |
| }, |
| { |
| "epoch": 4.36698717948718, |
| "grad_norm": 0.8564853210865073, |
| "learning_rate": 1.4917600796480745e-05, |
| "loss": 0.2657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.154568150639534, |
| "step": 2725, |
| "valid_targets_mean": 3047.5, |
| "valid_targets_min": 1192 |
| }, |
| { |
| "epoch": 4.375, |
| "grad_norm": 4.516311351290841, |
| "learning_rate": 1.4840346674530122e-05, |
| "loss": 0.2779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10477745532989502, |
| "step": 2730, |
| "valid_targets_mean": 1647.8, |
| "valid_targets_min": 577 |
| }, |
| { |
| "epoch": 4.38301282051282, |
| "grad_norm": 0.8773956755455364, |
| "learning_rate": 1.4763174938616232e-05, |
| "loss": 0.2868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12866738438606262, |
| "step": 2735, |
| "valid_targets_mean": 1814.0, |
| "valid_targets_min": 1064 |
| }, |
| { |
| "epoch": 4.391025641025641, |
| "grad_norm": 0.862173024576601, |
| "learning_rate": 1.4686086820967865e-05, |
| "loss": 0.2803, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10677969455718994, |
| "step": 2740, |
| "valid_targets_mean": 2018.1, |
| "valid_targets_min": 1167 |
| }, |
| { |
| "epoch": 4.399038461538462, |
| "grad_norm": 0.7936422088513276, |
| "learning_rate": 1.460908355247868e-05, |
| "loss": 0.268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0854073315858841, |
| "step": 2745, |
| "valid_targets_mean": 1962.6, |
| "valid_targets_min": 344 |
| }, |
| { |
| "epoch": 4.407051282051282, |
| "grad_norm": 0.7666993392738055, |
| "learning_rate": 1.4532166362687507e-05, |
| "loss": 0.2848, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09944554418325424, |
| "step": 2750, |
| "valid_targets_mean": 2318.1, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 4.415064102564102, |
| "grad_norm": 0.8829285662230825, |
| "learning_rate": 1.445533647975871e-05, |
| "loss": 0.2702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1385907530784607, |
| "step": 2755, |
| "valid_targets_mean": 2788.9, |
| "valid_targets_min": 949 |
| }, |
| { |
| "epoch": 4.423076923076923, |
| "grad_norm": 0.9272776009807071, |
| "learning_rate": 1.437859513046263e-05, |
| "loss": 0.2863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12871670722961426, |
| "step": 2760, |
| "valid_targets_mean": 1785.0, |
| "valid_targets_min": 1228 |
| }, |
| { |
| "epoch": 4.431089743589744, |
| "grad_norm": 0.8347503928560401, |
| "learning_rate": 1.4301943540155914e-05, |
| "loss": 0.2887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12505707144737244, |
| "step": 2765, |
| "valid_targets_mean": 2583.8, |
| "valid_targets_min": 1438 |
| }, |
| { |
| "epoch": 4.439102564102564, |
| "grad_norm": 0.9069365982168227, |
| "learning_rate": 1.4225382932762033e-05, |
| "loss": 0.2655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16004319489002228, |
| "step": 2770, |
| "valid_targets_mean": 2442.6, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 4.447115384615385, |
| "grad_norm": 1.0573384285454255, |
| "learning_rate": 1.4148914530751681e-05, |
| "loss": 0.2858, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17709983885288239, |
| "step": 2775, |
| "valid_targets_mean": 1901.5, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 4.455128205128205, |
| "grad_norm": 0.9369049788177093, |
| "learning_rate": 1.4072539555123292e-05, |
| "loss": 0.2803, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1579183042049408, |
| "step": 2780, |
| "valid_targets_mean": 2392.0, |
| "valid_targets_min": 839 |
| }, |
| { |
| "epoch": 4.4631410256410255, |
| "grad_norm": 0.8913049677040563, |
| "learning_rate": 1.3996259225383514e-05, |
| "loss": 0.2831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1293807029724121, |
| "step": 2785, |
| "valid_targets_mean": 2368.1, |
| "valid_targets_min": 1251 |
| }, |
| { |
| "epoch": 4.471153846153846, |
| "grad_norm": 0.88256947286605, |
| "learning_rate": 1.3920074759527737e-05, |
| "loss": 0.29, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14929986000061035, |
| "step": 2790, |
| "valid_targets_mean": 2416.9, |
| "valid_targets_min": 1440 |
| }, |
| { |
| "epoch": 4.479166666666667, |
| "grad_norm": 0.8160206288790809, |
| "learning_rate": 1.3843987374020689e-05, |
| "loss": 0.3178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14964623749256134, |
| "step": 2795, |
| "valid_targets_mean": 2870.5, |
| "valid_targets_min": 721 |
| }, |
| { |
| "epoch": 4.487179487179487, |
| "grad_norm": 0.8428944555480611, |
| "learning_rate": 1.376799828377696e-05, |
| "loss": 0.2659, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1721874475479126, |
| "step": 2800, |
| "valid_targets_mean": 2782.9, |
| "valid_targets_min": 1694 |
| }, |
| { |
| "epoch": 4.4951923076923075, |
| "grad_norm": 0.8871852280382094, |
| "learning_rate": 1.3692108702141642e-05, |
| "loss": 0.2688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12747956812381744, |
| "step": 2805, |
| "valid_targets_mean": 1721.0, |
| "valid_targets_min": 338 |
| }, |
| { |
| "epoch": 4.503205128205128, |
| "grad_norm": 0.9872908843916991, |
| "learning_rate": 1.361631984087091e-05, |
| "loss": 0.2752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15744715929031372, |
| "step": 2810, |
| "valid_targets_mean": 1939.6, |
| "valid_targets_min": 1134 |
| }, |
| { |
| "epoch": 4.511217948717949, |
| "grad_norm": 0.8580567465549157, |
| "learning_rate": 1.354063291011273e-05, |
| "loss": 0.2632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.130362868309021, |
| "step": 2815, |
| "valid_targets_mean": 2308.5, |
| "valid_targets_min": 1237 |
| }, |
| { |
| "epoch": 4.519230769230769, |
| "grad_norm": 0.7644493527586255, |
| "learning_rate": 1.3465049118387486e-05, |
| "loss": 0.2674, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13236522674560547, |
| "step": 2820, |
| "valid_targets_mean": 2896.8, |
| "valid_targets_min": 1084 |
| }, |
| { |
| "epoch": 4.527243589743589, |
| "grad_norm": 0.9667014319508634, |
| "learning_rate": 1.3389569672568707e-05, |
| "loss": 0.2831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12788935005664825, |
| "step": 2825, |
| "valid_targets_mean": 2036.5, |
| "valid_targets_min": 324 |
| }, |
| { |
| "epoch": 4.535256410256411, |
| "grad_norm": 0.8421523844856508, |
| "learning_rate": 1.331419577786381e-05, |
| "loss": 0.2553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.109443299472332, |
| "step": 2830, |
| "valid_targets_mean": 1979.4, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 4.543269230769231, |
| "grad_norm": 0.744928564210247, |
| "learning_rate": 1.3238928637794816e-05, |
| "loss": 0.2639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11254187673330307, |
| "step": 2835, |
| "valid_targets_mean": 2626.8, |
| "valid_targets_min": 753 |
| }, |
| { |
| "epoch": 4.551282051282051, |
| "grad_norm": 0.975086466256904, |
| "learning_rate": 1.3163769454179183e-05, |
| "loss": 0.2768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1786927580833435, |
| "step": 2840, |
| "valid_targets_mean": 2314.1, |
| "valid_targets_min": 1070 |
| }, |
| { |
| "epoch": 4.559294871794872, |
| "grad_norm": 0.7209383245592558, |
| "learning_rate": 1.3088719427110552e-05, |
| "loss": 0.266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08105504512786865, |
| "step": 2845, |
| "valid_targets_mean": 2961.5, |
| "valid_targets_min": 1371 |
| }, |
| { |
| "epoch": 4.5673076923076925, |
| "grad_norm": 0.7810108736494066, |
| "learning_rate": 1.3013779754939666e-05, |
| "loss": 0.2735, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14913949370384216, |
| "step": 2850, |
| "valid_targets_mean": 2757.1, |
| "valid_targets_min": 1361 |
| }, |
| { |
| "epoch": 4.575320512820513, |
| "grad_norm": 0.8254385625250282, |
| "learning_rate": 1.2938951634255164e-05, |
| "loss": 0.2989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1645059883594513, |
| "step": 2855, |
| "valid_targets_mean": 3087.0, |
| "valid_targets_min": 1169 |
| }, |
| { |
| "epoch": 4.583333333333333, |
| "grad_norm": 0.7306018923704536, |
| "learning_rate": 1.2864236259864495e-05, |
| "loss": 0.2603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11817409098148346, |
| "step": 2860, |
| "valid_targets_mean": 2937.9, |
| "valid_targets_min": 371 |
| }, |
| { |
| "epoch": 4.591346153846154, |
| "grad_norm": 0.7477590617323558, |
| "learning_rate": 1.2789634824774887e-05, |
| "loss": 0.2722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12819048762321472, |
| "step": 2865, |
| "valid_targets_mean": 2968.5, |
| "valid_targets_min": 1499 |
| }, |
| { |
| "epoch": 4.5993589743589745, |
| "grad_norm": 0.728894279788435, |
| "learning_rate": 1.2715148520174206e-05, |
| "loss": 0.2687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12905170023441315, |
| "step": 2870, |
| "valid_targets_mean": 3541.0, |
| "valid_targets_min": 1720 |
| }, |
| { |
| "epoch": 4.607371794871795, |
| "grad_norm": 0.744918036805367, |
| "learning_rate": 1.2640778535412036e-05, |
| "loss": 0.2645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10740716010332108, |
| "step": 2875, |
| "valid_targets_mean": 2260.5, |
| "valid_targets_min": 879 |
| }, |
| { |
| "epoch": 4.615384615384615, |
| "grad_norm": 0.8997924981650226, |
| "learning_rate": 1.2566526057980608e-05, |
| "loss": 0.2517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1263289749622345, |
| "step": 2880, |
| "valid_targets_mean": 2141.9, |
| "valid_targets_min": 979 |
| }, |
| { |
| "epoch": 4.623397435897436, |
| "grad_norm": 0.7732205590951574, |
| "learning_rate": 1.2492392273495879e-05, |
| "loss": 0.2626, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1344079226255417, |
| "step": 2885, |
| "valid_targets_mean": 3042.1, |
| "valid_targets_min": 1931 |
| }, |
| { |
| "epoch": 4.631410256410256, |
| "grad_norm": 0.9244368747106443, |
| "learning_rate": 1.2418378365678612e-05, |
| "loss": 0.2776, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18506968021392822, |
| "step": 2890, |
| "valid_targets_mean": 2340.2, |
| "valid_targets_min": 1257 |
| }, |
| { |
| "epoch": 4.639423076923077, |
| "grad_norm": 0.981906856635814, |
| "learning_rate": 1.234448551633542e-05, |
| "loss": 0.2707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11560280621051788, |
| "step": 2895, |
| "valid_targets_mean": 1585.2, |
| "valid_targets_min": 1039 |
| }, |
| { |
| "epoch": 4.647435897435898, |
| "grad_norm": 0.9031224981302811, |
| "learning_rate": 1.2270714905339969e-05, |
| "loss": 0.2716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11820649355649948, |
| "step": 2900, |
| "valid_targets_mean": 2263.9, |
| "valid_targets_min": 482 |
| }, |
| { |
| "epoch": 4.655448717948718, |
| "grad_norm": 0.8745154308021823, |
| "learning_rate": 1.2197067710614075e-05, |
| "loss": 0.2798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09645086526870728, |
| "step": 2905, |
| "valid_targets_mean": 1823.5, |
| "valid_targets_min": 945 |
| }, |
| { |
| "epoch": 4.663461538461538, |
| "grad_norm": 0.8245554409210525, |
| "learning_rate": 1.2123545108108943e-05, |
| "loss": 0.2887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12594664096832275, |
| "step": 2910, |
| "valid_targets_mean": 2744.8, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 4.671474358974359, |
| "grad_norm": 0.829115549908771, |
| "learning_rate": 1.2050148271786348e-05, |
| "loss": 0.2912, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15721480548381805, |
| "step": 2915, |
| "valid_targets_mean": 3267.1, |
| "valid_targets_min": 1111 |
| }, |
| { |
| "epoch": 4.67948717948718, |
| "grad_norm": 0.846511250803801, |
| "learning_rate": 1.1976878373599928e-05, |
| "loss": 0.2866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14120858907699585, |
| "step": 2920, |
| "valid_targets_mean": 2450.1, |
| "valid_targets_min": 1375 |
| }, |
| { |
| "epoch": 4.6875, |
| "grad_norm": 0.7975341835970318, |
| "learning_rate": 1.1903736583476441e-05, |
| "loss": 0.2745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14211896061897278, |
| "step": 2925, |
| "valid_targets_mean": 2471.6, |
| "valid_targets_min": 1047 |
| }, |
| { |
| "epoch": 4.69551282051282, |
| "grad_norm": 0.9078900951131141, |
| "learning_rate": 1.1830724069297106e-05, |
| "loss": 0.2676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13938596844673157, |
| "step": 2930, |
| "valid_targets_mean": 2080.9, |
| "valid_targets_min": 1256 |
| }, |
| { |
| "epoch": 4.703525641025641, |
| "grad_norm": 0.8028681041530895, |
| "learning_rate": 1.1757841996878957e-05, |
| "loss": 0.287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11330582201480865, |
| "step": 2935, |
| "valid_targets_mean": 2032.8, |
| "valid_targets_min": 1029 |
| }, |
| { |
| "epoch": 4.711538461538462, |
| "grad_norm": 0.8363540894412191, |
| "learning_rate": 1.1685091529956187e-05, |
| "loss": 0.2676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15411382913589478, |
| "step": 2940, |
| "valid_targets_mean": 2787.2, |
| "valid_targets_min": 1093 |
| }, |
| { |
| "epoch": 4.719551282051282, |
| "grad_norm": 0.912460705122893, |
| "learning_rate": 1.161247383016163e-05, |
| "loss": 0.2818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16072651743888855, |
| "step": 2945, |
| "valid_targets_mean": 2128.5, |
| "valid_targets_min": 966 |
| }, |
| { |
| "epoch": 4.727564102564102, |
| "grad_norm": 0.7499400173047096, |
| "learning_rate": 1.1539990057008166e-05, |
| "loss": 0.285, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10620361566543579, |
| "step": 2950, |
| "valid_targets_mean": 2388.1, |
| "valid_targets_min": 1203 |
| }, |
| { |
| "epoch": 4.735576923076923, |
| "grad_norm": 0.9237353949311389, |
| "learning_rate": 1.1467641367870198e-05, |
| "loss": 0.2644, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11121618747711182, |
| "step": 2955, |
| "valid_targets_mean": 1521.9, |
| "valid_targets_min": 937 |
| }, |
| { |
| "epoch": 4.743589743589744, |
| "grad_norm": 0.8205670496593648, |
| "learning_rate": 1.1395428917965239e-05, |
| "loss": 0.2633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14764776825904846, |
| "step": 2960, |
| "valid_targets_mean": 2725.4, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 4.751602564102564, |
| "grad_norm": 0.9098777718387225, |
| "learning_rate": 1.1323353860335385e-05, |
| "loss": 0.2838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15366676449775696, |
| "step": 2965, |
| "valid_targets_mean": 2146.5, |
| "valid_targets_min": 1034 |
| }, |
| { |
| "epoch": 4.759615384615385, |
| "grad_norm": 0.8551265905437225, |
| "learning_rate": 1.1251417345828962e-05, |
| "loss": 0.2948, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20508478581905365, |
| "step": 2970, |
| "valid_targets_mean": 3284.0, |
| "valid_targets_min": 1291 |
| }, |
| { |
| "epoch": 4.767628205128205, |
| "grad_norm": 0.8632459584174168, |
| "learning_rate": 1.1179620523082107e-05, |
| "loss": 0.278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15938019752502441, |
| "step": 2975, |
| "valid_targets_mean": 2744.9, |
| "valid_targets_min": 1368 |
| }, |
| { |
| "epoch": 4.7756410256410255, |
| "grad_norm": 0.8257591086160776, |
| "learning_rate": 1.110796453850047e-05, |
| "loss": 0.2649, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13130192458629608, |
| "step": 2980, |
| "valid_targets_mean": 2265.9, |
| "valid_targets_min": 1378 |
| }, |
| { |
| "epoch": 4.783653846153846, |
| "grad_norm": 0.8559905279176463, |
| "learning_rate": 1.1036450536240877e-05, |
| "loss": 0.2744, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14812210202217102, |
| "step": 2985, |
| "valid_targets_mean": 2335.5, |
| "valid_targets_min": 403 |
| }, |
| { |
| "epoch": 4.791666666666667, |
| "grad_norm": 0.7527787079235052, |
| "learning_rate": 1.0965079658193068e-05, |
| "loss": 0.2754, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13627628982067108, |
| "step": 2990, |
| "valid_targets_mean": 3166.6, |
| "valid_targets_min": 966 |
| }, |
| { |
| "epoch": 4.799679487179487, |
| "grad_norm": 0.9363191867774112, |
| "learning_rate": 1.0893853043961475e-05, |
| "loss": 0.2661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15567584335803986, |
| "step": 2995, |
| "valid_targets_mean": 2027.8, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 4.8076923076923075, |
| "grad_norm": 0.8073681066642808, |
| "learning_rate": 1.0822771830847011e-05, |
| "loss": 0.2645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09198524802923203, |
| "step": 3000, |
| "valid_targets_mean": 1890.8, |
| "valid_targets_min": 218 |
| }, |
| { |
| "epoch": 4.815705128205128, |
| "grad_norm": 0.988773013105684, |
| "learning_rate": 1.0751837153828926e-05, |
| "loss": 0.2683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13376572728157043, |
| "step": 3005, |
| "valid_targets_mean": 1561.8, |
| "valid_targets_min": 1034 |
| }, |
| { |
| "epoch": 4.823717948717949, |
| "grad_norm": 0.9762413699290895, |
| "learning_rate": 1.0681050145546666e-05, |
| "loss": 0.2865, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14275820553302765, |
| "step": 3010, |
| "valid_targets_mean": 2047.4, |
| "valid_targets_min": 1062 |
| }, |
| { |
| "epoch": 4.831730769230769, |
| "grad_norm": 0.9275506661578156, |
| "learning_rate": 1.0610411936281801e-05, |
| "loss": 0.281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15121185779571533, |
| "step": 3015, |
| "valid_targets_mean": 2387.4, |
| "valid_targets_min": 1138 |
| }, |
| { |
| "epoch": 4.839743589743589, |
| "grad_norm": 1.186762101396794, |
| "learning_rate": 1.0539923653939978e-05, |
| "loss": 0.2635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14785534143447876, |
| "step": 3020, |
| "valid_targets_mean": 2331.1, |
| "valid_targets_min": 260 |
| }, |
| { |
| "epoch": 4.847756410256411, |
| "grad_norm": 0.7972641980595226, |
| "learning_rate": 1.0469586424032903e-05, |
| "loss": 0.278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11366459727287292, |
| "step": 3025, |
| "valid_targets_mean": 2833.2, |
| "valid_targets_min": 1378 |
| }, |
| { |
| "epoch": 4.855769230769231, |
| "grad_norm": 0.787773519783044, |
| "learning_rate": 1.0399401369660369e-05, |
| "loss": 0.2588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12477640807628632, |
| "step": 3030, |
| "valid_targets_mean": 2976.5, |
| "valid_targets_min": 1412 |
| }, |
| { |
| "epoch": 4.863782051282051, |
| "grad_norm": 1.077467606380259, |
| "learning_rate": 1.0329369611492334e-05, |
| "loss": 0.2799, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13085028529167175, |
| "step": 3035, |
| "valid_targets_mean": 1301.2, |
| "valid_targets_min": 903 |
| }, |
| { |
| "epoch": 4.871794871794872, |
| "grad_norm": 0.779085250047778, |
| "learning_rate": 1.0259492267751022e-05, |
| "loss": 0.2683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09794454276561737, |
| "step": 3040, |
| "valid_targets_mean": 2191.4, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 4.8798076923076925, |
| "grad_norm": 0.772242896624771, |
| "learning_rate": 1.0189770454193052e-05, |
| "loss": 0.2655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09873206913471222, |
| "step": 3045, |
| "valid_targets_mean": 1930.6, |
| "valid_targets_min": 998 |
| }, |
| { |
| "epoch": 4.887820512820513, |
| "grad_norm": 0.9599867450295364, |
| "learning_rate": 1.0120205284091673e-05, |
| "loss": 0.2858, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11163206398487091, |
| "step": 3050, |
| "valid_targets_mean": 1916.6, |
| "valid_targets_min": 1115 |
| }, |
| { |
| "epoch": 4.895833333333333, |
| "grad_norm": 0.7918817935809193, |
| "learning_rate": 1.0050797868218907e-05, |
| "loss": 0.2591, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1077142059803009, |
| "step": 3055, |
| "valid_targets_mean": 2029.9, |
| "valid_targets_min": 1202 |
| }, |
| { |
| "epoch": 4.903846153846154, |
| "grad_norm": 1.0640408645767745, |
| "learning_rate": 9.981549314827876e-06, |
| "loss": 0.2627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15119090676307678, |
| "step": 3060, |
| "valid_targets_mean": 2257.6, |
| "valid_targets_min": 1607 |
| }, |
| { |
| "epoch": 4.9118589743589745, |
| "grad_norm": 0.9302729531429398, |
| "learning_rate": 9.912460729635097e-06, |
| "loss": 0.2607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1315920054912567, |
| "step": 3065, |
| "valid_targets_mean": 2105.0, |
| "valid_targets_min": 1408 |
| }, |
| { |
| "epoch": 4.919871794871795, |
| "grad_norm": 0.9369289493805716, |
| "learning_rate": 9.843533215802796e-06, |
| "loss": 0.2706, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15253514051437378, |
| "step": 3070, |
| "valid_targets_mean": 2191.6, |
| "valid_targets_min": 1061 |
| }, |
| { |
| "epoch": 4.927884615384615, |
| "grad_norm": 0.844646606230592, |
| "learning_rate": 9.774767873921357e-06, |
| "loss": 0.2723, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.137139230966568, |
| "step": 3075, |
| "valid_targets_mean": 2565.4, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 4.935897435897436, |
| "grad_norm": 2.329062257750856, |
| "learning_rate": 9.706165801991651e-06, |
| "loss": 0.2711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13304753601551056, |
| "step": 3080, |
| "valid_targets_mean": 1838.1, |
| "valid_targets_min": 795 |
| }, |
| { |
| "epoch": 4.943910256410256, |
| "grad_norm": 0.853413187103336, |
| "learning_rate": 9.637728095407593e-06, |
| "loss": 0.2421, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12307369709014893, |
| "step": 3085, |
| "valid_targets_mean": 2275.2, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 4.951923076923077, |
| "grad_norm": 0.8149656643934992, |
| "learning_rate": 9.56945584693861e-06, |
| "loss": 0.2665, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14071014523506165, |
| "step": 3090, |
| "valid_targets_mean": 2706.8, |
| "valid_targets_min": 1006 |
| }, |
| { |
| "epoch": 4.959935897435898, |
| "grad_norm": 0.8879281552541326, |
| "learning_rate": 9.501350146712193e-06, |
| "loss": 0.2833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16927888989448547, |
| "step": 3095, |
| "valid_targets_mean": 2713.2, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 4.967948717948718, |
| "grad_norm": 0.8421674616911554, |
| "learning_rate": 9.433412082196527e-06, |
| "loss": 0.278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15744885802268982, |
| "step": 3100, |
| "valid_targets_mean": 2638.9, |
| "valid_targets_min": 966 |
| }, |
| { |
| "epoch": 4.975961538461538, |
| "grad_norm": 0.8600840077890818, |
| "learning_rate": 9.365642738183044e-06, |
| "loss": 0.2627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.104631707072258, |
| "step": 3105, |
| "valid_targets_mean": 1865.5, |
| "valid_targets_min": 447 |
| }, |
| { |
| "epoch": 4.983974358974359, |
| "grad_norm": 0.8348297609388227, |
| "learning_rate": 9.298043196769217e-06, |
| "loss": 0.259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13417679071426392, |
| "step": 3110, |
| "valid_targets_mean": 2495.9, |
| "valid_targets_min": 1227 |
| }, |
| { |
| "epoch": 4.99198717948718, |
| "grad_norm": 9.580138479223857, |
| "learning_rate": 9.230614537341167e-06, |
| "loss": 0.2797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1282835602760315, |
| "step": 3115, |
| "valid_targets_mean": 2251.1, |
| "valid_targets_min": 1236 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.8722530383797718, |
| "learning_rate": 9.163357836556498e-06, |
| "loss": 0.2589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1430858075618744, |
| "step": 3120, |
| "valid_targets_mean": 2250.0, |
| "valid_targets_min": 360 |
| }, |
| { |
| "epoch": 5.00801282051282, |
| "grad_norm": 0.760262997035743, |
| "learning_rate": 9.096274168327122e-06, |
| "loss": 0.2711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11211199313402176, |
| "step": 3125, |
| "valid_targets_mean": 2454.6, |
| "valid_targets_min": 1559 |
| }, |
| { |
| "epoch": 5.016025641025641, |
| "grad_norm": 0.8081201546727087, |
| "learning_rate": 9.029364603802017e-06, |
| "loss": 0.2593, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12468785047531128, |
| "step": 3130, |
| "valid_targets_mean": 2825.5, |
| "valid_targets_min": 964 |
| }, |
| { |
| "epoch": 5.024038461538462, |
| "grad_norm": 0.9144227586011615, |
| "learning_rate": 8.962630211350248e-06, |
| "loss": 0.2531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11245831847190857, |
| "step": 3135, |
| "valid_targets_mean": 2072.0, |
| "valid_targets_min": 1201 |
| }, |
| { |
| "epoch": 5.032051282051282, |
| "grad_norm": 0.8415836808622785, |
| "learning_rate": 8.89607205654378e-06, |
| "loss": 0.2656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21187756955623627, |
| "step": 3140, |
| "valid_targets_mean": 3681.8, |
| "valid_targets_min": 1378 |
| }, |
| { |
| "epoch": 5.040064102564102, |
| "grad_norm": 1.0690915033438144, |
| "learning_rate": 8.829691202140591e-06, |
| "loss": 0.2566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0969729870557785, |
| "step": 3145, |
| "valid_targets_mean": 1514.1, |
| "valid_targets_min": 498 |
| }, |
| { |
| "epoch": 5.048076923076923, |
| "grad_norm": 0.888331771783694, |
| "learning_rate": 8.763488708067604e-06, |
| "loss": 0.2521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12027233839035034, |
| "step": 3150, |
| "valid_targets_mean": 2255.6, |
| "valid_targets_min": 955 |
| }, |
| { |
| "epoch": 5.056089743589744, |
| "grad_norm": 0.8115419127246998, |
| "learning_rate": 8.69746563140379e-06, |
| "loss": 0.2514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13751327991485596, |
| "step": 3155, |
| "valid_targets_mean": 3138.2, |
| "valid_targets_min": 925 |
| }, |
| { |
| "epoch": 5.064102564102564, |
| "grad_norm": 0.880802924767822, |
| "learning_rate": 8.631623026363331e-06, |
| "loss": 0.2441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09337887912988663, |
| "step": 3160, |
| "valid_targets_mean": 1815.4, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 5.072115384615385, |
| "grad_norm": 0.8526126585543974, |
| "learning_rate": 8.56596194427873e-06, |
| "loss": 0.2534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10085926949977875, |
| "step": 3165, |
| "valid_targets_mean": 1936.5, |
| "valid_targets_min": 1147 |
| }, |
| { |
| "epoch": 5.080128205128205, |
| "grad_norm": 0.865864615519599, |
| "learning_rate": 8.500483433584054e-06, |
| "loss": 0.247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11514122039079666, |
| "step": 3170, |
| "valid_targets_mean": 2888.1, |
| "valid_targets_min": 1666 |
| }, |
| { |
| "epoch": 5.0881410256410255, |
| "grad_norm": 0.8633744921019645, |
| "learning_rate": 8.435188539798187e-06, |
| "loss": 0.2695, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16413256525993347, |
| "step": 3175, |
| "valid_targets_mean": 3507.0, |
| "valid_targets_min": 1585 |
| }, |
| { |
| "epoch": 5.096153846153846, |
| "grad_norm": 0.7489172858590697, |
| "learning_rate": 8.370078305508136e-06, |
| "loss": 0.2302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1103079617023468, |
| "step": 3180, |
| "valid_targets_mean": 3308.8, |
| "valid_targets_min": 1774 |
| }, |
| { |
| "epoch": 5.104166666666667, |
| "grad_norm": 0.7761189735769272, |
| "learning_rate": 8.305153770352384e-06, |
| "loss": 0.2555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10959683358669281, |
| "step": 3185, |
| "valid_targets_mean": 3496.6, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 5.112179487179487, |
| "grad_norm": 0.953121153374897, |
| "learning_rate": 8.240415971004285e-06, |
| "loss": 0.2404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14587818086147308, |
| "step": 3190, |
| "valid_targets_mean": 2079.8, |
| "valid_targets_min": 1043 |
| }, |
| { |
| "epoch": 5.1201923076923075, |
| "grad_norm": 0.8994783360343982, |
| "learning_rate": 8.175865941155525e-06, |
| "loss": 0.2364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11071066558361053, |
| "step": 3195, |
| "valid_targets_mean": 2350.0, |
| "valid_targets_min": 1123 |
| }, |
| { |
| "epoch": 5.128205128205128, |
| "grad_norm": 0.8639406630796981, |
| "learning_rate": 8.111504711499598e-06, |
| "loss": 0.2537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15387535095214844, |
| "step": 3200, |
| "valid_targets_mean": 3171.8, |
| "valid_targets_min": 1809 |
| }, |
| { |
| "epoch": 5.136217948717949, |
| "grad_norm": 0.8743544692197517, |
| "learning_rate": 8.04733330971536e-06, |
| "loss": 0.2608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12671324610710144, |
| "step": 3205, |
| "valid_targets_mean": 2485.6, |
| "valid_targets_min": 1268 |
| }, |
| { |
| "epoch": 5.144230769230769, |
| "grad_norm": 0.9582632299000284, |
| "learning_rate": 7.983352760450618e-06, |
| "loss": 0.2571, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11250822991132736, |
| "step": 3210, |
| "valid_targets_mean": 1896.8, |
| "valid_targets_min": 554 |
| }, |
| { |
| "epoch": 5.152243589743589, |
| "grad_norm": 0.9124958970924283, |
| "learning_rate": 7.919564085305768e-06, |
| "loss": 0.2553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11880991607904434, |
| "step": 3215, |
| "valid_targets_mean": 2402.8, |
| "valid_targets_min": 1805 |
| }, |
| { |
| "epoch": 5.160256410256411, |
| "grad_norm": 0.809203448407432, |
| "learning_rate": 7.855968302817487e-06, |
| "loss": 0.2553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1249704360961914, |
| "step": 3220, |
| "valid_targets_mean": 2293.9, |
| "valid_targets_min": 314 |
| }, |
| { |
| "epoch": 5.168269230769231, |
| "grad_norm": 1.0224736881905714, |
| "learning_rate": 7.792566428442456e-06, |
| "loss": 0.2552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1433626413345337, |
| "step": 3225, |
| "valid_targets_mean": 2055.8, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 5.176282051282051, |
| "grad_norm": 0.828565366523305, |
| "learning_rate": 7.729359474541168e-06, |
| "loss": 0.2411, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12695926427841187, |
| "step": 3230, |
| "valid_targets_mean": 3304.5, |
| "valid_targets_min": 1022 |
| }, |
| { |
| "epoch": 5.184294871794872, |
| "grad_norm": 1.0703527171317921, |
| "learning_rate": 7.666348450361737e-06, |
| "loss": 0.2423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17552143335342407, |
| "step": 3235, |
| "valid_targets_mean": 2147.1, |
| "valid_targets_min": 922 |
| }, |
| { |
| "epoch": 5.1923076923076925, |
| "grad_norm": 0.8629077122279247, |
| "learning_rate": 7.60353436202381e-06, |
| "loss": 0.2335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12918856739997864, |
| "step": 3240, |
| "valid_targets_mean": 2890.6, |
| "valid_targets_min": 1021 |
| }, |
| { |
| "epoch": 5.200320512820513, |
| "grad_norm": 0.7496627630060603, |
| "learning_rate": 7.540918212502479e-06, |
| "loss": 0.2425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11419525742530823, |
| "step": 3245, |
| "valid_targets_mean": 3239.9, |
| "valid_targets_min": 903 |
| }, |
| { |
| "epoch": 5.208333333333333, |
| "grad_norm": 0.9516986948209849, |
| "learning_rate": 7.478501001612281e-06, |
| "loss": 0.2642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10599060356616974, |
| "step": 3250, |
| "valid_targets_mean": 2018.6, |
| "valid_targets_min": 1264 |
| }, |
| { |
| "epoch": 5.216346153846154, |
| "grad_norm": 0.8786538617105409, |
| "learning_rate": 7.416283725991229e-06, |
| "loss": 0.2442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13649001717567444, |
| "step": 3255, |
| "valid_targets_mean": 2654.9, |
| "valid_targets_min": 974 |
| }, |
| { |
| "epoch": 5.2243589743589745, |
| "grad_norm": 0.7547164045773196, |
| "learning_rate": 7.354267379084896e-06, |
| "loss": 0.2375, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11847176402807236, |
| "step": 3260, |
| "valid_targets_mean": 3161.9, |
| "valid_targets_min": 1418 |
| }, |
| { |
| "epoch": 5.232371794871795, |
| "grad_norm": 0.8827711281808431, |
| "learning_rate": 7.292452951130548e-06, |
| "loss": 0.2478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11796671152114868, |
| "step": 3265, |
| "valid_targets_mean": 2813.1, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 5.240384615384615, |
| "grad_norm": 0.991683934378518, |
| "learning_rate": 7.230841429141347e-06, |
| "loss": 0.2528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11138557642698288, |
| "step": 3270, |
| "valid_targets_mean": 1707.8, |
| "valid_targets_min": 779 |
| }, |
| { |
| "epoch": 5.248397435897436, |
| "grad_norm": 0.8413292996210097, |
| "learning_rate": 7.169433796890595e-06, |
| "loss": 0.2585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11664022505283356, |
| "step": 3275, |
| "valid_targets_mean": 2805.9, |
| "valid_targets_min": 1887 |
| }, |
| { |
| "epoch": 5.256410256410256, |
| "grad_norm": 0.8481142716287121, |
| "learning_rate": 7.108231034895976e-06, |
| "loss": 0.2545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12616068124771118, |
| "step": 3280, |
| "valid_targets_mean": 2882.4, |
| "valid_targets_min": 1045 |
| }, |
| { |
| "epoch": 5.264423076923077, |
| "grad_norm": 0.7422363717208107, |
| "learning_rate": 7.047234120403972e-06, |
| "loss": 0.2453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07960276305675507, |
| "step": 3285, |
| "valid_targets_mean": 2813.0, |
| "valid_targets_min": 830 |
| }, |
| { |
| "epoch": 5.272435897435898, |
| "grad_norm": 0.9631783328404132, |
| "learning_rate": 6.986444027374211e-06, |
| "loss": 0.2565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10581400245428085, |
| "step": 3290, |
| "valid_targets_mean": 1969.2, |
| "valid_targets_min": 473 |
| }, |
| { |
| "epoch": 5.280448717948718, |
| "grad_norm": 0.9641249779597492, |
| "learning_rate": 6.925861726463919e-06, |
| "loss": 0.2488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12430629134178162, |
| "step": 3295, |
| "valid_targets_mean": 2351.1, |
| "valid_targets_min": 1181 |
| }, |
| { |
| "epoch": 5.288461538461538, |
| "grad_norm": 0.9412615692571877, |
| "learning_rate": 6.865488185012464e-06, |
| "loss": 0.2898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1612430363893509, |
| "step": 3300, |
| "valid_targets_mean": 2558.1, |
| "valid_targets_min": 1309 |
| }, |
| { |
| "epoch": 5.296474358974359, |
| "grad_norm": 1.0509911379396097, |
| "learning_rate": 6.805324367025825e-06, |
| "loss": 0.2505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11822021007537842, |
| "step": 3305, |
| "valid_targets_mean": 1644.9, |
| "valid_targets_min": 299 |
| }, |
| { |
| "epoch": 5.30448717948718, |
| "grad_norm": 0.8553682205085341, |
| "learning_rate": 6.745371233161309e-06, |
| "loss": 0.249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13173708319664001, |
| "step": 3310, |
| "valid_targets_mean": 2514.2, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 5.3125, |
| "grad_norm": 0.7609829443446366, |
| "learning_rate": 6.685629740712103e-06, |
| "loss": 0.2439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1069406270980835, |
| "step": 3315, |
| "valid_targets_mean": 2430.6, |
| "valid_targets_min": 1418 |
| }, |
| { |
| "epoch": 5.32051282051282, |
| "grad_norm": 0.8915994872025942, |
| "learning_rate": 6.6261008435920605e-06, |
| "loss": 0.2464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11810167878866196, |
| "step": 3320, |
| "valid_targets_mean": 2207.5, |
| "valid_targets_min": 1348 |
| }, |
| { |
| "epoch": 5.328525641025641, |
| "grad_norm": 0.9796125193027324, |
| "learning_rate": 6.566785492320471e-06, |
| "loss": 0.2596, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13730502128601074, |
| "step": 3325, |
| "valid_targets_mean": 1870.9, |
| "valid_targets_min": 1223 |
| }, |
| { |
| "epoch": 5.336538461538462, |
| "grad_norm": 0.8717267812917334, |
| "learning_rate": 6.507684634006815e-06, |
| "loss": 0.2306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1494694948196411, |
| "step": 3330, |
| "valid_targets_mean": 2862.1, |
| "valid_targets_min": 1343 |
| }, |
| { |
| "epoch": 5.344551282051282, |
| "grad_norm": 0.7268347262067547, |
| "learning_rate": 6.448799212335734e-06, |
| "loss": 0.2438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09736894816160202, |
| "step": 3335, |
| "valid_targets_mean": 3054.6, |
| "valid_targets_min": 979 |
| }, |
| { |
| "epoch": 5.352564102564102, |
| "grad_norm": 0.9759718449339392, |
| "learning_rate": 6.390130167551869e-06, |
| "loss": 0.2376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11273542046546936, |
| "step": 3340, |
| "valid_targets_mean": 1938.5, |
| "valid_targets_min": 1000 |
| }, |
| { |
| "epoch": 5.360576923076923, |
| "grad_norm": 0.9594102043664786, |
| "learning_rate": 6.331678436444939e-06, |
| "loss": 0.2497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13123399019241333, |
| "step": 3345, |
| "valid_targets_mean": 2063.9, |
| "valid_targets_min": 994 |
| }, |
| { |
| "epoch": 5.368589743589744, |
| "grad_norm": 1.1783899265802422, |
| "learning_rate": 6.273444952334713e-06, |
| "loss": 0.255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1367177963256836, |
| "step": 3350, |
| "valid_targets_mean": 1565.1, |
| "valid_targets_min": 945 |
| }, |
| { |
| "epoch": 5.376602564102564, |
| "grad_norm": 0.9688205506455062, |
| "learning_rate": 6.2154306450561175e-06, |
| "loss": 0.2452, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14453257620334625, |
| "step": 3355, |
| "valid_targets_mean": 2148.6, |
| "valid_targets_min": 1155 |
| }, |
| { |
| "epoch": 5.384615384615385, |
| "grad_norm": 0.8744646444334985, |
| "learning_rate": 6.157636440944445e-06, |
| "loss": 0.2412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11924951523542404, |
| "step": 3360, |
| "valid_targets_mean": 2748.2, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 5.392628205128205, |
| "grad_norm": 0.9862735226573559, |
| "learning_rate": 6.100063262820474e-06, |
| "loss": 0.2568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15304933488368988, |
| "step": 3365, |
| "valid_targets_mean": 2384.2, |
| "valid_targets_min": 851 |
| }, |
| { |
| "epoch": 5.4006410256410255, |
| "grad_norm": 0.9764993056093113, |
| "learning_rate": 6.0427120299758236e-06, |
| "loss": 0.2421, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1572096198797226, |
| "step": 3370, |
| "valid_targets_mean": 2534.1, |
| "valid_targets_min": 1192 |
| }, |
| { |
| "epoch": 5.408653846153846, |
| "grad_norm": 0.8959864428190588, |
| "learning_rate": 5.985583658158212e-06, |
| "loss": 0.2409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12945888936519623, |
| "step": 3375, |
| "valid_targets_mean": 2567.4, |
| "valid_targets_min": 1399 |
| }, |
| { |
| "epoch": 5.416666666666667, |
| "grad_norm": 0.8552778775133383, |
| "learning_rate": 5.928679059556852e-06, |
| "loss": 0.2424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12539073824882507, |
| "step": 3380, |
| "valid_targets_mean": 2832.4, |
| "valid_targets_min": 1346 |
| }, |
| { |
| "epoch": 5.424679487179487, |
| "grad_norm": 0.8025920436996826, |
| "learning_rate": 5.871999142787908e-06, |
| "loss": 0.2327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13345125317573547, |
| "step": 3385, |
| "valid_targets_mean": 3709.1, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 5.4326923076923075, |
| "grad_norm": 0.8911055708140087, |
| "learning_rate": 5.815544812879936e-06, |
| "loss": 0.2465, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11404845118522644, |
| "step": 3390, |
| "valid_targets_mean": 2082.8, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 5.440705128205128, |
| "grad_norm": 0.8366878051977619, |
| "learning_rate": 5.759316971259503e-06, |
| "loss": 0.2484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10606566071510315, |
| "step": 3395, |
| "valid_targets_mean": 2823.0, |
| "valid_targets_min": 1201 |
| }, |
| { |
| "epoch": 5.448717948717949, |
| "grad_norm": 0.8888192039843411, |
| "learning_rate": 5.703316515736734e-06, |
| "loss": 0.2548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09152843058109283, |
| "step": 3400, |
| "valid_targets_mean": 1674.8, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 5.456730769230769, |
| "grad_norm": 0.8827382632913743, |
| "learning_rate": 5.647544340491007e-06, |
| "loss": 0.2562, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13417841494083405, |
| "step": 3405, |
| "valid_targets_mean": 2341.6, |
| "valid_targets_min": 950 |
| }, |
| { |
| "epoch": 5.464743589743589, |
| "grad_norm": 0.9348158913522076, |
| "learning_rate": 5.592001336056659e-06, |
| "loss": 0.2599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11661595851182938, |
| "step": 3410, |
| "valid_targets_mean": 2148.5, |
| "valid_targets_min": 1151 |
| }, |
| { |
| "epoch": 5.472756410256411, |
| "grad_norm": 0.899463165773569, |
| "learning_rate": 5.536688389308782e-06, |
| "loss": 0.2133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11449143290519714, |
| "step": 3415, |
| "valid_targets_mean": 2986.8, |
| "valid_targets_min": 1542 |
| }, |
| { |
| "epoch": 5.480769230769231, |
| "grad_norm": 1.0221840707566308, |
| "learning_rate": 5.4816063834490496e-06, |
| "loss": 0.2514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11448987573385239, |
| "step": 3420, |
| "valid_targets_mean": 2707.9, |
| "valid_targets_min": 1385 |
| }, |
| { |
| "epoch": 5.488782051282051, |
| "grad_norm": 0.8886976079403867, |
| "learning_rate": 5.426756197991625e-06, |
| "loss": 0.2578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12407940626144409, |
| "step": 3425, |
| "valid_targets_mean": 2182.8, |
| "valid_targets_min": 1171 |
| }, |
| { |
| "epoch": 5.496794871794872, |
| "grad_norm": 0.9145768030794514, |
| "learning_rate": 5.372138708749104e-06, |
| "loss": 0.2468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1369701325893402, |
| "step": 3430, |
| "valid_targets_mean": 2594.4, |
| "valid_targets_min": 1301 |
| }, |
| { |
| "epoch": 5.5048076923076925, |
| "grad_norm": 1.009581529355524, |
| "learning_rate": 5.3177547878185436e-06, |
| "loss": 0.2506, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14793305099010468, |
| "step": 3435, |
| "valid_targets_mean": 2712.1, |
| "valid_targets_min": 1151 |
| }, |
| { |
| "epoch": 5.512820512820513, |
| "grad_norm": 0.9955589264699403, |
| "learning_rate": 5.263605303567532e-06, |
| "loss": 0.2457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07715998589992523, |
| "step": 3440, |
| "valid_targets_mean": 1472.5, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 5.520833333333333, |
| "grad_norm": 0.9208751898365475, |
| "learning_rate": 5.20969112062032e-06, |
| "loss": 0.2693, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1354086697101593, |
| "step": 3445, |
| "valid_targets_mean": 2418.8, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 5.528846153846154, |
| "grad_norm": 0.9221623243176863, |
| "learning_rate": 5.156013099844017e-06, |
| "loss": 0.247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12082527577877045, |
| "step": 3450, |
| "valid_targets_mean": 2732.0, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 5.5368589743589745, |
| "grad_norm": 0.8920903965938275, |
| "learning_rate": 5.1025720983348544e-06, |
| "loss": 0.2383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08986526727676392, |
| "step": 3455, |
| "valid_targets_mean": 1880.8, |
| "valid_targets_min": 358 |
| }, |
| { |
| "epoch": 5.544871794871795, |
| "grad_norm": 0.9181262406318845, |
| "learning_rate": 5.049368969404484e-06, |
| "loss": 0.2468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16663578152656555, |
| "step": 3460, |
| "valid_targets_mean": 2500.4, |
| "valid_targets_min": 233 |
| }, |
| { |
| "epoch": 5.552884615384615, |
| "grad_norm": 0.8756777064811084, |
| "learning_rate": 4.99640456256636e-06, |
| "loss": 0.2373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12099698930978775, |
| "step": 3465, |
| "valid_targets_mean": 2159.5, |
| "valid_targets_min": 1234 |
| }, |
| { |
| "epoch": 5.560897435897436, |
| "grad_norm": 0.7964295070270689, |
| "learning_rate": 4.9436797235221814e-06, |
| "loss": 0.2467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1270281970500946, |
| "step": 3470, |
| "valid_targets_mean": 3533.8, |
| "valid_targets_min": 1714 |
| }, |
| { |
| "epoch": 5.568910256410256, |
| "grad_norm": 0.8852318618982599, |
| "learning_rate": 4.891195294148376e-06, |
| "loss": 0.2584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13869354128837585, |
| "step": 3475, |
| "valid_targets_mean": 2751.9, |
| "valid_targets_min": 950 |
| }, |
| { |
| "epoch": 5.576923076923077, |
| "grad_norm": 0.9337792028669593, |
| "learning_rate": 4.838952112482671e-06, |
| "loss": 0.2423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11898134648799896, |
| "step": 3480, |
| "valid_targets_mean": 2228.0, |
| "valid_targets_min": 981 |
| }, |
| { |
| "epoch": 5.584935897435898, |
| "grad_norm": 0.9715871230675452, |
| "learning_rate": 4.786951012710699e-06, |
| "loss": 0.2491, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11031315475702286, |
| "step": 3485, |
| "valid_targets_mean": 1735.4, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 5.592948717948718, |
| "grad_norm": 1.098570377613153, |
| "learning_rate": 4.735192825152686e-06, |
| "loss": 0.2705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14487780630588531, |
| "step": 3490, |
| "valid_targets_mean": 2629.0, |
| "valid_targets_min": 1579 |
| }, |
| { |
| "epoch": 5.600961538461538, |
| "grad_norm": 1.103661958195554, |
| "learning_rate": 4.683678376250189e-06, |
| "loss": 0.2733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13785336911678314, |
| "step": 3495, |
| "valid_targets_mean": 2487.4, |
| "valid_targets_min": 718 |
| }, |
| { |
| "epoch": 5.608974358974359, |
| "grad_norm": 0.8912416531320945, |
| "learning_rate": 4.6324084885529086e-06, |
| "loss": 0.2572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14532919228076935, |
| "step": 3500, |
| "valid_targets_mean": 2370.6, |
| "valid_targets_min": 1463 |
| }, |
| { |
| "epoch": 5.61698717948718, |
| "grad_norm": 0.853809946943463, |
| "learning_rate": 4.581383980705538e-06, |
| "loss": 0.2634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11753176897764206, |
| "step": 3505, |
| "valid_targets_mean": 2203.1, |
| "valid_targets_min": 1053 |
| }, |
| { |
| "epoch": 5.625, |
| "grad_norm": 1.0148749521455824, |
| "learning_rate": 4.530605667434727e-06, |
| "loss": 0.2512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11378777027130127, |
| "step": 3510, |
| "valid_targets_mean": 1813.6, |
| "valid_targets_min": 907 |
| }, |
| { |
| "epoch": 5.63301282051282, |
| "grad_norm": 0.8809216737162711, |
| "learning_rate": 4.480074359536013e-06, |
| "loss": 0.2433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09223954379558563, |
| "step": 3515, |
| "valid_targets_mean": 2177.4, |
| "valid_targets_min": 1163 |
| }, |
| { |
| "epoch": 5.641025641025641, |
| "grad_norm": 0.7735268513204762, |
| "learning_rate": 4.429790863860934e-06, |
| "loss": 0.24, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09695015102624893, |
| "step": 3520, |
| "valid_targets_mean": 3094.4, |
| "valid_targets_min": 1022 |
| }, |
| { |
| "epoch": 5.649038461538462, |
| "grad_norm": 0.842148140258802, |
| "learning_rate": 4.3797559833041146e-06, |
| "loss": 0.2482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19254657626152039, |
| "step": 3525, |
| "valid_targets_mean": 4331.0, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 5.657051282051282, |
| "grad_norm": 0.9672571755633537, |
| "learning_rate": 4.329970516790447e-06, |
| "loss": 0.2441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08324987441301346, |
| "step": 3530, |
| "valid_targets_mean": 1956.8, |
| "valid_targets_min": 911 |
| }, |
| { |
| "epoch": 5.665064102564102, |
| "grad_norm": 0.8246469423610661, |
| "learning_rate": 4.280435259262363e-06, |
| "loss": 0.2509, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09709151834249496, |
| "step": 3535, |
| "valid_targets_mean": 2326.0, |
| "valid_targets_min": 1127 |
| }, |
| { |
| "epoch": 5.673076923076923, |
| "grad_norm": 1.1471517807706315, |
| "learning_rate": 4.231151001667077e-06, |
| "loss": 0.2477, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12982910871505737, |
| "step": 3540, |
| "valid_targets_mean": 2151.2, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 5.681089743589744, |
| "grad_norm": 0.9991407058243512, |
| "learning_rate": 4.182118530944044e-06, |
| "loss": 0.2508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1193799376487732, |
| "step": 3545, |
| "valid_targets_mean": 1818.6, |
| "valid_targets_min": 890 |
| }, |
| { |
| "epoch": 5.689102564102564, |
| "grad_norm": 1.0600994797819268, |
| "learning_rate": 4.133338630012307e-06, |
| "loss": 0.2387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12433040142059326, |
| "step": 3550, |
| "valid_targets_mean": 1742.8, |
| "valid_targets_min": 389 |
| }, |
| { |
| "epoch": 5.697115384615385, |
| "grad_norm": 0.9556963156284349, |
| "learning_rate": 4.0848120777580554e-06, |
| "loss": 0.2398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1410602331161499, |
| "step": 3555, |
| "valid_targets_mean": 2916.0, |
| "valid_targets_min": 1039 |
| }, |
| { |
| "epoch": 5.705128205128205, |
| "grad_norm": 0.9434224405006304, |
| "learning_rate": 4.036539649022182e-06, |
| "loss": 0.2604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1809200495481491, |
| "step": 3560, |
| "valid_targets_mean": 2309.0, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 5.7131410256410255, |
| "grad_norm": 0.8716920870064443, |
| "learning_rate": 3.988522114587865e-06, |
| "loss": 0.2519, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12875115871429443, |
| "step": 3565, |
| "valid_targets_mean": 2863.0, |
| "valid_targets_min": 1614 |
| }, |
| { |
| "epoch": 5.721153846153846, |
| "grad_norm": 1.0458563586692415, |
| "learning_rate": 3.940760241168331e-06, |
| "loss": 0.2509, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11806829273700714, |
| "step": 3570, |
| "valid_targets_mean": 1454.2, |
| "valid_targets_min": 1001 |
| }, |
| { |
| "epoch": 5.729166666666667, |
| "grad_norm": 0.9062406947995726, |
| "learning_rate": 3.893254791394541e-06, |
| "loss": 0.2395, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11536668241024017, |
| "step": 3575, |
| "valid_targets_mean": 2212.8, |
| "valid_targets_min": 1612 |
| }, |
| { |
| "epoch": 5.737179487179487, |
| "grad_norm": 1.330022131278515, |
| "learning_rate": 3.846006523803074e-06, |
| "loss": 0.2469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12758204340934753, |
| "step": 3580, |
| "valid_targets_mean": 2525.5, |
| "valid_targets_min": 1242 |
| }, |
| { |
| "epoch": 5.7451923076923075, |
| "grad_norm": 0.8835904952970588, |
| "learning_rate": 3.799016192823981e-06, |
| "loss": 0.2478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09581005573272705, |
| "step": 3585, |
| "valid_targets_mean": 1695.1, |
| "valid_targets_min": 338 |
| }, |
| { |
| "epoch": 5.753205128205128, |
| "grad_norm": 0.9420105033129872, |
| "learning_rate": 3.7522845487687276e-06, |
| "loss": 0.2415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14770177006721497, |
| "step": 3590, |
| "valid_targets_mean": 2628.4, |
| "valid_targets_min": 1034 |
| }, |
| { |
| "epoch": 5.761217948717949, |
| "grad_norm": 0.8676921782417414, |
| "learning_rate": 3.7058123378182664e-06, |
| "loss": 0.2521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08950576186180115, |
| "step": 3595, |
| "valid_targets_mean": 2229.5, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 5.769230769230769, |
| "grad_norm": 1.0067847303064097, |
| "learning_rate": 3.6596003020110636e-06, |
| "loss": 0.2686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12687063217163086, |
| "step": 3600, |
| "valid_targets_mean": 1829.5, |
| "valid_targets_min": 1329 |
| }, |
| { |
| "epoch": 5.777243589743589, |
| "grad_norm": 0.9462956235007977, |
| "learning_rate": 3.613649179231287e-06, |
| "loss": 0.2369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12175004184246063, |
| "step": 3605, |
| "valid_targets_mean": 2789.6, |
| "valid_targets_min": 1053 |
| }, |
| { |
| "epoch": 5.785256410256411, |
| "grad_norm": 0.9538550126840127, |
| "learning_rate": 3.5679597031970017e-06, |
| "loss": 0.2476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11191975325345993, |
| "step": 3610, |
| "valid_targets_mean": 1783.1, |
| "valid_targets_min": 1165 |
| }, |
| { |
| "epoch": 5.793269230769231, |
| "grad_norm": 0.9448665396902267, |
| "learning_rate": 3.5225326034484764e-06, |
| "loss": 0.2259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11258763074874878, |
| "step": 3615, |
| "valid_targets_mean": 2813.6, |
| "valid_targets_min": 1010 |
| }, |
| { |
| "epoch": 5.801282051282051, |
| "grad_norm": 1.1921602754723932, |
| "learning_rate": 3.4773686053365197e-06, |
| "loss": 0.2547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.108152374625206, |
| "step": 3620, |
| "valid_targets_mean": 1980.9, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 5.809294871794872, |
| "grad_norm": 0.9389437871542158, |
| "learning_rate": 3.4324684300109003e-06, |
| "loss": 0.2454, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12262805551290512, |
| "step": 3625, |
| "valid_targets_mean": 2210.5, |
| "valid_targets_min": 1501 |
| }, |
| { |
| "epoch": 5.8173076923076925, |
| "grad_norm": 0.8936446524664393, |
| "learning_rate": 3.387832794408832e-06, |
| "loss": 0.2469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11695268750190735, |
| "step": 3630, |
| "valid_targets_mean": 2020.8, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 5.825320512820513, |
| "grad_norm": 0.9701527092625535, |
| "learning_rate": 3.3434624112435342e-06, |
| "loss": 0.2494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1281004697084427, |
| "step": 3635, |
| "valid_targets_mean": 2187.0, |
| "valid_targets_min": 1121 |
| }, |
| { |
| "epoch": 5.833333333333333, |
| "grad_norm": 0.8743840128057639, |
| "learning_rate": 3.2993579889928397e-06, |
| "loss": 0.2543, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16947509348392487, |
| "step": 3640, |
| "valid_targets_mean": 3233.1, |
| "valid_targets_min": 1260 |
| }, |
| { |
| "epoch": 5.841346153846154, |
| "grad_norm": 1.098032928845481, |
| "learning_rate": 3.25552023188789e-06, |
| "loss": 0.2528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08012664318084717, |
| "step": 3645, |
| "valid_targets_mean": 1645.8, |
| "valid_targets_min": 299 |
| }, |
| { |
| "epoch": 5.8493589743589745, |
| "grad_norm": 0.800014973443817, |
| "learning_rate": 3.211949839901889e-06, |
| "loss": 0.2328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13721336424350739, |
| "step": 3650, |
| "valid_targets_mean": 3545.6, |
| "valid_targets_min": 1813 |
| }, |
| { |
| "epoch": 5.857371794871795, |
| "grad_norm": 0.8357203359294402, |
| "learning_rate": 3.168647508738927e-06, |
| "loss": 0.2538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13685111701488495, |
| "step": 3655, |
| "valid_targets_mean": 2689.5, |
| "valid_targets_min": 1076 |
| }, |
| { |
| "epoch": 5.865384615384615, |
| "grad_norm": 0.8044023365786744, |
| "learning_rate": 3.125613929822866e-06, |
| "loss": 0.2333, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11675594747066498, |
| "step": 3660, |
| "valid_targets_mean": 2676.8, |
| "valid_targets_min": 1320 |
| }, |
| { |
| "epoch": 5.873397435897436, |
| "grad_norm": 0.9867169190192657, |
| "learning_rate": 3.0828497902863106e-06, |
| "loss": 0.2405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13692760467529297, |
| "step": 3665, |
| "valid_targets_mean": 2082.4, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 5.881410256410256, |
| "grad_norm": 1.033716028166094, |
| "learning_rate": 3.0403557729596267e-06, |
| "loss": 0.2507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08903215825557709, |
| "step": 3670, |
| "valid_targets_mean": 1578.8, |
| "valid_targets_min": 338 |
| }, |
| { |
| "epoch": 5.889423076923077, |
| "grad_norm": 0.9281432052223707, |
| "learning_rate": 2.998132556360038e-06, |
| "loss": 0.2475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1471833884716034, |
| "step": 3675, |
| "valid_targets_mean": 1990.5, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 5.897435897435898, |
| "grad_norm": 0.9371734995128413, |
| "learning_rate": 2.9561808146808068e-06, |
| "loss": 0.2724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13200689852237701, |
| "step": 3680, |
| "valid_targets_mean": 2243.6, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 5.905448717948718, |
| "grad_norm": 1.0373083841003878, |
| "learning_rate": 2.9145012177804476e-06, |
| "loss": 0.2538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1324290782213211, |
| "step": 3685, |
| "valid_targets_mean": 2374.5, |
| "valid_targets_min": 386 |
| }, |
| { |
| "epoch": 5.913461538461538, |
| "grad_norm": 1.2898842869596276, |
| "learning_rate": 2.8730944311720454e-06, |
| "loss": 0.2317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.140394926071167, |
| "step": 3690, |
| "valid_targets_mean": 2749.2, |
| "valid_targets_min": 1277 |
| }, |
| { |
| "epoch": 5.921474358974359, |
| "grad_norm": 0.9019036941814247, |
| "learning_rate": 2.8319611160126226e-06, |
| "loss": 0.2501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07446151226758957, |
| "step": 3695, |
| "valid_targets_mean": 1745.6, |
| "valid_targets_min": 879 |
| }, |
| { |
| "epoch": 5.92948717948718, |
| "grad_norm": 0.8839791385323709, |
| "learning_rate": 2.791101929092592e-06, |
| "loss": 0.2489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11784940958023071, |
| "step": 3700, |
| "valid_targets_mean": 2234.2, |
| "valid_targets_min": 1195 |
| }, |
| { |
| "epoch": 5.9375, |
| "grad_norm": 0.8330181151771336, |
| "learning_rate": 2.750517522825251e-06, |
| "loss": 0.25, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13366447389125824, |
| "step": 3705, |
| "valid_targets_mean": 2719.9, |
| "valid_targets_min": 1104 |
| }, |
| { |
| "epoch": 5.94551282051282, |
| "grad_norm": 0.9377041217700914, |
| "learning_rate": 2.710208545236397e-06, |
| "loss": 0.236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.133009672164917, |
| "step": 3710, |
| "valid_targets_mean": 2508.2, |
| "valid_targets_min": 929 |
| }, |
| { |
| "epoch": 5.953525641025641, |
| "grad_norm": 0.9820403258442009, |
| "learning_rate": 2.670175639953929e-06, |
| "loss": 0.2568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11438588798046112, |
| "step": 3715, |
| "valid_targets_mean": 2220.0, |
| "valid_targets_min": 1251 |
| }, |
| { |
| "epoch": 5.961538461538462, |
| "grad_norm": 0.7615622545783344, |
| "learning_rate": 2.6304194461976207e-06, |
| "loss": 0.2399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14797644317150116, |
| "step": 3720, |
| "valid_targets_mean": 3764.2, |
| "valid_targets_min": 1940 |
| }, |
| { |
| "epoch": 5.969551282051282, |
| "grad_norm": 1.3057101203774155, |
| "learning_rate": 2.5909405987688896e-06, |
| "loss": 0.2528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12257261574268341, |
| "step": 3725, |
| "valid_targets_mean": 2614.1, |
| "valid_targets_min": 1414 |
| }, |
| { |
| "epoch": 5.977564102564102, |
| "grad_norm": 0.9546669568666493, |
| "learning_rate": 2.5517397280406565e-06, |
| "loss": 0.2651, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1352090984582901, |
| "step": 3730, |
| "valid_targets_mean": 1989.8, |
| "valid_targets_min": 1115 |
| }, |
| { |
| "epoch": 5.985576923076923, |
| "grad_norm": 0.8381510959729745, |
| "learning_rate": 2.512817459947312e-06, |
| "loss": 0.255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1442822366952896, |
| "step": 3735, |
| "valid_targets_mean": 2502.4, |
| "valid_targets_min": 303 |
| }, |
| { |
| "epoch": 5.993589743589744, |
| "grad_norm": 0.8381879679213633, |
| "learning_rate": 2.4741744159746618e-06, |
| "loss": 0.2441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1361812949180603, |
| "step": 3740, |
| "valid_targets_mean": 2932.0, |
| "valid_targets_min": 1390 |
| }, |
| { |
| "epoch": 6.001602564102564, |
| "grad_norm": 0.8973578582889672, |
| "learning_rate": 2.435811213150079e-06, |
| "loss": 0.2243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11854055523872375, |
| "step": 3745, |
| "valid_targets_mean": 2506.2, |
| "valid_targets_min": 1387 |
| }, |
| { |
| "epoch": 6.009615384615385, |
| "grad_norm": 0.8534114522962257, |
| "learning_rate": 2.3977284640325805e-06, |
| "loss": 0.2357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10698527097702026, |
| "step": 3750, |
| "valid_targets_mean": 2164.8, |
| "valid_targets_min": 1463 |
| }, |
| { |
| "epoch": 6.017628205128205, |
| "grad_norm": 1.0624803521960697, |
| "learning_rate": 2.359926776703092e-06, |
| "loss": 0.2545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16178178787231445, |
| "step": 3755, |
| "valid_targets_mean": 1912.1, |
| "valid_targets_min": 1224 |
| }, |
| { |
| "epoch": 6.0256410256410255, |
| "grad_norm": 0.9211420738337137, |
| "learning_rate": 2.3224067547547357e-06, |
| "loss": 0.2439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1036263182759285, |
| "step": 3760, |
| "valid_targets_mean": 1760.0, |
| "valid_targets_min": 351 |
| }, |
| { |
| "epoch": 6.033653846153846, |
| "grad_norm": 0.9051511202364992, |
| "learning_rate": 2.2851689972831536e-06, |
| "loss": 0.2508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11598742753267288, |
| "step": 3765, |
| "valid_targets_mean": 2061.2, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 6.041666666666667, |
| "grad_norm": 0.9418108298812553, |
| "learning_rate": 2.248214098877002e-06, |
| "loss": 0.2336, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10721792280673981, |
| "step": 3770, |
| "valid_targets_mean": 1872.5, |
| "valid_targets_min": 314 |
| }, |
| { |
| "epoch": 6.049679487179487, |
| "grad_norm": 0.9797618243041817, |
| "learning_rate": 2.2115426496083958e-06, |
| "loss": 0.2498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11505149304866791, |
| "step": 3775, |
| "valid_targets_mean": 1678.6, |
| "valid_targets_min": 303 |
| }, |
| { |
| "epoch": 6.0576923076923075, |
| "grad_norm": 0.993599072618345, |
| "learning_rate": 2.175155235023536e-06, |
| "loss": 0.2378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11126979440450668, |
| "step": 3780, |
| "valid_targets_mean": 1965.8, |
| "valid_targets_min": 395 |
| }, |
| { |
| "epoch": 6.065705128205129, |
| "grad_norm": 1.2166175998444293, |
| "learning_rate": 2.1390524361333355e-06, |
| "loss": 0.2055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11817347258329391, |
| "step": 3785, |
| "valid_targets_mean": 2711.9, |
| "valid_targets_min": 1262 |
| }, |
| { |
| "epoch": 6.073717948717949, |
| "grad_norm": 1.0184639512858285, |
| "learning_rate": 2.1032348294041305e-06, |
| "loss": 0.243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10550463944673538, |
| "step": 3790, |
| "valid_targets_mean": 2176.2, |
| "valid_targets_min": 413 |
| }, |
| { |
| "epoch": 6.081730769230769, |
| "grad_norm": 0.8816372867971991, |
| "learning_rate": 2.067702986748521e-06, |
| "loss": 0.2356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13984540104866028, |
| "step": 3795, |
| "valid_targets_mean": 2715.6, |
| "valid_targets_min": 1046 |
| }, |
| { |
| "epoch": 6.089743589743589, |
| "grad_norm": 0.856756363743796, |
| "learning_rate": 2.0324574755161764e-06, |
| "loss": 0.2158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11478455364704132, |
| "step": 3800, |
| "valid_targets_mean": 3045.0, |
| "valid_targets_min": 1110 |
| }, |
| { |
| "epoch": 6.097756410256411, |
| "grad_norm": 1.014237638787344, |
| "learning_rate": 1.9974988584848385e-06, |
| "loss": 0.2445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15924817323684692, |
| "step": 3805, |
| "valid_targets_mean": 2288.0, |
| "valid_targets_min": 552 |
| }, |
| { |
| "epoch": 6.105769230769231, |
| "grad_norm": 0.7358071224075459, |
| "learning_rate": 1.96282769385129e-06, |
| "loss": 0.2368, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16144993901252747, |
| "step": 3810, |
| "valid_targets_mean": 3920.1, |
| "valid_targets_min": 1087 |
| }, |
| { |
| "epoch": 6.113782051282051, |
| "grad_norm": 0.8095160537437991, |
| "learning_rate": 1.9284445352224625e-06, |
| "loss": 0.2482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12894617021083832, |
| "step": 3815, |
| "valid_targets_mean": 4050.4, |
| "valid_targets_min": 1416 |
| }, |
| { |
| "epoch": 6.121794871794871, |
| "grad_norm": 0.8248147276134351, |
| "learning_rate": 1.894349931606596e-06, |
| "loss": 0.2298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10038469731807709, |
| "step": 3820, |
| "valid_targets_mean": 2216.5, |
| "valid_targets_min": 1070 |
| }, |
| { |
| "epoch": 6.1298076923076925, |
| "grad_norm": 0.9659691832090724, |
| "learning_rate": 1.8605444274044493e-06, |
| "loss": 0.224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13512755930423737, |
| "step": 3825, |
| "valid_targets_mean": 3244.0, |
| "valid_targets_min": 1432 |
| }, |
| { |
| "epoch": 6.137820512820513, |
| "grad_norm": 1.0862713671449233, |
| "learning_rate": 1.827028562400659e-06, |
| "loss": 0.238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09466798603534698, |
| "step": 3830, |
| "valid_targets_mean": 1761.5, |
| "valid_targets_min": 1029 |
| }, |
| { |
| "epoch": 6.145833333333333, |
| "grad_norm": 0.8998914205168546, |
| "learning_rate": 1.793802871755066e-06, |
| "loss": 0.2381, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13006693124771118, |
| "step": 3835, |
| "valid_targets_mean": 2522.0, |
| "valid_targets_min": 892 |
| }, |
| { |
| "epoch": 6.153846153846154, |
| "grad_norm": 0.9432779658728595, |
| "learning_rate": 1.760867885994202e-06, |
| "loss": 0.2438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1070912778377533, |
| "step": 3840, |
| "valid_targets_mean": 1912.8, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 6.1618589743589745, |
| "grad_norm": 0.9338261525659013, |
| "learning_rate": 1.7282241310028047e-06, |
| "loss": 0.2407, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0991261750459671, |
| "step": 3845, |
| "valid_targets_mean": 1827.0, |
| "valid_targets_min": 816 |
| }, |
| { |
| "epoch": 6.169871794871795, |
| "grad_norm": 0.8125279588220881, |
| "learning_rate": 1.6958721280154232e-06, |
| "loss": 0.2384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09734629094600677, |
| "step": 3850, |
| "valid_targets_mean": 2683.1, |
| "valid_targets_min": 1626 |
| }, |
| { |
| "epoch": 6.177884615384615, |
| "grad_norm": 0.8247615418877465, |
| "learning_rate": 1.6638123936081085e-06, |
| "loss": 0.2287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10162614285945892, |
| "step": 3855, |
| "valid_targets_mean": 3007.8, |
| "valid_targets_min": 1285 |
| }, |
| { |
| "epoch": 6.185897435897436, |
| "grad_norm": 1.054167152401939, |
| "learning_rate": 1.6320454396901463e-06, |
| "loss": 0.2522, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17180277407169342, |
| "step": 3860, |
| "valid_targets_mean": 2394.8, |
| "valid_targets_min": 835 |
| }, |
| { |
| "epoch": 6.193910256410256, |
| "grad_norm": 0.861439666599418, |
| "learning_rate": 1.6005717734958914e-06, |
| "loss": 0.2364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10443761199712753, |
| "step": 3865, |
| "valid_targets_mean": 2728.1, |
| "valid_targets_min": 1162 |
| }, |
| { |
| "epoch": 6.201923076923077, |
| "grad_norm": 1.1126631206428137, |
| "learning_rate": 1.569391897576671e-06, |
| "loss": 0.2305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13118451833724976, |
| "step": 3870, |
| "valid_targets_mean": 3325.9, |
| "valid_targets_min": 1334 |
| }, |
| { |
| "epoch": 6.209935897435898, |
| "grad_norm": 1.1962641290378953, |
| "learning_rate": 1.5385063097927533e-06, |
| "loss": 0.2458, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15093114972114563, |
| "step": 3875, |
| "valid_targets_mean": 1901.5, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 6.217948717948718, |
| "grad_norm": 0.8163609568748574, |
| "learning_rate": 1.5079155033054104e-06, |
| "loss": 0.2637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12418213486671448, |
| "step": 3880, |
| "valid_targets_mean": 3363.8, |
| "valid_targets_min": 1873 |
| }, |
| { |
| "epoch": 6.225961538461538, |
| "grad_norm": 0.8700233982216152, |
| "learning_rate": 1.4776199665690239e-06, |
| "loss": 0.2315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14278334379196167, |
| "step": 3885, |
| "valid_targets_mean": 2949.2, |
| "valid_targets_min": 2107 |
| }, |
| { |
| "epoch": 6.233974358974359, |
| "grad_norm": 0.9683775134031113, |
| "learning_rate": 1.4476201833233084e-06, |
| "loss": 0.2456, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1428484171628952, |
| "step": 3890, |
| "valid_targets_mean": 2313.9, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 6.24198717948718, |
| "grad_norm": 0.8620465618712795, |
| "learning_rate": 1.4179166325855676e-06, |
| "loss": 0.2301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10901591181755066, |
| "step": 3895, |
| "valid_targets_mean": 2681.1, |
| "valid_targets_min": 1417 |
| }, |
| { |
| "epoch": 6.25, |
| "grad_norm": 1.0173933841157816, |
| "learning_rate": 1.3885097886430599e-06, |
| "loss": 0.2307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11926823854446411, |
| "step": 3900, |
| "valid_targets_mean": 1679.1, |
| "valid_targets_min": 776 |
| }, |
| { |
| "epoch": 6.25801282051282, |
| "grad_norm": 0.9589762435954294, |
| "learning_rate": 1.35940012104542e-06, |
| "loss": 0.229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11792376637458801, |
| "step": 3905, |
| "valid_targets_mean": 2086.9, |
| "valid_targets_min": 1173 |
| }, |
| { |
| "epoch": 6.266025641025641, |
| "grad_norm": 0.8272561272888953, |
| "learning_rate": 1.3305880945971583e-06, |
| "loss": 0.2197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11362828314304352, |
| "step": 3910, |
| "valid_targets_mean": 2718.2, |
| "valid_targets_min": 1210 |
| }, |
| { |
| "epoch": 6.274038461538462, |
| "grad_norm": 0.874758503329499, |
| "learning_rate": 1.3020741693502403e-06, |
| "loss": 0.2244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11108657717704773, |
| "step": 3915, |
| "valid_targets_mean": 2434.9, |
| "valid_targets_min": 876 |
| }, |
| { |
| "epoch": 6.282051282051282, |
| "grad_norm": 0.9079477576801739, |
| "learning_rate": 1.27385880059675e-06, |
| "loss": 0.246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12969839572906494, |
| "step": 3920, |
| "valid_targets_mean": 2454.9, |
| "valid_targets_min": 1137 |
| }, |
| { |
| "epoch": 6.290064102564102, |
| "grad_norm": 2.0808279255459916, |
| "learning_rate": 1.245942438861607e-06, |
| "loss": 0.2313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14092810451984406, |
| "step": 3925, |
| "valid_targets_mean": 4037.8, |
| "valid_targets_min": 1906 |
| }, |
| { |
| "epoch": 6.298076923076923, |
| "grad_norm": 0.899393114401227, |
| "learning_rate": 1.2183255298953788e-06, |
| "loss": 0.2267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11960645020008087, |
| "step": 3930, |
| "valid_targets_mean": 2517.6, |
| "valid_targets_min": 294 |
| }, |
| { |
| "epoch": 6.306089743589744, |
| "grad_norm": 0.8903825930436158, |
| "learning_rate": 1.1910085146671645e-06, |
| "loss": 0.2335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09993119537830353, |
| "step": 3935, |
| "valid_targets_mean": 2103.9, |
| "valid_targets_min": 947 |
| }, |
| { |
| "epoch": 6.314102564102564, |
| "grad_norm": 0.954308249771596, |
| "learning_rate": 1.1639918293575492e-06, |
| "loss": 0.2362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10835768282413483, |
| "step": 3940, |
| "valid_targets_mean": 2119.8, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 6.322115384615385, |
| "grad_norm": 0.7514063558774706, |
| "learning_rate": 1.1372759053516536e-06, |
| "loss": 0.2378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07814587652683258, |
| "step": 3945, |
| "valid_targets_mean": 1868.4, |
| "valid_targets_min": 1116 |
| }, |
| { |
| "epoch": 6.330128205128205, |
| "grad_norm": 1.2072460679937176, |
| "learning_rate": 1.1108611692322157e-06, |
| "loss": 0.2302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12843677401542664, |
| "step": 3950, |
| "valid_targets_mean": 2542.8, |
| "valid_targets_min": 1621 |
| }, |
| { |
| "epoch": 6.3381410256410255, |
| "grad_norm": 1.0878840127555423, |
| "learning_rate": 1.0847480427728142e-06, |
| "loss": 0.2446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1504746973514557, |
| "step": 3955, |
| "valid_targets_mean": 2188.8, |
| "valid_targets_min": 1581 |
| }, |
| { |
| "epoch": 6.346153846153846, |
| "grad_norm": 0.9562102985761943, |
| "learning_rate": 1.0589369429311125e-06, |
| "loss": 0.2364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13461454212665558, |
| "step": 3960, |
| "valid_targets_mean": 2561.5, |
| "valid_targets_min": 1333 |
| }, |
| { |
| "epoch": 6.354166666666667, |
| "grad_norm": 0.9752919981880385, |
| "learning_rate": 1.0334282818422037e-06, |
| "loss": 0.2445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1450095921754837, |
| "step": 3965, |
| "valid_targets_mean": 2425.1, |
| "valid_targets_min": 1062 |
| }, |
| { |
| "epoch": 6.362179487179487, |
| "grad_norm": 1.5311355387380936, |
| "learning_rate": 1.008222466812041e-06, |
| "loss": 0.2553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07920059561729431, |
| "step": 3970, |
| "valid_targets_mean": 2347.8, |
| "valid_targets_min": 966 |
| }, |
| { |
| "epoch": 6.3701923076923075, |
| "grad_norm": 1.0924705252685218, |
| "learning_rate": 9.83319900310915e-07, |
| "loss": 0.2318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12321265786886215, |
| "step": 3975, |
| "valid_targets_mean": 2116.4, |
| "valid_targets_min": 1230 |
| }, |
| { |
| "epoch": 6.378205128205128, |
| "grad_norm": 0.9640948057385402, |
| "learning_rate": 9.587209799670495e-07, |
| "loss": 0.2377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11751890182495117, |
| "step": 3980, |
| "valid_targets_mean": 2322.9, |
| "valid_targets_min": 1085 |
| }, |
| { |
| "epoch": 6.386217948717949, |
| "grad_norm": 1.079236125695824, |
| "learning_rate": 9.344260985602327e-07, |
| "loss": 0.242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16698667407035828, |
| "step": 3985, |
| "valid_targets_mean": 1949.1, |
| "valid_targets_min": 812 |
| }, |
| { |
| "epoch": 6.394230769230769, |
| "grad_norm": 1.0803656519063216, |
| "learning_rate": 9.104356440155526e-07, |
| "loss": 0.242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.140387624502182, |
| "step": 3990, |
| "valid_targets_mean": 2234.5, |
| "valid_targets_min": 1183 |
| }, |
| { |
| "epoch": 6.402243589743589, |
| "grad_norm": 0.8456195863558014, |
| "learning_rate": 8.867499993972162e-07, |
| "loss": 0.2328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13046512007713318, |
| "step": 3995, |
| "valid_targets_mean": 3625.6, |
| "valid_targets_min": 979 |
| }, |
| { |
| "epoch": 6.410256410256411, |
| "grad_norm": 0.8977134484616605, |
| "learning_rate": 8.633695429024058e-07, |
| "loss": 0.2384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10581670701503754, |
| "step": 4000, |
| "valid_targets_mean": 2741.9, |
| "valid_targets_min": 921 |
| }, |
| { |
| "epoch": 6.418269230769231, |
| "grad_norm": 0.7948378106951604, |
| "learning_rate": 8.402946478552732e-07, |
| "loss": 0.2253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09752516448497772, |
| "step": 4005, |
| "valid_targets_mean": 3156.9, |
| "valid_targets_min": 473 |
| }, |
| { |
| "epoch": 6.426282051282051, |
| "grad_norm": 0.8443688864845404, |
| "learning_rate": 8.175256827009392e-07, |
| "loss": 0.2344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10218418389558792, |
| "step": 4010, |
| "valid_targets_mean": 2307.0, |
| "valid_targets_min": 1029 |
| }, |
| { |
| "epoch": 6.434294871794872, |
| "grad_norm": 1.7792482258762818, |
| "learning_rate": 7.95063010999646e-07, |
| "loss": 0.2392, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09822884202003479, |
| "step": 4015, |
| "valid_targets_mean": 1924.8, |
| "valid_targets_min": 981 |
| }, |
| { |
| "epoch": 6.4423076923076925, |
| "grad_norm": 0.926606896282617, |
| "learning_rate": 7.729069914209409e-07, |
| "loss": 0.2308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11828078329563141, |
| "step": 4020, |
| "valid_targets_mean": 2529.9, |
| "valid_targets_min": 1042 |
| }, |
| { |
| "epoch": 6.450320512820513, |
| "grad_norm": 1.0827086250732898, |
| "learning_rate": 7.510579777379345e-07, |
| "loss": 0.2326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10486094653606415, |
| "step": 4025, |
| "valid_targets_mean": 1429.4, |
| "valid_targets_min": 297 |
| }, |
| { |
| "epoch": 6.458333333333333, |
| "grad_norm": 0.9839272238313078, |
| "learning_rate": 7.295163188216792e-07, |
| "loss": 0.2348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1142701581120491, |
| "step": 4030, |
| "valid_targets_mean": 2105.8, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 6.466346153846154, |
| "grad_norm": 0.9291054329783041, |
| "learning_rate": 7.08282358635568e-07, |
| "loss": 0.2542, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12670905888080597, |
| "step": 4035, |
| "valid_targets_mean": 2173.2, |
| "valid_targets_min": 1040 |
| }, |
| { |
| "epoch": 6.4743589743589745, |
| "grad_norm": 0.9426259395664396, |
| "learning_rate": 6.87356436229869e-07, |
| "loss": 0.2555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12212735414505005, |
| "step": 4040, |
| "valid_targets_mean": 1812.4, |
| "valid_targets_min": 1033 |
| }, |
| { |
| "epoch": 6.482371794871795, |
| "grad_norm": 0.7380513636736298, |
| "learning_rate": 6.667388857362977e-07, |
| "loss": 0.2367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09599901735782623, |
| "step": 4045, |
| "valid_targets_mean": 2941.8, |
| "valid_targets_min": 934 |
| }, |
| { |
| "epoch": 6.490384615384615, |
| "grad_norm": 0.9099419008308579, |
| "learning_rate": 6.464300363626797e-07, |
| "loss": 0.2327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11146557331085205, |
| "step": 4050, |
| "valid_targets_mean": 2807.4, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 6.498397435897436, |
| "grad_norm": 0.9809559308191058, |
| "learning_rate": 6.264302123877053e-07, |
| "loss": 0.2297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11797185242176056, |
| "step": 4055, |
| "valid_targets_mean": 2723.9, |
| "valid_targets_min": 1600 |
| }, |
| { |
| "epoch": 6.506410256410256, |
| "grad_norm": 0.9350599141578312, |
| "learning_rate": 6.067397331557412e-07, |
| "loss": 0.2368, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12935124337673187, |
| "step": 4060, |
| "valid_targets_mean": 2216.0, |
| "valid_targets_min": 1135 |
| }, |
| { |
| "epoch": 6.514423076923077, |
| "grad_norm": 1.4016198586806865, |
| "learning_rate": 5.873589130717405e-07, |
| "loss": 0.2382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12601718306541443, |
| "step": 4065, |
| "valid_targets_mean": 1985.8, |
| "valid_targets_min": 1158 |
| }, |
| { |
| "epoch": 6.522435897435898, |
| "grad_norm": 0.8251427320454606, |
| "learning_rate": 5.682880615962116e-07, |
| "loss": 0.2363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10815025866031647, |
| "step": 4070, |
| "valid_targets_mean": 2696.6, |
| "valid_targets_min": 1190 |
| }, |
| { |
| "epoch": 6.530448717948718, |
| "grad_norm": 0.8955660099878735, |
| "learning_rate": 5.495274832402841e-07, |
| "loss": 0.2244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10643479228019714, |
| "step": 4075, |
| "valid_targets_mean": 2961.2, |
| "valid_targets_min": 886 |
| }, |
| { |
| "epoch": 6.538461538461538, |
| "grad_norm": 0.9604493791278844, |
| "learning_rate": 5.310774775608529e-07, |
| "loss": 0.2425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1176200807094574, |
| "step": 4080, |
| "valid_targets_mean": 2403.2, |
| "valid_targets_min": 654 |
| }, |
| { |
| "epoch": 6.546474358974359, |
| "grad_norm": 0.9762190869394272, |
| "learning_rate": 5.129383391557751e-07, |
| "loss": 0.253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1663392037153244, |
| "step": 4085, |
| "valid_targets_mean": 1939.5, |
| "valid_targets_min": 855 |
| }, |
| { |
| "epoch": 6.55448717948718, |
| "grad_norm": 0.842222470742701, |
| "learning_rate": 4.951103576591876e-07, |
| "loss": 0.225, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10071545094251633, |
| "step": 4090, |
| "valid_targets_mean": 2852.8, |
| "valid_targets_min": 1331 |
| }, |
| { |
| "epoch": 6.5625, |
| "grad_norm": 0.9307268460212219, |
| "learning_rate": 4.7759381773687e-07, |
| "loss": 0.2297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11373141407966614, |
| "step": 4095, |
| "valid_targets_mean": 2556.9, |
| "valid_targets_min": 913 |
| }, |
| { |
| "epoch": 6.57051282051282, |
| "grad_norm": 0.8457918011171499, |
| "learning_rate": 4.6038899908170234e-07, |
| "loss": 0.2277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13154616951942444, |
| "step": 4100, |
| "valid_targets_mean": 2821.9, |
| "valid_targets_min": 1106 |
| }, |
| { |
| "epoch": 6.578525641025641, |
| "grad_norm": 0.8387894923769624, |
| "learning_rate": 4.4349617640920164e-07, |
| "loss": 0.2495, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1035970151424408, |
| "step": 4105, |
| "valid_targets_mean": 1948.8, |
| "valid_targets_min": 1123 |
| }, |
| { |
| "epoch": 6.586538461538462, |
| "grad_norm": 0.9037859502058307, |
| "learning_rate": 4.2691561945312764e-07, |
| "loss": 0.2328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1121777892112732, |
| "step": 4110, |
| "valid_targets_mean": 2629.9, |
| "valid_targets_min": 1407 |
| }, |
| { |
| "epoch": 6.594551282051282, |
| "grad_norm": 0.8863493487648947, |
| "learning_rate": 4.106475929611886e-07, |
| "loss": 0.2289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11576659977436066, |
| "step": 4115, |
| "valid_targets_mean": 2561.9, |
| "valid_targets_min": 1661 |
| }, |
| { |
| "epoch": 6.602564102564102, |
| "grad_norm": 0.8878216680524392, |
| "learning_rate": 3.9469235669080007e-07, |
| "loss": 0.2276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10847125947475433, |
| "step": 4120, |
| "valid_targets_mean": 2641.6, |
| "valid_targets_min": 1118 |
| }, |
| { |
| "epoch": 6.610576923076923, |
| "grad_norm": 1.0358019265981901, |
| "learning_rate": 3.7905016540495053e-07, |
| "loss": 0.2547, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11162734031677246, |
| "step": 4125, |
| "valid_targets_mean": 1598.9, |
| "valid_targets_min": 508 |
| }, |
| { |
| "epoch": 6.618589743589744, |
| "grad_norm": 0.7745868367967038, |
| "learning_rate": 3.63721268868118e-07, |
| "loss": 0.2369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0914057046175003, |
| "step": 4130, |
| "valid_targets_mean": 2922.6, |
| "valid_targets_min": 1394 |
| }, |
| { |
| "epoch": 6.626602564102564, |
| "grad_norm": 1.0567183316790034, |
| "learning_rate": 3.487059118422997e-07, |
| "loss": 0.2458, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11103471368551254, |
| "step": 4135, |
| "valid_targets_mean": 1526.8, |
| "valid_targets_min": 417 |
| }, |
| { |
| "epoch": 6.634615384615385, |
| "grad_norm": 0.7607762113223796, |
| "learning_rate": 3.3400433408308895e-07, |
| "loss": 0.2299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09019508957862854, |
| "step": 4140, |
| "valid_targets_mean": 2316.9, |
| "valid_targets_min": 447 |
| }, |
| { |
| "epoch": 6.642628205128205, |
| "grad_norm": 0.8802472861580645, |
| "learning_rate": 3.196167703358577e-07, |
| "loss": 0.2349, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1006564050912857, |
| "step": 4145, |
| "valid_targets_mean": 2205.8, |
| "valid_targets_min": 945 |
| }, |
| { |
| "epoch": 6.6506410256410255, |
| "grad_norm": 0.8730051710281508, |
| "learning_rate": 3.0554345033199985e-07, |
| "loss": 0.2292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12638235092163086, |
| "step": 4150, |
| "valid_targets_mean": 3004.1, |
| "valid_targets_min": 796 |
| }, |
| { |
| "epoch": 6.658653846153846, |
| "grad_norm": 1.1553489157125603, |
| "learning_rate": 2.917845987852652e-07, |
| "loss": 0.2415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1155930757522583, |
| "step": 4155, |
| "valid_targets_mean": 2950.5, |
| "valid_targets_min": 1269 |
| }, |
| { |
| "epoch": 6.666666666666667, |
| "grad_norm": 0.8952157916587886, |
| "learning_rate": 2.783404353881758e-07, |
| "loss": 0.2424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.08050580322742462, |
| "step": 4160, |
| "valid_targets_mean": 2010.8, |
| "valid_targets_min": 1010 |
| }, |
| { |
| "epoch": 6.674679487179487, |
| "grad_norm": 0.9408776457030263, |
| "learning_rate": 2.652111748085151e-07, |
| "loss": 0.2301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11845621466636658, |
| "step": 4165, |
| "valid_targets_mean": 2520.0, |
| "valid_targets_min": 1905 |
| }, |
| { |
| "epoch": 6.6826923076923075, |
| "grad_norm": 1.0642164005801316, |
| "learning_rate": 2.523970266859044e-07, |
| "loss": 0.2528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15462008118629456, |
| "step": 4170, |
| "valid_targets_mean": 2359.5, |
| "valid_targets_min": 1170 |
| }, |
| { |
| "epoch": 6.690705128205128, |
| "grad_norm": 0.9995337282018758, |
| "learning_rate": 2.398981956284363e-07, |
| "loss": 0.2531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1114429384469986, |
| "step": 4175, |
| "valid_targets_mean": 1883.6, |
| "valid_targets_min": 1075 |
| }, |
| { |
| "epoch": 6.698717948717949, |
| "grad_norm": 0.8561185272458319, |
| "learning_rate": 2.2771488120944207e-07, |
| "loss": 0.2402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11397942900657654, |
| "step": 4180, |
| "valid_targets_mean": 2592.9, |
| "valid_targets_min": 1095 |
| }, |
| { |
| "epoch": 6.706730769230769, |
| "grad_norm": 0.9740156202400301, |
| "learning_rate": 2.1584727796427174e-07, |
| "loss": 0.2387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14512796700000763, |
| "step": 4185, |
| "valid_targets_mean": 2518.9, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 6.714743589743589, |
| "grad_norm": 1.1588496532617867, |
| "learning_rate": 2.0429557538720556e-07, |
| "loss": 0.2329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1153675764799118, |
| "step": 4190, |
| "valid_targets_mean": 2192.1, |
| "valid_targets_min": 1588 |
| }, |
| { |
| "epoch": 6.722756410256411, |
| "grad_norm": 0.8519923964077011, |
| "learning_rate": 1.930599579284298e-07, |
| "loss": 0.2283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10996921360492706, |
| "step": 4195, |
| "valid_targets_mean": 2487.8, |
| "valid_targets_min": 1049 |
| }, |
| { |
| "epoch": 6.730769230769231, |
| "grad_norm": 1.0100576905261862, |
| "learning_rate": 1.8214060499107679e-07, |
| "loss": 0.2561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1439555585384369, |
| "step": 4200, |
| "valid_targets_mean": 2279.6, |
| "valid_targets_min": 1079 |
| }, |
| { |
| "epoch": 6.738782051282051, |
| "grad_norm": 0.8166556725836737, |
| "learning_rate": 1.7153769092837614e-07, |
| "loss": 0.2148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10187620669603348, |
| "step": 4205, |
| "valid_targets_mean": 3076.2, |
| "valid_targets_min": 1198 |
| }, |
| { |
| "epoch": 6.746794871794872, |
| "grad_norm": 0.8522985195219519, |
| "learning_rate": 1.6125138504086146e-07, |
| "loss": 0.2387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.122517429292202, |
| "step": 4210, |
| "valid_targets_mean": 2788.5, |
| "valid_targets_min": 1052 |
| }, |
| { |
| "epoch": 6.7548076923076925, |
| "grad_norm": 1.04741022514734, |
| "learning_rate": 1.5128185157367247e-07, |
| "loss": 0.2353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11223140358924866, |
| "step": 4215, |
| "valid_targets_mean": 1682.9, |
| "valid_targets_min": 944 |
| }, |
| { |
| "epoch": 6.762820512820513, |
| "grad_norm": 1.0466928727574043, |
| "learning_rate": 1.4162924971393044e-07, |
| "loss": 0.2618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1298060417175293, |
| "step": 4220, |
| "valid_targets_mean": 1969.2, |
| "valid_targets_min": 292 |
| }, |
| { |
| "epoch": 6.770833333333333, |
| "grad_norm": 0.8061561581755782, |
| "learning_rate": 1.322937335881891e-07, |
| "loss": 0.2473, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16025656461715698, |
| "step": 4225, |
| "valid_targets_mean": 3525.5, |
| "valid_targets_min": 877 |
| }, |
| { |
| "epoch": 6.778846153846154, |
| "grad_norm": 0.9449521007617103, |
| "learning_rate": 1.2327545225999215e-07, |
| "loss": 0.2318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11590196937322617, |
| "step": 4230, |
| "valid_targets_mean": 2609.0, |
| "valid_targets_min": 1021 |
| }, |
| { |
| "epoch": 6.7868589743589745, |
| "grad_norm": 0.925371088266695, |
| "learning_rate": 1.145745497274664e-07, |
| "loss": 0.2468, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14536672830581665, |
| "step": 4235, |
| "valid_targets_mean": 2727.6, |
| "valid_targets_min": 1387 |
| }, |
| { |
| "epoch": 6.794871794871795, |
| "grad_norm": 0.7532084104831867, |
| "learning_rate": 1.061911649210523e-07, |
| "loss": 0.226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07455575466156006, |
| "step": 4240, |
| "valid_targets_mean": 2051.8, |
| "valid_targets_min": 371 |
| }, |
| { |
| "epoch": 6.802884615384615, |
| "grad_norm": 0.9954452940831777, |
| "learning_rate": 9.812543170126365e-08, |
| "loss": 0.2346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11818395555019379, |
| "step": 4245, |
| "valid_targets_mean": 2523.9, |
| "valid_targets_min": 1100 |
| }, |
| { |
| "epoch": 6.810897435897436, |
| "grad_norm": 0.8810844606785796, |
| "learning_rate": 9.03774788565559e-08, |
| "loss": 0.2445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10779982805252075, |
| "step": 4250, |
| "valid_targets_mean": 2419.9, |
| "valid_targets_min": 1234 |
| }, |
| { |
| "epoch": 6.818910256410256, |
| "grad_norm": 0.7587255090249656, |
| "learning_rate": 8.294743010127448e-08, |
| "loss": 0.2293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09742031991481781, |
| "step": 4255, |
| "valid_targets_mean": 2819.4, |
| "valid_targets_min": 1493 |
| }, |
| { |
| "epoch": 6.826923076923077, |
| "grad_norm": 0.9186887291366199, |
| "learning_rate": 7.583540407367418e-08, |
| "loss": 0.2325, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11129537224769592, |
| "step": 4260, |
| "valid_targets_mean": 2361.5, |
| "valid_targets_min": 1146 |
| }, |
| { |
| "epoch": 6.834935897435898, |
| "grad_norm": 0.8638613619075678, |
| "learning_rate": 6.904151433402728e-08, |
| "loss": 0.2296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10862366110086441, |
| "step": 4265, |
| "valid_targets_mean": 2177.1, |
| "valid_targets_min": 1521 |
| }, |
| { |
| "epoch": 6.842948717948718, |
| "grad_norm": 0.887431984510552, |
| "learning_rate": 6.256586936281172e-08, |
| "loss": 0.2467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12638813257217407, |
| "step": 4270, |
| "valid_targets_mean": 2991.6, |
| "valid_targets_min": 1543 |
| }, |
| { |
| "epoch": 6.850961538461538, |
| "grad_norm": 1.0013091054241623, |
| "learning_rate": 5.6408572558972475e-08, |
| "loss": 0.2323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11181466281414032, |
| "step": 4275, |
| "valid_targets_mean": 1893.5, |
| "valid_targets_min": 1160 |
| }, |
| { |
| "epoch": 6.858974358974359, |
| "grad_norm": 1.0227568011240404, |
| "learning_rate": 5.0569722238280605e-08, |
| "loss": 0.246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16308793425559998, |
| "step": 4280, |
| "valid_targets_mean": 2498.2, |
| "valid_targets_min": 997 |
| }, |
| { |
| "epoch": 6.86698717948718, |
| "grad_norm": 0.9842765844108, |
| "learning_rate": 4.504941163175236e-08, |
| "loss": 0.242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12176279723644257, |
| "step": 4285, |
| "valid_targets_mean": 1907.0, |
| "valid_targets_min": 953 |
| }, |
| { |
| "epoch": 6.875, |
| "grad_norm": 1.3291503879689117, |
| "learning_rate": 3.984772888417032e-08, |
| "loss": 0.2296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11058434844017029, |
| "step": 4290, |
| "valid_targets_mean": 2407.4, |
| "valid_targets_min": 1244 |
| }, |
| { |
| "epoch": 6.88301282051282, |
| "grad_norm": 0.7907667503962194, |
| "learning_rate": 3.4964757052671216e-08, |
| "loss": 0.2245, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.07719993591308594, |
| "step": 4295, |
| "valid_targets_mean": 2425.5, |
| "valid_targets_min": 882 |
| }, |
| { |
| "epoch": 6.891025641025641, |
| "grad_norm": 0.9147924117446959, |
| "learning_rate": 3.0400574105415856e-08, |
| "loss": 0.2184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11411920189857483, |
| "step": 4300, |
| "valid_targets_mean": 2327.2, |
| "valid_targets_min": 1051 |
| }, |
| { |
| "epoch": 6.899038461538462, |
| "grad_norm": 0.8184445022532079, |
| "learning_rate": 2.615525292035459e-08, |
| "loss": 0.2269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10698746144771576, |
| "step": 4305, |
| "valid_targets_mean": 3427.0, |
| "valid_targets_min": 1359 |
| }, |
| { |
| "epoch": 6.907051282051282, |
| "grad_norm": 0.969049875717242, |
| "learning_rate": 2.222886128405266e-08, |
| "loss": 0.2434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09935212880373001, |
| "step": 4310, |
| "valid_targets_mean": 2346.5, |
| "valid_targets_min": 446 |
| }, |
| { |
| "epoch": 6.915064102564102, |
| "grad_norm": 0.8366135689501649, |
| "learning_rate": 1.8621461890617752e-08, |
| "loss": 0.2376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10085824131965637, |
| "step": 4315, |
| "valid_targets_mean": 2112.9, |
| "valid_targets_min": 1382 |
| }, |
| { |
| "epoch": 6.923076923076923, |
| "grad_norm": 0.9757835486083863, |
| "learning_rate": 1.5333112340687463e-08, |
| "loss": 0.243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1587846875190735, |
| "step": 4320, |
| "valid_targets_mean": 2357.0, |
| "valid_targets_min": 845 |
| }, |
| { |
| "epoch": 6.931089743589744, |
| "grad_norm": 0.7896507256157604, |
| "learning_rate": 1.2363865140518905e-08, |
| "loss": 0.2664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1322735846042633, |
| "step": 4325, |
| "valid_targets_mean": 2378.5, |
| "valid_targets_min": 1000 |
| }, |
| { |
| "epoch": 6.939102564102564, |
| "grad_norm": 0.7394443171363577, |
| "learning_rate": 9.713767701151621e-09, |
| "loss": 0.2228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10028460621833801, |
| "step": 4330, |
| "valid_targets_mean": 3140.5, |
| "valid_targets_min": 1022 |
| }, |
| { |
| "epoch": 6.947115384615385, |
| "grad_norm": 0.937378550902355, |
| "learning_rate": 7.382862337641516e-09, |
| "loss": 0.2423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1184074729681015, |
| "step": 4335, |
| "valid_targets_mean": 2002.2, |
| "valid_targets_min": 883 |
| }, |
| { |
| "epoch": 6.955128205128205, |
| "grad_norm": 0.8929545659767167, |
| "learning_rate": 5.371186268390283e-09, |
| "loss": 0.2459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.0951998233795166, |
| "step": 4340, |
| "valid_targets_mean": 2122.8, |
| "valid_targets_min": 385 |
| }, |
| { |
| "epoch": 6.9631410256410255, |
| "grad_norm": 0.8450524750277165, |
| "learning_rate": 3.678771614550325e-09, |
| "loss": 0.261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1101217120885849, |
| "step": 4345, |
| "valid_targets_mean": 1946.5, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 6.971153846153846, |
| "grad_norm": 0.8222550737458072, |
| "learning_rate": 2.3056453995162763e-09, |
| "loss": 0.2313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06940317898988724, |
| "step": 4350, |
| "valid_targets_mean": 1825.2, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 6.979166666666667, |
| "grad_norm": 0.9510199952831588, |
| "learning_rate": 1.2518295484875708e-09, |
| "loss": 0.2619, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10881343483924866, |
| "step": 4355, |
| "valid_targets_mean": 1923.4, |
| "valid_targets_min": 672 |
| }, |
| { |
| "epoch": 6.987179487179487, |
| "grad_norm": 0.9425580090389156, |
| "learning_rate": 5.173408881198328e-10, |
| "loss": 0.2432, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1133669912815094, |
| "step": 4360, |
| "valid_targets_mean": 1864.9, |
| "valid_targets_min": 1216 |
| }, |
| { |
| "epoch": 6.9951923076923075, |
| "grad_norm": 0.9452987456146136, |
| "learning_rate": 1.0219114625398263e-10, |
| "loss": 0.2363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13046550750732422, |
| "step": 4365, |
| "valid_targets_mean": 2728.5, |
| "valid_targets_min": 1249 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.06942301988601685, |
| "step": 4368, |
| "total_flos": 7.09204861186474e+17, |
| "train_loss": 0.32849771289270874, |
| "train_runtime": 20331.9971, |
| "train_samples_per_second": 3.436, |
| "train_steps_per_second": 0.215, |
| "valid_targets_mean": 1305.1, |
| "valid_targets_min": 490 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 4368, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 1500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 7.09204861186474e+17, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|