| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 4662, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.0075075075075075074, |
| "grad_norm": 11.018023139973177, |
| "learning_rate": 3.426124197002142e-07, |
| "loss": 0.6962, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.666359007358551, |
| "step": 5, |
| "valid_targets_mean": 3406.2, |
| "valid_targets_min": 590 |
| }, |
| { |
| "epoch": 0.015015015015015015, |
| "grad_norm": 14.300498234778246, |
| "learning_rate": 7.708779443254819e-07, |
| "loss": 0.6812, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7260710597038269, |
| "step": 10, |
| "valid_targets_mean": 2929.3, |
| "valid_targets_min": 540 |
| }, |
| { |
| "epoch": 0.02252252252252252, |
| "grad_norm": 10.308334513580103, |
| "learning_rate": 1.1991434689507496e-06, |
| "loss": 0.694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.7622815370559692, |
| "step": 15, |
| "valid_targets_mean": 4942.4, |
| "valid_targets_min": 474 |
| }, |
| { |
| "epoch": 0.03003003003003003, |
| "grad_norm": 9.480467405179247, |
| "learning_rate": 1.6274089935760173e-06, |
| "loss": 0.63, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5915040969848633, |
| "step": 20, |
| "valid_targets_mean": 4988.7, |
| "valid_targets_min": 506 |
| }, |
| { |
| "epoch": 0.03753753753753754, |
| "grad_norm": 6.98322327787682, |
| "learning_rate": 2.055674518201285e-06, |
| "loss": 0.634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6035254001617432, |
| "step": 25, |
| "valid_targets_mean": 4144.8, |
| "valid_targets_min": 406 |
| }, |
| { |
| "epoch": 0.04504504504504504, |
| "grad_norm": 4.519545202299929, |
| "learning_rate": 2.4839400428265524e-06, |
| "loss": 0.6108, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6693063974380493, |
| "step": 30, |
| "valid_targets_mean": 2645.9, |
| "valid_targets_min": 811 |
| }, |
| { |
| "epoch": 0.052552552552552555, |
| "grad_norm": 2.254075439509915, |
| "learning_rate": 2.9122055674518203e-06, |
| "loss": 0.583, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6287423968315125, |
| "step": 35, |
| "valid_targets_mean": 5337.9, |
| "valid_targets_min": 424 |
| }, |
| { |
| "epoch": 0.06006006006006006, |
| "grad_norm": 1.5869006029617074, |
| "learning_rate": 3.3404710920770882e-06, |
| "loss": 0.4981, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5136668682098389, |
| "step": 40, |
| "valid_targets_mean": 4675.1, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 0.06756756756756757, |
| "grad_norm": 1.2871585570908246, |
| "learning_rate": 3.7687366167023558e-06, |
| "loss": 0.498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4761298894882202, |
| "step": 45, |
| "valid_targets_mean": 4580.2, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 0.07507507507507508, |
| "grad_norm": 1.1073292407135484, |
| "learning_rate": 4.197002141327624e-06, |
| "loss": 0.4618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4800295829772949, |
| "step": 50, |
| "valid_targets_mean": 3829.7, |
| "valid_targets_min": 408 |
| }, |
| { |
| "epoch": 0.08258258258258258, |
| "grad_norm": 0.8919504665868666, |
| "learning_rate": 4.625267665952891e-06, |
| "loss": 0.5237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.525561511516571, |
| "step": 55, |
| "valid_targets_mean": 5515.5, |
| "valid_targets_min": 571 |
| }, |
| { |
| "epoch": 0.09009009009009009, |
| "grad_norm": 0.865780829661676, |
| "learning_rate": 5.05353319057816e-06, |
| "loss": 0.5163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5415364503860474, |
| "step": 60, |
| "valid_targets_mean": 3433.2, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 0.09759759759759759, |
| "grad_norm": 0.5872913252913201, |
| "learning_rate": 5.481798715203427e-06, |
| "loss": 0.4707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3888802230358124, |
| "step": 65, |
| "valid_targets_mean": 5232.6, |
| "valid_targets_min": 664 |
| }, |
| { |
| "epoch": 0.10510510510510511, |
| "grad_norm": 0.5994653626627001, |
| "learning_rate": 5.910064239828695e-06, |
| "loss": 0.4821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43450668454170227, |
| "step": 70, |
| "valid_targets_mean": 5187.1, |
| "valid_targets_min": 460 |
| }, |
| { |
| "epoch": 0.11261261261261261, |
| "grad_norm": 0.6662883071321841, |
| "learning_rate": 6.338329764453962e-06, |
| "loss": 0.4331, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3964645564556122, |
| "step": 75, |
| "valid_targets_mean": 3182.0, |
| "valid_targets_min": 880 |
| }, |
| { |
| "epoch": 0.12012012012012012, |
| "grad_norm": 0.6301518751447736, |
| "learning_rate": 6.76659528907923e-06, |
| "loss": 0.4374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37995022535324097, |
| "step": 80, |
| "valid_targets_mean": 3907.1, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 0.12762762762762764, |
| "grad_norm": 0.6479909629866574, |
| "learning_rate": 7.194860813704497e-06, |
| "loss": 0.4749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43532025814056396, |
| "step": 85, |
| "valid_targets_mean": 3381.8, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 0.13513513513513514, |
| "grad_norm": 0.601954910384077, |
| "learning_rate": 7.623126338329765e-06, |
| "loss": 0.449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37232670187950134, |
| "step": 90, |
| "valid_targets_mean": 3859.4, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 0.14264264264264265, |
| "grad_norm": 0.6010699211352588, |
| "learning_rate": 8.051391862955033e-06, |
| "loss": 0.4036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3912065625190735, |
| "step": 95, |
| "valid_targets_mean": 4532.2, |
| "valid_targets_min": 525 |
| }, |
| { |
| "epoch": 0.15015015015015015, |
| "grad_norm": 0.6776934870921543, |
| "learning_rate": 8.4796573875803e-06, |
| "loss": 0.4009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3918367922306061, |
| "step": 100, |
| "valid_targets_mean": 3923.7, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 0.15765765765765766, |
| "grad_norm": 0.5815397148408697, |
| "learning_rate": 8.907922912205568e-06, |
| "loss": 0.422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40705981850624084, |
| "step": 105, |
| "valid_targets_mean": 4907.4, |
| "valid_targets_min": 624 |
| }, |
| { |
| "epoch": 0.16516516516516516, |
| "grad_norm": 0.6207231229898003, |
| "learning_rate": 9.336188436830836e-06, |
| "loss": 0.4197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35407790541648865, |
| "step": 110, |
| "valid_targets_mean": 4749.1, |
| "valid_targets_min": 357 |
| }, |
| { |
| "epoch": 0.17267267267267267, |
| "grad_norm": 0.7161182478604338, |
| "learning_rate": 9.764453961456105e-06, |
| "loss": 0.4271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3748543858528137, |
| "step": 115, |
| "valid_targets_mean": 2599.0, |
| "valid_targets_min": 495 |
| }, |
| { |
| "epoch": 0.18018018018018017, |
| "grad_norm": 0.6433782885571062, |
| "learning_rate": 1.019271948608137e-05, |
| "loss": 0.4129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44952958822250366, |
| "step": 120, |
| "valid_targets_mean": 3456.8, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 0.18768768768768768, |
| "grad_norm": 0.608760987576289, |
| "learning_rate": 1.062098501070664e-05, |
| "loss": 0.396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4421440064907074, |
| "step": 125, |
| "valid_targets_mean": 4304.8, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 0.19519519519519518, |
| "grad_norm": 0.6056247540086898, |
| "learning_rate": 1.1049250535331907e-05, |
| "loss": 0.356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3524633049964905, |
| "step": 130, |
| "valid_targets_mean": 4378.4, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 0.20270270270270271, |
| "grad_norm": 0.7470542876873747, |
| "learning_rate": 1.1477516059957175e-05, |
| "loss": 0.3928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3509212136268616, |
| "step": 135, |
| "valid_targets_mean": 3348.1, |
| "valid_targets_min": 580 |
| }, |
| { |
| "epoch": 0.21021021021021022, |
| "grad_norm": 0.5297517332166896, |
| "learning_rate": 1.1905781584582443e-05, |
| "loss": 0.3971, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3493044376373291, |
| "step": 140, |
| "valid_targets_mean": 4820.6, |
| "valid_targets_min": 588 |
| }, |
| { |
| "epoch": 0.21771771771771772, |
| "grad_norm": 0.8236972811131019, |
| "learning_rate": 1.233404710920771e-05, |
| "loss": 0.4229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4382990002632141, |
| "step": 145, |
| "valid_targets_mean": 4910.1, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 0.22522522522522523, |
| "grad_norm": 0.5641188867988419, |
| "learning_rate": 1.2762312633832978e-05, |
| "loss": 0.4053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4189315438270569, |
| "step": 150, |
| "valid_targets_mean": 4847.2, |
| "valid_targets_min": 479 |
| }, |
| { |
| "epoch": 0.23273273273273273, |
| "grad_norm": 0.759436996305121, |
| "learning_rate": 1.3190578158458245e-05, |
| "loss": 0.3995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4512358009815216, |
| "step": 155, |
| "valid_targets_mean": 3609.1, |
| "valid_targets_min": 660 |
| }, |
| { |
| "epoch": 0.24024024024024024, |
| "grad_norm": 0.5776616654260357, |
| "learning_rate": 1.3618843683083513e-05, |
| "loss": 0.3982, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.366862416267395, |
| "step": 160, |
| "valid_targets_mean": 4489.5, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 0.24774774774774774, |
| "grad_norm": 0.5621030834623711, |
| "learning_rate": 1.404710920770878e-05, |
| "loss": 0.3562, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3245847225189209, |
| "step": 165, |
| "valid_targets_mean": 3611.0, |
| "valid_targets_min": 857 |
| }, |
| { |
| "epoch": 0.2552552552552553, |
| "grad_norm": 0.6383475705856398, |
| "learning_rate": 1.4475374732334048e-05, |
| "loss": 0.3633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3641152083873749, |
| "step": 170, |
| "valid_targets_mean": 3776.7, |
| "valid_targets_min": 273 |
| }, |
| { |
| "epoch": 0.2627627627627628, |
| "grad_norm": 0.6387883870614447, |
| "learning_rate": 1.4903640256959315e-05, |
| "loss": 0.3892, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4122806787490845, |
| "step": 175, |
| "valid_targets_mean": 4106.8, |
| "valid_targets_min": 367 |
| }, |
| { |
| "epoch": 0.2702702702702703, |
| "grad_norm": 0.5859730062305724, |
| "learning_rate": 1.5331905781584583e-05, |
| "loss": 0.4145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4545392692089081, |
| "step": 180, |
| "valid_targets_mean": 5412.8, |
| "valid_targets_min": 485 |
| }, |
| { |
| "epoch": 0.2777777777777778, |
| "grad_norm": 0.6291566957212851, |
| "learning_rate": 1.576017130620985e-05, |
| "loss": 0.3586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34801965951919556, |
| "step": 185, |
| "valid_targets_mean": 3683.8, |
| "valid_targets_min": 388 |
| }, |
| { |
| "epoch": 0.2852852852852853, |
| "grad_norm": 0.7714952807971188, |
| "learning_rate": 1.618843683083512e-05, |
| "loss": 0.4031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33357149362564087, |
| "step": 190, |
| "valid_targets_mean": 3992.8, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 0.2927927927927928, |
| "grad_norm": 0.6022688124054402, |
| "learning_rate": 1.6616702355460387e-05, |
| "loss": 0.3632, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32963526248931885, |
| "step": 195, |
| "valid_targets_mean": 4479.6, |
| "valid_targets_min": 376 |
| }, |
| { |
| "epoch": 0.3003003003003003, |
| "grad_norm": 0.5461125797479052, |
| "learning_rate": 1.7044967880085653e-05, |
| "loss": 0.3609, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3471255898475647, |
| "step": 200, |
| "valid_targets_mean": 5124.2, |
| "valid_targets_min": 2440 |
| }, |
| { |
| "epoch": 0.3078078078078078, |
| "grad_norm": 0.6479231652954496, |
| "learning_rate": 1.7473233404710924e-05, |
| "loss": 0.3709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36097437143325806, |
| "step": 205, |
| "valid_targets_mean": 3874.2, |
| "valid_targets_min": 536 |
| }, |
| { |
| "epoch": 0.3153153153153153, |
| "grad_norm": 0.6307321400936947, |
| "learning_rate": 1.790149892933619e-05, |
| "loss": 0.356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32168492674827576, |
| "step": 210, |
| "valid_targets_mean": 4215.9, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 0.3228228228228228, |
| "grad_norm": 0.7342733098843338, |
| "learning_rate": 1.8329764453961457e-05, |
| "loss": 0.3716, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3192724585533142, |
| "step": 215, |
| "valid_targets_mean": 3300.5, |
| "valid_targets_min": 465 |
| }, |
| { |
| "epoch": 0.3303303303303303, |
| "grad_norm": 0.6269217295173055, |
| "learning_rate": 1.8758029978586724e-05, |
| "loss": 0.382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.393771767616272, |
| "step": 220, |
| "valid_targets_mean": 3780.5, |
| "valid_targets_min": 520 |
| }, |
| { |
| "epoch": 0.33783783783783783, |
| "grad_norm": 0.6699586606597604, |
| "learning_rate": 1.9186295503211994e-05, |
| "loss": 0.3367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3441130518913269, |
| "step": 225, |
| "valid_targets_mean": 3570.4, |
| "valid_targets_min": 367 |
| }, |
| { |
| "epoch": 0.34534534534534533, |
| "grad_norm": 0.6212030440388314, |
| "learning_rate": 1.961456102783726e-05, |
| "loss": 0.3249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28860020637512207, |
| "step": 230, |
| "valid_targets_mean": 4043.8, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 0.35285285285285284, |
| "grad_norm": 0.5933247879185318, |
| "learning_rate": 2.004282655246253e-05, |
| "loss": 0.3663, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2963605523109436, |
| "step": 235, |
| "valid_targets_mean": 4519.4, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 0.36036036036036034, |
| "grad_norm": 0.5915857140141431, |
| "learning_rate": 2.0471092077087794e-05, |
| "loss": 0.3707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3590105175971985, |
| "step": 240, |
| "valid_targets_mean": 4801.9, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 0.36786786786786785, |
| "grad_norm": 0.6926624493340766, |
| "learning_rate": 2.089935760171306e-05, |
| "loss": 0.3699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3375079035758972, |
| "step": 245, |
| "valid_targets_mean": 3064.8, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 0.37537537537537535, |
| "grad_norm": 0.5625060900455121, |
| "learning_rate": 2.1327623126338334e-05, |
| "loss": 0.3717, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2878052592277527, |
| "step": 250, |
| "valid_targets_mean": 4984.9, |
| "valid_targets_min": 389 |
| }, |
| { |
| "epoch": 0.38288288288288286, |
| "grad_norm": 0.4895346484151352, |
| "learning_rate": 2.17558886509636e-05, |
| "loss": 0.3319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3224838972091675, |
| "step": 255, |
| "valid_targets_mean": 5919.2, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 0.39039039039039036, |
| "grad_norm": 0.6186907667129198, |
| "learning_rate": 2.2184154175588867e-05, |
| "loss": 0.3133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3299029767513275, |
| "step": 260, |
| "valid_targets_mean": 4151.9, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 0.3978978978978979, |
| "grad_norm": 0.637540257330486, |
| "learning_rate": 2.2612419700214137e-05, |
| "loss": 0.3034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31127655506134033, |
| "step": 265, |
| "valid_targets_mean": 4565.4, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 0.40540540540540543, |
| "grad_norm": 0.6482997719326944, |
| "learning_rate": 2.3040685224839404e-05, |
| "loss": 0.371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3371477723121643, |
| "step": 270, |
| "valid_targets_mean": 4799.7, |
| "valid_targets_min": 565 |
| }, |
| { |
| "epoch": 0.41291291291291293, |
| "grad_norm": 0.630240697831865, |
| "learning_rate": 2.346895074946467e-05, |
| "loss": 0.4042, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3549198508262634, |
| "step": 275, |
| "valid_targets_mean": 3973.2, |
| "valid_targets_min": 571 |
| }, |
| { |
| "epoch": 0.42042042042042044, |
| "grad_norm": 0.5378005948550142, |
| "learning_rate": 2.3897216274089937e-05, |
| "loss": 0.3568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3140275776386261, |
| "step": 280, |
| "valid_targets_mean": 4524.4, |
| "valid_targets_min": 466 |
| }, |
| { |
| "epoch": 0.42792792792792794, |
| "grad_norm": 0.5496707584360776, |
| "learning_rate": 2.4325481798715207e-05, |
| "loss": 0.3439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27984702587127686, |
| "step": 285, |
| "valid_targets_mean": 5251.4, |
| "valid_targets_min": 871 |
| }, |
| { |
| "epoch": 0.43543543543543545, |
| "grad_norm": 0.6054529261217243, |
| "learning_rate": 2.4753747323340474e-05, |
| "loss": 0.3399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2717384994029999, |
| "step": 290, |
| "valid_targets_mean": 5978.3, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 0.44294294294294295, |
| "grad_norm": 0.60946853866193, |
| "learning_rate": 2.518201284796574e-05, |
| "loss": 0.3324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31978553533554077, |
| "step": 295, |
| "valid_targets_mean": 3610.3, |
| "valid_targets_min": 729 |
| }, |
| { |
| "epoch": 0.45045045045045046, |
| "grad_norm": 0.7112237553385803, |
| "learning_rate": 2.5610278372591007e-05, |
| "loss": 0.365, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36318349838256836, |
| "step": 300, |
| "valid_targets_mean": 2997.6, |
| "valid_targets_min": 398 |
| }, |
| { |
| "epoch": 0.45795795795795796, |
| "grad_norm": 0.5754561363093669, |
| "learning_rate": 2.6038543897216277e-05, |
| "loss": 0.3475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3775876760482788, |
| "step": 305, |
| "valid_targets_mean": 5485.2, |
| "valid_targets_min": 291 |
| }, |
| { |
| "epoch": 0.46546546546546547, |
| "grad_norm": 0.5225836627231101, |
| "learning_rate": 2.6466809421841544e-05, |
| "loss": 0.3327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2630726099014282, |
| "step": 310, |
| "valid_targets_mean": 5477.4, |
| "valid_targets_min": 1953 |
| }, |
| { |
| "epoch": 0.47297297297297297, |
| "grad_norm": 0.6631066150226813, |
| "learning_rate": 2.689507494646681e-05, |
| "loss": 0.3341, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4078267812728882, |
| "step": 315, |
| "valid_targets_mean": 4227.4, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 0.4804804804804805, |
| "grad_norm": 0.5625056894327084, |
| "learning_rate": 2.732334047109208e-05, |
| "loss": 0.3307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34400713443756104, |
| "step": 320, |
| "valid_targets_mean": 6082.6, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 0.487987987987988, |
| "grad_norm": 0.5720940827291631, |
| "learning_rate": 2.7751605995717347e-05, |
| "loss": 0.3544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.364154189825058, |
| "step": 325, |
| "valid_targets_mean": 5058.0, |
| "valid_targets_min": 1324 |
| }, |
| { |
| "epoch": 0.4954954954954955, |
| "grad_norm": 0.6142764560167397, |
| "learning_rate": 2.8179871520342614e-05, |
| "loss": 0.3567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3340011239051819, |
| "step": 330, |
| "valid_targets_mean": 3809.8, |
| "valid_targets_min": 606 |
| }, |
| { |
| "epoch": 0.503003003003003, |
| "grad_norm": 0.6862489554890606, |
| "learning_rate": 2.860813704496788e-05, |
| "loss": 0.3377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.347086638212204, |
| "step": 335, |
| "valid_targets_mean": 3381.4, |
| "valid_targets_min": 529 |
| }, |
| { |
| "epoch": 0.5105105105105106, |
| "grad_norm": 0.5884162448896875, |
| "learning_rate": 2.903640256959315e-05, |
| "loss": 0.3156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3551441431045532, |
| "step": 340, |
| "valid_targets_mean": 4280.0, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 0.5180180180180181, |
| "grad_norm": 0.5985519809481195, |
| "learning_rate": 2.9464668094218417e-05, |
| "loss": 0.3718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3538270592689514, |
| "step": 345, |
| "valid_targets_mean": 4933.6, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 0.5255255255255256, |
| "grad_norm": 0.6608489868770677, |
| "learning_rate": 2.9892933618843684e-05, |
| "loss": 0.3821, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3977230191230774, |
| "step": 350, |
| "valid_targets_mean": 4619.8, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 0.5330330330330331, |
| "grad_norm": 0.6666435654761541, |
| "learning_rate": 3.032119914346895e-05, |
| "loss": 0.3205, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3276807963848114, |
| "step": 355, |
| "valid_targets_mean": 3228.0, |
| "valid_targets_min": 396 |
| }, |
| { |
| "epoch": 0.5405405405405406, |
| "grad_norm": 0.5700169845584041, |
| "learning_rate": 3.0749464668094224e-05, |
| "loss": 0.3373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.252112478017807, |
| "step": 360, |
| "valid_targets_mean": 4043.2, |
| "valid_targets_min": 470 |
| }, |
| { |
| "epoch": 0.5480480480480481, |
| "grad_norm": 0.5969317196396643, |
| "learning_rate": 3.117773019271949e-05, |
| "loss": 0.3344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.257426917552948, |
| "step": 365, |
| "valid_targets_mean": 3501.2, |
| "valid_targets_min": 637 |
| }, |
| { |
| "epoch": 0.5555555555555556, |
| "grad_norm": 0.5338582932799799, |
| "learning_rate": 3.160599571734476e-05, |
| "loss": 0.3469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4118390679359436, |
| "step": 370, |
| "valid_targets_mean": 6022.6, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 0.5630630630630631, |
| "grad_norm": 0.7156868770693144, |
| "learning_rate": 3.2034261241970024e-05, |
| "loss": 0.342, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33580997586250305, |
| "step": 375, |
| "valid_targets_mean": 3146.6, |
| "valid_targets_min": 580 |
| }, |
| { |
| "epoch": 0.5705705705705706, |
| "grad_norm": 0.6105442252909425, |
| "learning_rate": 3.246252676659529e-05, |
| "loss": 0.3246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29976391792297363, |
| "step": 380, |
| "valid_targets_mean": 4423.6, |
| "valid_targets_min": 579 |
| }, |
| { |
| "epoch": 0.5780780780780781, |
| "grad_norm": 0.48535869781119606, |
| "learning_rate": 3.289079229122056e-05, |
| "loss": 0.3211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2958953380584717, |
| "step": 385, |
| "valid_targets_mean": 5096.5, |
| "valid_targets_min": 1111 |
| }, |
| { |
| "epoch": 0.5855855855855856, |
| "grad_norm": 0.5293285996606892, |
| "learning_rate": 3.3319057815845824e-05, |
| "loss": 0.3012, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29280033707618713, |
| "step": 390, |
| "valid_targets_mean": 4133.6, |
| "valid_targets_min": 664 |
| }, |
| { |
| "epoch": 0.5930930930930931, |
| "grad_norm": 0.6364074446274751, |
| "learning_rate": 3.37473233404711e-05, |
| "loss": 0.3546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3336215019226074, |
| "step": 395, |
| "valid_targets_mean": 3474.1, |
| "valid_targets_min": 277 |
| }, |
| { |
| "epoch": 0.6006006006006006, |
| "grad_norm": 0.7064277061832516, |
| "learning_rate": 3.4175588865096364e-05, |
| "loss": 0.3238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38183677196502686, |
| "step": 400, |
| "valid_targets_mean": 4343.8, |
| "valid_targets_min": 831 |
| }, |
| { |
| "epoch": 0.6081081081081081, |
| "grad_norm": 0.5234255969114723, |
| "learning_rate": 3.460385438972163e-05, |
| "loss": 0.3259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3263946771621704, |
| "step": 405, |
| "valid_targets_mean": 5912.4, |
| "valid_targets_min": 525 |
| }, |
| { |
| "epoch": 0.6156156156156156, |
| "grad_norm": 0.6859056535544392, |
| "learning_rate": 3.50321199143469e-05, |
| "loss": 0.3613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4518062472343445, |
| "step": 410, |
| "valid_targets_mean": 4294.0, |
| "valid_targets_min": 672 |
| }, |
| { |
| "epoch": 0.6231231231231231, |
| "grad_norm": 0.593812126409495, |
| "learning_rate": 3.5460385438972164e-05, |
| "loss": 0.3236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.284976601600647, |
| "step": 415, |
| "valid_targets_mean": 4542.8, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 0.6306306306306306, |
| "grad_norm": 0.5542761631226861, |
| "learning_rate": 3.588865096359743e-05, |
| "loss": 0.3575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3369911313056946, |
| "step": 420, |
| "valid_targets_mean": 4173.8, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 0.6381381381381381, |
| "grad_norm": 0.694482077890855, |
| "learning_rate": 3.63169164882227e-05, |
| "loss": 0.331, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35457199811935425, |
| "step": 425, |
| "valid_targets_mean": 3347.3, |
| "valid_targets_min": 323 |
| }, |
| { |
| "epoch": 0.6456456456456456, |
| "grad_norm": 0.5087776401105766, |
| "learning_rate": 3.674518201284797e-05, |
| "loss": 0.3077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2870054244995117, |
| "step": 430, |
| "valid_targets_mean": 5496.8, |
| "valid_targets_min": 995 |
| }, |
| { |
| "epoch": 0.6531531531531531, |
| "grad_norm": 0.5710934865190025, |
| "learning_rate": 3.717344753747324e-05, |
| "loss": 0.3449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3406960964202881, |
| "step": 435, |
| "valid_targets_mean": 4272.1, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 0.6606606606606606, |
| "grad_norm": 0.6532417856194169, |
| "learning_rate": 3.7601713062098504e-05, |
| "loss": 0.3358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3105970621109009, |
| "step": 440, |
| "valid_targets_mean": 4052.7, |
| "valid_targets_min": 469 |
| }, |
| { |
| "epoch": 0.6681681681681682, |
| "grad_norm": 0.5810179731496691, |
| "learning_rate": 3.802997858672377e-05, |
| "loss": 0.3534, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2967357933521271, |
| "step": 445, |
| "valid_targets_mean": 5399.5, |
| "valid_targets_min": 481 |
| }, |
| { |
| "epoch": 0.6756756756756757, |
| "grad_norm": 0.4933051723343659, |
| "learning_rate": 3.8458244111349045e-05, |
| "loss": 0.307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2656002640724182, |
| "step": 450, |
| "valid_targets_mean": 5050.2, |
| "valid_targets_min": 536 |
| }, |
| { |
| "epoch": 0.6831831831831832, |
| "grad_norm": 0.5117823141215931, |
| "learning_rate": 3.8886509635974305e-05, |
| "loss": 0.3345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3394744396209717, |
| "step": 455, |
| "valid_targets_mean": 4780.2, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 0.6906906906906907, |
| "grad_norm": 0.5513150421712305, |
| "learning_rate": 3.931477516059957e-05, |
| "loss": 0.3344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38678789138793945, |
| "step": 460, |
| "valid_targets_mean": 4995.6, |
| "valid_targets_min": 787 |
| }, |
| { |
| "epoch": 0.6981981981981982, |
| "grad_norm": 0.5223578821175074, |
| "learning_rate": 3.974304068522484e-05, |
| "loss": 0.3301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3217771053314209, |
| "step": 465, |
| "valid_targets_mean": 5331.4, |
| "valid_targets_min": 1007 |
| }, |
| { |
| "epoch": 0.7057057057057057, |
| "grad_norm": 0.5938737922502441, |
| "learning_rate": 3.999997756656772e-05, |
| "loss": 0.3306, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31824183464050293, |
| "step": 470, |
| "valid_targets_mean": 4223.0, |
| "valid_targets_min": 452 |
| }, |
| { |
| "epoch": 0.7132132132132132, |
| "grad_norm": 0.49626310595338613, |
| "learning_rate": 3.9999725191032436e-05, |
| "loss": 0.2875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26925772428512573, |
| "step": 475, |
| "valid_targets_mean": 5763.9, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 0.7207207207207207, |
| "grad_norm": 0.6276161448251935, |
| "learning_rate": 3.999919240172184e-05, |
| "loss": 0.3228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.325122594833374, |
| "step": 480, |
| "valid_targets_mean": 4395.4, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 0.7282282282282282, |
| "grad_norm": 0.598897987227093, |
| "learning_rate": 3.9998379206106104e-05, |
| "loss": 0.2941, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2764396369457245, |
| "step": 485, |
| "valid_targets_mean": 5031.5, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 0.7357357357357357, |
| "grad_norm": 0.5920738798268582, |
| "learning_rate": 3.9997285615586944e-05, |
| "loss": 0.3449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33547401428222656, |
| "step": 490, |
| "valid_targets_mean": 4218.7, |
| "valid_targets_min": 416 |
| }, |
| { |
| "epoch": 0.7432432432432432, |
| "grad_norm": 0.5388292737396405, |
| "learning_rate": 3.999591164549747e-05, |
| "loss": 0.3216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30026373267173767, |
| "step": 495, |
| "valid_targets_mean": 5046.2, |
| "valid_targets_min": 885 |
| }, |
| { |
| "epoch": 0.7507507507507507, |
| "grad_norm": 0.7138413019632255, |
| "learning_rate": 3.999425731510195e-05, |
| "loss": 0.3161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3095625340938568, |
| "step": 500, |
| "valid_targets_mean": 3115.5, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 0.7582582582582582, |
| "grad_norm": 0.5065067605354636, |
| "learning_rate": 3.9992322647595543e-05, |
| "loss": 0.3132, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2668853998184204, |
| "step": 505, |
| "valid_targets_mean": 4890.2, |
| "valid_targets_min": 583 |
| }, |
| { |
| "epoch": 0.7657657657657657, |
| "grad_norm": 0.48772270569522996, |
| "learning_rate": 3.999010767010401e-05, |
| "loss": 0.2792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21127644181251526, |
| "step": 510, |
| "valid_targets_mean": 4030.5, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 0.7732732732732732, |
| "grad_norm": 0.688910852981923, |
| "learning_rate": 3.998761241368328e-05, |
| "loss": 0.3356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31102752685546875, |
| "step": 515, |
| "valid_targets_mean": 2963.6, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 0.7807807807807807, |
| "grad_norm": 0.590399156229966, |
| "learning_rate": 3.9984836913319044e-05, |
| "loss": 0.3022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.295174777507782, |
| "step": 520, |
| "valid_targets_mean": 3820.8, |
| "valid_targets_min": 547 |
| }, |
| { |
| "epoch": 0.7882882882882883, |
| "grad_norm": 0.7498553089205983, |
| "learning_rate": 3.998178120792627e-05, |
| "loss": 0.3289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29107627272605896, |
| "step": 525, |
| "valid_targets_mean": 4623.9, |
| "valid_targets_min": 463 |
| }, |
| { |
| "epoch": 0.7957957957957958, |
| "grad_norm": 0.541430521248251, |
| "learning_rate": 3.9978445340348646e-05, |
| "loss": 0.3114, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35057809948921204, |
| "step": 530, |
| "valid_targets_mean": 4895.9, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 0.8033033033033034, |
| "grad_norm": 0.6145616694631061, |
| "learning_rate": 3.997482935735796e-05, |
| "loss": 0.2989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2825467586517334, |
| "step": 535, |
| "valid_targets_mean": 4079.4, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 0.8108108108108109, |
| "grad_norm": 0.6457216047110463, |
| "learning_rate": 3.997093330965349e-05, |
| "loss": 0.3289, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37978658080101013, |
| "step": 540, |
| "valid_targets_mean": 3493.6, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 0.8183183183183184, |
| "grad_norm": 0.5512024613609153, |
| "learning_rate": 3.9966757251861256e-05, |
| "loss": 0.3083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30473941564559937, |
| "step": 545, |
| "valid_targets_mean": 4363.6, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 0.8258258258258259, |
| "grad_norm": 0.5404758251655593, |
| "learning_rate": 3.996230124253328e-05, |
| "loss": 0.2928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2958792746067047, |
| "step": 550, |
| "valid_targets_mean": 4708.9, |
| "valid_targets_min": 480 |
| }, |
| { |
| "epoch": 0.8333333333333334, |
| "grad_norm": 0.5409326702314928, |
| "learning_rate": 3.995756534414672e-05, |
| "loss": 0.3015, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3055042028427124, |
| "step": 555, |
| "valid_targets_mean": 4889.0, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 0.8408408408408409, |
| "grad_norm": 0.877523092977663, |
| "learning_rate": 3.9952549623103065e-05, |
| "loss": 0.3031, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27620965242385864, |
| "step": 560, |
| "valid_targets_mean": 3901.4, |
| "valid_targets_min": 782 |
| }, |
| { |
| "epoch": 0.8483483483483484, |
| "grad_norm": 0.5593566066914221, |
| "learning_rate": 3.994725414972713e-05, |
| "loss": 0.331, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33034461736679077, |
| "step": 565, |
| "valid_targets_mean": 4464.5, |
| "valid_targets_min": 847 |
| }, |
| { |
| "epoch": 0.8558558558558559, |
| "grad_norm": 0.6652170124791761, |
| "learning_rate": 3.994167899826614e-05, |
| "loss": 0.2967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.258162260055542, |
| "step": 570, |
| "valid_targets_mean": 3842.9, |
| "valid_targets_min": 410 |
| }, |
| { |
| "epoch": 0.8633633633633634, |
| "grad_norm": 0.5319260103081287, |
| "learning_rate": 3.993582424688861e-05, |
| "loss": 0.2819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2436560094356537, |
| "step": 575, |
| "valid_targets_mean": 4503.2, |
| "valid_targets_min": 810 |
| }, |
| { |
| "epoch": 0.8708708708708709, |
| "grad_norm": 0.5435805707257723, |
| "learning_rate": 3.9929689977683315e-05, |
| "loss": 0.3088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2837572991847992, |
| "step": 580, |
| "valid_targets_mean": 4475.9, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 0.8783783783783784, |
| "grad_norm": 0.6279074659022925, |
| "learning_rate": 3.992327627665814e-05, |
| "loss": 0.3233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3020919859409332, |
| "step": 585, |
| "valid_targets_mean": 3179.3, |
| "valid_targets_min": 602 |
| }, |
| { |
| "epoch": 0.8858858858858859, |
| "grad_norm": 0.6751035596060991, |
| "learning_rate": 3.99165832337388e-05, |
| "loss": 0.3098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2893165349960327, |
| "step": 590, |
| "valid_targets_mean": 3005.4, |
| "valid_targets_min": 504 |
| }, |
| { |
| "epoch": 0.8933933933933934, |
| "grad_norm": 0.9253018906213728, |
| "learning_rate": 3.990961094276767e-05, |
| "loss": 0.3072, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3459416627883911, |
| "step": 595, |
| "valid_targets_mean": 2077.6, |
| "valid_targets_min": 485 |
| }, |
| { |
| "epoch": 0.9009009009009009, |
| "grad_norm": 0.6687225112938137, |
| "learning_rate": 3.990235950150242e-05, |
| "loss": 0.3079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36818212270736694, |
| "step": 600, |
| "valid_targets_mean": 3371.7, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 0.9084084084084084, |
| "grad_norm": 0.5328749806757945, |
| "learning_rate": 3.9894829011614627e-05, |
| "loss": 0.3135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25350844860076904, |
| "step": 605, |
| "valid_targets_mean": 3857.8, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 0.9159159159159159, |
| "grad_norm": 0.675741595187441, |
| "learning_rate": 3.988701957868842e-05, |
| "loss": 0.3172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3360707759857178, |
| "step": 610, |
| "valid_targets_mean": 2917.3, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 0.9234234234234234, |
| "grad_norm": 0.6571910621752247, |
| "learning_rate": 3.987893131221892e-05, |
| "loss": 0.2958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2482086569070816, |
| "step": 615, |
| "valid_targets_mean": 3313.1, |
| "valid_targets_min": 510 |
| }, |
| { |
| "epoch": 0.9309309309309309, |
| "grad_norm": 0.6979768745974733, |
| "learning_rate": 3.987056432561075e-05, |
| "loss": 0.3034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3537478744983673, |
| "step": 620, |
| "valid_targets_mean": 3899.6, |
| "valid_targets_min": 471 |
| }, |
| { |
| "epoch": 0.9384384384384384, |
| "grad_norm": 0.46982739010374835, |
| "learning_rate": 3.986191873617645e-05, |
| "loss": 0.318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27537375688552856, |
| "step": 625, |
| "valid_targets_mean": 5885.1, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 0.9459459459459459, |
| "grad_norm": 0.5400448261626185, |
| "learning_rate": 3.985299466513479e-05, |
| "loss": 0.3106, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3220127820968628, |
| "step": 630, |
| "valid_targets_mean": 4269.6, |
| "valid_targets_min": 558 |
| }, |
| { |
| "epoch": 0.9534534534534534, |
| "grad_norm": 0.5242379048874888, |
| "learning_rate": 3.984379223760912e-05, |
| "loss": 0.3102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.36460551619529724, |
| "step": 635, |
| "valid_targets_mean": 4742.2, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 0.960960960960961, |
| "grad_norm": 0.5056910710384006, |
| "learning_rate": 3.983431158262558e-05, |
| "loss": 0.2783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2684648334980011, |
| "step": 640, |
| "valid_targets_mean": 4608.9, |
| "valid_targets_min": 805 |
| }, |
| { |
| "epoch": 0.9684684684684685, |
| "grad_norm": 0.5297540154671703, |
| "learning_rate": 3.982455283311131e-05, |
| "loss": 0.325, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25975459814071655, |
| "step": 645, |
| "valid_targets_mean": 4382.8, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 0.975975975975976, |
| "grad_norm": 0.555629136176801, |
| "learning_rate": 3.981451612589259e-05, |
| "loss": 0.28, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26162397861480713, |
| "step": 650, |
| "valid_targets_mean": 4827.0, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 0.9834834834834835, |
| "grad_norm": 0.7355128171152777, |
| "learning_rate": 3.980420160169289e-05, |
| "loss": 0.2788, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28353631496429443, |
| "step": 655, |
| "valid_targets_mean": 4060.4, |
| "valid_targets_min": 766 |
| }, |
| { |
| "epoch": 0.990990990990991, |
| "grad_norm": 0.6098329219635357, |
| "learning_rate": 3.979360940513092e-05, |
| "loss": 0.3267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2917211651802063, |
| "step": 660, |
| "valid_targets_mean": 3110.2, |
| "valid_targets_min": 536 |
| }, |
| { |
| "epoch": 0.9984984984984985, |
| "grad_norm": 0.6602685528415261, |
| "learning_rate": 3.978273968471865e-05, |
| "loss": 0.3291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37517815828323364, |
| "step": 665, |
| "valid_targets_mean": 3097.9, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 1.006006006006006, |
| "grad_norm": 0.5990905965495634, |
| "learning_rate": 3.97715925928591e-05, |
| "loss": 0.3701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31573376059532166, |
| "step": 670, |
| "valid_targets_mean": 5335.8, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 1.0135135135135136, |
| "grad_norm": 0.5051572310687712, |
| "learning_rate": 3.9760168285844345e-05, |
| "loss": 0.2747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2896278500556946, |
| "step": 675, |
| "valid_targets_mean": 4987.1, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 1.021021021021021, |
| "grad_norm": 0.5358689615840903, |
| "learning_rate": 3.974846692385323e-05, |
| "loss": 0.2765, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29317814111709595, |
| "step": 680, |
| "valid_targets_mean": 5053.4, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 1.0285285285285286, |
| "grad_norm": 0.7789287894144826, |
| "learning_rate": 3.973648867094917e-05, |
| "loss": 0.3181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3238382935523987, |
| "step": 685, |
| "valid_targets_mean": 3482.4, |
| "valid_targets_min": 492 |
| }, |
| { |
| "epoch": 1.0360360360360361, |
| "grad_norm": 0.5563018194673951, |
| "learning_rate": 3.972423369507783e-05, |
| "loss": 0.3166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3259349465370178, |
| "step": 690, |
| "valid_targets_mean": 5252.0, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 1.0435435435435436, |
| "grad_norm": 0.7250068591194968, |
| "learning_rate": 3.971170216806477e-05, |
| "loss": 0.3198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3443298935890198, |
| "step": 695, |
| "valid_targets_mean": 2799.4, |
| "valid_targets_min": 588 |
| }, |
| { |
| "epoch": 1.0510510510510511, |
| "grad_norm": 0.7089445149146085, |
| "learning_rate": 3.969889426561304e-05, |
| "loss": 0.3328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31399601697921753, |
| "step": 700, |
| "valid_targets_mean": 3693.1, |
| "valid_targets_min": 606 |
| }, |
| { |
| "epoch": 1.0585585585585586, |
| "grad_norm": 0.4834579345868247, |
| "learning_rate": 3.968581016730073e-05, |
| "loss": 0.2893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28393715620040894, |
| "step": 705, |
| "valid_targets_mean": 5210.3, |
| "valid_targets_min": 1146 |
| }, |
| { |
| "epoch": 1.0660660660660661, |
| "grad_norm": 0.580488043726015, |
| "learning_rate": 3.9672450056578426e-05, |
| "loss": 0.3114, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3525095582008362, |
| "step": 710, |
| "valid_targets_mean": 4987.9, |
| "valid_targets_min": 872 |
| }, |
| { |
| "epoch": 1.0735735735735736, |
| "grad_norm": 0.5830757190666622, |
| "learning_rate": 3.965881412076665e-05, |
| "loss": 0.2927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2518344223499298, |
| "step": 715, |
| "valid_targets_mean": 3772.8, |
| "valid_targets_min": 301 |
| }, |
| { |
| "epoch": 1.0810810810810811, |
| "grad_norm": 0.603911299798853, |
| "learning_rate": 3.964490255105325e-05, |
| "loss": 0.2897, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2885856330394745, |
| "step": 720, |
| "valid_targets_mean": 3888.7, |
| "valid_targets_min": 610 |
| }, |
| { |
| "epoch": 1.0885885885885886, |
| "grad_norm": 0.721271255619491, |
| "learning_rate": 3.96307155424907e-05, |
| "loss": 0.3009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33753496408462524, |
| "step": 725, |
| "valid_targets_mean": 3255.9, |
| "valid_targets_min": 323 |
| }, |
| { |
| "epoch": 1.0960960960960962, |
| "grad_norm": 0.5688287102135644, |
| "learning_rate": 3.961625329399335e-05, |
| "loss": 0.288, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24445214867591858, |
| "step": 730, |
| "valid_targets_mean": 4295.9, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 1.1036036036036037, |
| "grad_norm": 0.5822780762193985, |
| "learning_rate": 3.960151600833469e-05, |
| "loss": 0.303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3242020606994629, |
| "step": 735, |
| "valid_targets_mean": 4509.4, |
| "valid_targets_min": 749 |
| }, |
| { |
| "epoch": 1.1111111111111112, |
| "grad_norm": 0.6988383396255673, |
| "learning_rate": 3.958650389214444e-05, |
| "loss": 0.2908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2766273021697998, |
| "step": 740, |
| "valid_targets_mean": 3003.1, |
| "valid_targets_min": 528 |
| }, |
| { |
| "epoch": 1.1186186186186187, |
| "grad_norm": 0.5530037303674098, |
| "learning_rate": 3.95712171559057e-05, |
| "loss": 0.2862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2562218904495239, |
| "step": 745, |
| "valid_targets_mean": 4301.1, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 1.1261261261261262, |
| "grad_norm": 0.5917466496490228, |
| "learning_rate": 3.955565601395199e-05, |
| "loss": 0.2995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27801835536956787, |
| "step": 750, |
| "valid_targets_mean": 4016.3, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 1.1336336336336337, |
| "grad_norm": 0.5314431651828969, |
| "learning_rate": 3.953982068446424e-05, |
| "loss": 0.274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2895042896270752, |
| "step": 755, |
| "valid_targets_mean": 4829.9, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 1.1411411411411412, |
| "grad_norm": 0.5403700692721292, |
| "learning_rate": 3.952371138946773e-05, |
| "loss": 0.311, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2900671660900116, |
| "step": 760, |
| "valid_targets_mean": 5102.2, |
| "valid_targets_min": 811 |
| }, |
| { |
| "epoch": 1.1486486486486487, |
| "grad_norm": 0.4466270912829498, |
| "learning_rate": 3.950732835482896e-05, |
| "loss": 0.2634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23144987225532532, |
| "step": 765, |
| "valid_targets_mean": 4800.4, |
| "valid_targets_min": 566 |
| }, |
| { |
| "epoch": 1.1561561561561562, |
| "grad_norm": 0.5126441976083996, |
| "learning_rate": 3.9490671810252525e-05, |
| "loss": 0.2738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2398991733789444, |
| "step": 770, |
| "valid_targets_mean": 3322.2, |
| "valid_targets_min": 260 |
| }, |
| { |
| "epoch": 1.1636636636636637, |
| "grad_norm": 0.6835376056729422, |
| "learning_rate": 3.947374198927787e-05, |
| "loss": 0.2818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2788790464401245, |
| "step": 775, |
| "valid_targets_mean": 2824.4, |
| "valid_targets_min": 481 |
| }, |
| { |
| "epoch": 1.1711711711711712, |
| "grad_norm": 0.7480255450833108, |
| "learning_rate": 3.945653912927599e-05, |
| "loss": 0.3116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41352379322052, |
| "step": 780, |
| "valid_targets_mean": 3108.0, |
| "valid_targets_min": 525 |
| }, |
| { |
| "epoch": 1.1786786786786787, |
| "grad_norm": 0.7012989879636262, |
| "learning_rate": 3.943906347144615e-05, |
| "loss": 0.2908, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2697921395301819, |
| "step": 785, |
| "valid_targets_mean": 2765.4, |
| "valid_targets_min": 559 |
| }, |
| { |
| "epoch": 1.1861861861861862, |
| "grad_norm": 0.6294134200242447, |
| "learning_rate": 3.942131526081249e-05, |
| "loss": 0.2965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28815174102783203, |
| "step": 790, |
| "valid_targets_mean": 5498.2, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 1.1936936936936937, |
| "grad_norm": 0.5405122434808368, |
| "learning_rate": 3.940329474622055e-05, |
| "loss": 0.3025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26721876859664917, |
| "step": 795, |
| "valid_targets_mean": 4779.1, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 1.2012012012012012, |
| "grad_norm": 0.6027467491848216, |
| "learning_rate": 3.938500218033384e-05, |
| "loss": 0.2749, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28523164987564087, |
| "step": 800, |
| "valid_targets_mean": 3985.0, |
| "valid_targets_min": 673 |
| }, |
| { |
| "epoch": 1.2087087087087087, |
| "grad_norm": 0.49337094306984625, |
| "learning_rate": 3.936643781963024e-05, |
| "loss": 0.3508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3622555136680603, |
| "step": 805, |
| "valid_targets_mean": 6322.6, |
| "valid_targets_min": 390 |
| }, |
| { |
| "epoch": 1.2162162162162162, |
| "grad_norm": 0.5183504295911457, |
| "learning_rate": 3.9347601924398475e-05, |
| "loss": 0.2833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2589194178581238, |
| "step": 810, |
| "valid_targets_mean": 4678.0, |
| "valid_targets_min": 899 |
| }, |
| { |
| "epoch": 1.2237237237237237, |
| "grad_norm": 0.5342990678808706, |
| "learning_rate": 3.932849475873438e-05, |
| "loss": 0.3152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2209431231021881, |
| "step": 815, |
| "valid_targets_mean": 4677.4, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 1.2312312312312312, |
| "grad_norm": 0.4783352437662895, |
| "learning_rate": 3.9309116590537266e-05, |
| "loss": 0.2653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2841101884841919, |
| "step": 820, |
| "valid_targets_mean": 4398.6, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 1.2387387387387387, |
| "grad_norm": 0.5066260881718098, |
| "learning_rate": 3.9289467691506125e-05, |
| "loss": 0.3159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2934754490852356, |
| "step": 825, |
| "valid_targets_mean": 4760.6, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 1.2462462462462462, |
| "grad_norm": 0.6920092254384417, |
| "learning_rate": 3.926954833713585e-05, |
| "loss": 0.3049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3148398697376251, |
| "step": 830, |
| "valid_targets_mean": 2882.6, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 1.2537537537537538, |
| "grad_norm": 0.49074537646024496, |
| "learning_rate": 3.924935880671334e-05, |
| "loss": 0.3005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2520464062690735, |
| "step": 835, |
| "valid_targets_mean": 5137.5, |
| "valid_targets_min": 1027 |
| }, |
| { |
| "epoch": 1.2612612612612613, |
| "grad_norm": 0.6626501857332863, |
| "learning_rate": 3.922889938331361e-05, |
| "loss": 0.3003, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38677817583084106, |
| "step": 840, |
| "valid_targets_mean": 3420.8, |
| "valid_targets_min": 627 |
| }, |
| { |
| "epoch": 1.2687687687687688, |
| "grad_norm": 0.5332552957049799, |
| "learning_rate": 3.920817035379581e-05, |
| "loss": 0.2804, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30235785245895386, |
| "step": 845, |
| "valid_targets_mean": 4300.7, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 1.2762762762762763, |
| "grad_norm": 0.5542167310126439, |
| "learning_rate": 3.9187172008799195e-05, |
| "loss": 0.3007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3331342339515686, |
| "step": 850, |
| "valid_targets_mean": 4431.8, |
| "valid_targets_min": 382 |
| }, |
| { |
| "epoch": 1.2837837837837838, |
| "grad_norm": 0.47602297520673265, |
| "learning_rate": 3.9165904642739085e-05, |
| "loss": 0.2825, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24128374457359314, |
| "step": 855, |
| "valid_targets_mean": 5224.0, |
| "valid_targets_min": 565 |
| }, |
| { |
| "epoch": 1.2912912912912913, |
| "grad_norm": 0.4907394738004159, |
| "learning_rate": 3.914436855380269e-05, |
| "loss": 0.2907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2902330458164215, |
| "step": 860, |
| "valid_targets_mean": 4872.4, |
| "valid_targets_min": 469 |
| }, |
| { |
| "epoch": 1.2987987987987988, |
| "grad_norm": 0.5780103792011559, |
| "learning_rate": 3.9122564043944956e-05, |
| "loss": 0.3022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.324124276638031, |
| "step": 865, |
| "valid_targets_mean": 4095.2, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 1.3063063063063063, |
| "grad_norm": 1.4238637814086352, |
| "learning_rate": 3.910049141888433e-05, |
| "loss": 0.3061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3050238788127899, |
| "step": 870, |
| "valid_targets_mean": 5166.2, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 1.3138138138138138, |
| "grad_norm": 0.49302688153022367, |
| "learning_rate": 3.907815098809849e-05, |
| "loss": 0.268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2744116187095642, |
| "step": 875, |
| "valid_targets_mean": 5715.9, |
| "valid_targets_min": 491 |
| }, |
| { |
| "epoch": 1.3213213213213213, |
| "grad_norm": 0.6362296442287568, |
| "learning_rate": 3.9055543064819945e-05, |
| "loss": 0.3095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28804486989974976, |
| "step": 880, |
| "valid_targets_mean": 3622.8, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 1.3288288288288288, |
| "grad_norm": 0.627623374325793, |
| "learning_rate": 3.9032667966031704e-05, |
| "loss": 0.2754, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3453376293182373, |
| "step": 885, |
| "valid_targets_mean": 3533.0, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 1.3363363363363363, |
| "grad_norm": 0.6493174026676456, |
| "learning_rate": 3.9009526012462834e-05, |
| "loss": 0.292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3329022228717804, |
| "step": 890, |
| "valid_targets_mean": 4443.5, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 1.3438438438438438, |
| "grad_norm": 0.5328791757099103, |
| "learning_rate": 3.89861175285839e-05, |
| "loss": 0.2754, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2938082218170166, |
| "step": 895, |
| "valid_targets_mean": 4643.6, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 1.3513513513513513, |
| "grad_norm": 0.5404971152718483, |
| "learning_rate": 3.89624428426025e-05, |
| "loss": 0.3149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3295516073703766, |
| "step": 900, |
| "valid_targets_mean": 5400.6, |
| "valid_targets_min": 431 |
| }, |
| { |
| "epoch": 1.3588588588588588, |
| "grad_norm": 0.5148482135727713, |
| "learning_rate": 3.8938502286458586e-05, |
| "loss": 0.2965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2672591209411621, |
| "step": 905, |
| "valid_targets_mean": 4434.6, |
| "valid_targets_min": 414 |
| }, |
| { |
| "epoch": 1.3663663663663663, |
| "grad_norm": 0.46940700753823117, |
| "learning_rate": 3.891429619581986e-05, |
| "loss": 0.2612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25686946511268616, |
| "step": 910, |
| "valid_targets_mean": 5001.9, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 1.3738738738738738, |
| "grad_norm": 0.5588622944159107, |
| "learning_rate": 3.888982491007705e-05, |
| "loss": 0.3063, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37934252619743347, |
| "step": 915, |
| "valid_targets_mean": 4426.3, |
| "valid_targets_min": 480 |
| }, |
| { |
| "epoch": 1.3813813813813813, |
| "grad_norm": 0.5032151155279457, |
| "learning_rate": 3.886508877233914e-05, |
| "loss": 0.3002, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24294015765190125, |
| "step": 920, |
| "valid_targets_mean": 4203.2, |
| "valid_targets_min": 537 |
| }, |
| { |
| "epoch": 1.3888888888888888, |
| "grad_norm": 0.6375386060346272, |
| "learning_rate": 3.8840088129428594e-05, |
| "loss": 0.2822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2843095660209656, |
| "step": 925, |
| "valid_targets_mean": 2762.1, |
| "valid_targets_min": 628 |
| }, |
| { |
| "epoch": 1.3963963963963963, |
| "grad_norm": 0.42954687639507877, |
| "learning_rate": 3.881482333187647e-05, |
| "loss": 0.2934, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24300193786621094, |
| "step": 930, |
| "valid_targets_mean": 6139.7, |
| "valid_targets_min": 1420 |
| }, |
| { |
| "epoch": 1.4039039039039038, |
| "grad_norm": 0.5288152668995841, |
| "learning_rate": 3.8789294733917486e-05, |
| "loss": 0.2809, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27250343561172485, |
| "step": 935, |
| "valid_targets_mean": 5227.9, |
| "valid_targets_min": 601 |
| }, |
| { |
| "epoch": 1.4114114114114114, |
| "grad_norm": 0.4018203487416013, |
| "learning_rate": 3.876350269348509e-05, |
| "loss": 0.2843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2769063115119934, |
| "step": 940, |
| "valid_targets_mean": 7001.6, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 1.4189189189189189, |
| "grad_norm": 0.4733738366398111, |
| "learning_rate": 3.873744757220642e-05, |
| "loss": 0.3156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2413673847913742, |
| "step": 945, |
| "valid_targets_mean": 5955.6, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 1.4264264264264264, |
| "grad_norm": 0.40178048986196624, |
| "learning_rate": 3.871112973539725e-05, |
| "loss": 0.2818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22361788153648376, |
| "step": 950, |
| "valid_targets_mean": 5932.0, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 1.4339339339339339, |
| "grad_norm": 0.5858661329948348, |
| "learning_rate": 3.868454955205685e-05, |
| "loss": 0.2967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26762083172798157, |
| "step": 955, |
| "valid_targets_mean": 4612.1, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 1.4414414414414414, |
| "grad_norm": 0.59370232296713, |
| "learning_rate": 3.86577073948628e-05, |
| "loss": 0.3087, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.245170459151268, |
| "step": 960, |
| "valid_targets_mean": 4544.8, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 1.4489489489489489, |
| "grad_norm": 0.5776834809155071, |
| "learning_rate": 3.8630603640165815e-05, |
| "loss": 0.2795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3211957812309265, |
| "step": 965, |
| "valid_targets_mean": 3560.0, |
| "valid_targets_min": 462 |
| }, |
| { |
| "epoch": 1.4564564564564564, |
| "grad_norm": 0.5619424459014478, |
| "learning_rate": 3.860323866798443e-05, |
| "loss": 0.2582, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21985271573066711, |
| "step": 970, |
| "valid_targets_mean": 4147.0, |
| "valid_targets_min": 964 |
| }, |
| { |
| "epoch": 1.4639639639639639, |
| "grad_norm": 0.5783533174246083, |
| "learning_rate": 3.857561286199968e-05, |
| "loss": 0.2969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29089707136154175, |
| "step": 975, |
| "valid_targets_mean": 3580.6, |
| "valid_targets_min": 489 |
| }, |
| { |
| "epoch": 1.4714714714714714, |
| "grad_norm": 0.4955776875207588, |
| "learning_rate": 3.85477266095497e-05, |
| "loss": 0.2825, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2684110999107361, |
| "step": 980, |
| "valid_targets_mean": 4121.5, |
| "valid_targets_min": 565 |
| }, |
| { |
| "epoch": 1.478978978978979, |
| "grad_norm": 0.5707278559095864, |
| "learning_rate": 3.851958030162433e-05, |
| "loss": 0.274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3071454167366028, |
| "step": 985, |
| "valid_targets_mean": 4583.5, |
| "valid_targets_min": 711 |
| }, |
| { |
| "epoch": 1.4864864864864864, |
| "grad_norm": 0.5349960494922307, |
| "learning_rate": 3.8491174332859625e-05, |
| "loss": 0.2644, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2876233160495758, |
| "step": 990, |
| "valid_targets_mean": 3913.2, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 1.493993993993994, |
| "grad_norm": 0.7242433186973595, |
| "learning_rate": 3.84625091015323e-05, |
| "loss": 0.2832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2717621624469757, |
| "step": 995, |
| "valid_targets_mean": 3196.1, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 1.5015015015015014, |
| "grad_norm": 0.559821205756259, |
| "learning_rate": 3.843358500955416e-05, |
| "loss": 0.277, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27973076701164246, |
| "step": 1000, |
| "valid_targets_mean": 3837.9, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 1.509009009009009, |
| "grad_norm": 0.5377924424199211, |
| "learning_rate": 3.840440246246648e-05, |
| "loss": 0.2818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2526509165763855, |
| "step": 1005, |
| "valid_targets_mean": 3364.9, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 1.5165165165165164, |
| "grad_norm": 0.6037241854694765, |
| "learning_rate": 3.837496186943428e-05, |
| "loss": 0.2838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3358380198478699, |
| "step": 1010, |
| "valid_targets_mean": 4278.9, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 1.524024024024024, |
| "grad_norm": 0.4711675437570829, |
| "learning_rate": 3.8345263643240634e-05, |
| "loss": 0.2535, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26968130469322205, |
| "step": 1015, |
| "valid_targets_mean": 5544.2, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 1.5315315315315314, |
| "grad_norm": 0.5958428128963504, |
| "learning_rate": 3.831530820028084e-05, |
| "loss": 0.3192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32176512479782104, |
| "step": 1020, |
| "valid_targets_mean": 3855.1, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 1.539039039039039, |
| "grad_norm": 0.4865056298850766, |
| "learning_rate": 3.828509596055662e-05, |
| "loss": 0.2712, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2525503635406494, |
| "step": 1025, |
| "valid_targets_mean": 6991.5, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 1.5465465465465464, |
| "grad_norm": 0.5566299314673824, |
| "learning_rate": 3.82546273476702e-05, |
| "loss": 0.3577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2959470748901367, |
| "step": 1030, |
| "valid_targets_mean": 4056.7, |
| "valid_targets_min": 528 |
| }, |
| { |
| "epoch": 1.554054054054054, |
| "grad_norm": 0.6266122143638768, |
| "learning_rate": 3.822390278881839e-05, |
| "loss": 0.2924, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31994956731796265, |
| "step": 1035, |
| "valid_targets_mean": 3313.5, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 1.5615615615615615, |
| "grad_norm": 0.5379754675133966, |
| "learning_rate": 3.819292271478659e-05, |
| "loss": 0.2853, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26793667674064636, |
| "step": 1040, |
| "valid_targets_mean": 3280.4, |
| "valid_targets_min": 540 |
| }, |
| { |
| "epoch": 1.569069069069069, |
| "grad_norm": 0.42701565978810035, |
| "learning_rate": 3.816168755994274e-05, |
| "loss": 0.2752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21840263903141022, |
| "step": 1045, |
| "valid_targets_mean": 4529.6, |
| "valid_targets_min": 904 |
| }, |
| { |
| "epoch": 1.5765765765765765, |
| "grad_norm": 0.5000336725002723, |
| "learning_rate": 3.813019776223124e-05, |
| "loss": 0.286, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2662447690963745, |
| "step": 1050, |
| "valid_targets_mean": 4867.2, |
| "valid_targets_min": 988 |
| }, |
| { |
| "epoch": 1.584084084084084, |
| "grad_norm": 0.5648658240320987, |
| "learning_rate": 3.809845376316681e-05, |
| "loss": 0.3156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29331260919570923, |
| "step": 1055, |
| "valid_targets_mean": 4341.2, |
| "valid_targets_min": 328 |
| }, |
| { |
| "epoch": 1.5915915915915915, |
| "grad_norm": 0.5284383529439995, |
| "learning_rate": 3.8066456007828304e-05, |
| "loss": 0.2835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23197105526924133, |
| "step": 1060, |
| "valid_targets_mean": 3968.8, |
| "valid_targets_min": 389 |
| }, |
| { |
| "epoch": 1.599099099099099, |
| "grad_norm": 0.5216262376393843, |
| "learning_rate": 3.803420494485244e-05, |
| "loss": 0.273, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2597469687461853, |
| "step": 1065, |
| "valid_targets_mean": 4115.9, |
| "valid_targets_min": 579 |
| }, |
| { |
| "epoch": 1.6066066066066065, |
| "grad_norm": 0.4939695307516829, |
| "learning_rate": 3.800170102642757e-05, |
| "loss": 0.2835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23144802451133728, |
| "step": 1070, |
| "valid_targets_mean": 3866.6, |
| "valid_targets_min": 486 |
| }, |
| { |
| "epoch": 1.614114114114114, |
| "grad_norm": 0.5829421644769698, |
| "learning_rate": 3.796894470828726e-05, |
| "loss": 0.267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.222642183303833, |
| "step": 1075, |
| "valid_targets_mean": 4570.8, |
| "valid_targets_min": 844 |
| }, |
| { |
| "epoch": 1.6216216216216215, |
| "grad_norm": 0.5335734411442947, |
| "learning_rate": 3.793593644970397e-05, |
| "loss": 0.2881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2972537577152252, |
| "step": 1080, |
| "valid_targets_mean": 4192.4, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 1.629129129129129, |
| "grad_norm": 0.7509523435082093, |
| "learning_rate": 3.7902676713482584e-05, |
| "loss": 0.2991, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3354663848876953, |
| "step": 1085, |
| "valid_targets_mean": 3534.2, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 1.6366366366366365, |
| "grad_norm": 0.45680598867761874, |
| "learning_rate": 3.786916596595391e-05, |
| "loss": 0.2835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2275020182132721, |
| "step": 1090, |
| "valid_targets_mean": 4664.6, |
| "valid_targets_min": 768 |
| }, |
| { |
| "epoch": 1.644144144144144, |
| "grad_norm": 0.614422278972368, |
| "learning_rate": 3.783540467696817e-05, |
| "loss": 0.2845, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28407660126686096, |
| "step": 1095, |
| "valid_targets_mean": 3863.8, |
| "valid_targets_min": 409 |
| }, |
| { |
| "epoch": 1.6516516516516515, |
| "grad_norm": 0.5074836388259119, |
| "learning_rate": 3.78013933198884e-05, |
| "loss": 0.2611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23754659295082092, |
| "step": 1100, |
| "valid_targets_mean": 3914.6, |
| "valid_targets_min": 1027 |
| }, |
| { |
| "epoch": 1.659159159159159, |
| "grad_norm": 0.45212979425084815, |
| "learning_rate": 3.776713237158379e-05, |
| "loss": 0.2728, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2909110188484192, |
| "step": 1105, |
| "valid_targets_mean": 5534.1, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 1.6666666666666665, |
| "grad_norm": 0.6316240705989837, |
| "learning_rate": 3.773262231242305e-05, |
| "loss": 0.3053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2717238664627075, |
| "step": 1110, |
| "valid_targets_mean": 3312.1, |
| "valid_targets_min": 367 |
| }, |
| { |
| "epoch": 1.674174174174174, |
| "grad_norm": 0.5332254751800973, |
| "learning_rate": 3.7697863626267615e-05, |
| "loss": 0.3138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2853066623210907, |
| "step": 1115, |
| "valid_targets_mean": 3955.4, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 1.6816816816816815, |
| "grad_norm": 0.6436721167931566, |
| "learning_rate": 3.7662856800464907e-05, |
| "loss": 0.2876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33219900727272034, |
| "step": 1120, |
| "valid_targets_mean": 4150.2, |
| "valid_targets_min": 402 |
| }, |
| { |
| "epoch": 1.689189189189189, |
| "grad_norm": 0.41517090061996553, |
| "learning_rate": 3.762760232584148e-05, |
| "loss": 0.2544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2333643138408661, |
| "step": 1125, |
| "valid_targets_mean": 5115.1, |
| "valid_targets_min": 841 |
| }, |
| { |
| "epoch": 1.6966966966966965, |
| "grad_norm": 0.5176992190887993, |
| "learning_rate": 3.7592100696696134e-05, |
| "loss": 0.2732, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2570965886116028, |
| "step": 1130, |
| "valid_targets_mean": 3668.6, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 1.704204204204204, |
| "grad_norm": 0.511279913702578, |
| "learning_rate": 3.755635241079301e-05, |
| "loss": 0.2719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22817838191986084, |
| "step": 1135, |
| "valid_targets_mean": 3872.6, |
| "valid_targets_min": 475 |
| }, |
| { |
| "epoch": 1.7117117117117115, |
| "grad_norm": 0.6164706177166612, |
| "learning_rate": 3.7520357969354584e-05, |
| "loss": 0.2907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3176250457763672, |
| "step": 1140, |
| "valid_targets_mean": 3526.4, |
| "valid_targets_min": 693 |
| }, |
| { |
| "epoch": 1.7192192192192193, |
| "grad_norm": 0.4109077325218178, |
| "learning_rate": 3.748411787705466e-05, |
| "loss": 0.3218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2506415843963623, |
| "step": 1145, |
| "valid_targets_mean": 5783.5, |
| "valid_targets_min": 524 |
| }, |
| { |
| "epoch": 1.7267267267267268, |
| "grad_norm": 0.47340788265525957, |
| "learning_rate": 3.744763264201125e-05, |
| "loss": 0.259, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28487300872802734, |
| "step": 1150, |
| "valid_targets_mean": 5147.9, |
| "valid_targets_min": 311 |
| }, |
| { |
| "epoch": 1.7342342342342343, |
| "grad_norm": 0.6361764376110007, |
| "learning_rate": 3.741090277577953e-05, |
| "loss": 0.2747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33571434020996094, |
| "step": 1155, |
| "valid_targets_mean": 3613.9, |
| "valid_targets_min": 633 |
| }, |
| { |
| "epoch": 1.7417417417417418, |
| "grad_norm": 0.7263029802880552, |
| "learning_rate": 3.73739287933446e-05, |
| "loss": 0.3013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30988189578056335, |
| "step": 1160, |
| "valid_targets_mean": 2780.0, |
| "valid_targets_min": 388 |
| }, |
| { |
| "epoch": 1.7492492492492493, |
| "grad_norm": 0.5312249305901402, |
| "learning_rate": 3.733671121311426e-05, |
| "loss": 0.2691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25757136940956116, |
| "step": 1165, |
| "valid_targets_mean": 4026.9, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 1.7567567567567568, |
| "grad_norm": 0.5476708426420898, |
| "learning_rate": 3.729925055691182e-05, |
| "loss": 0.2875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30963361263275146, |
| "step": 1170, |
| "valid_targets_mean": 4677.7, |
| "valid_targets_min": 434 |
| }, |
| { |
| "epoch": 1.7642642642642643, |
| "grad_norm": 0.613322007834183, |
| "learning_rate": 3.7261547349968675e-05, |
| "loss": 0.2902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34018972516059875, |
| "step": 1175, |
| "valid_targets_mean": 3271.2, |
| "valid_targets_min": 407 |
| }, |
| { |
| "epoch": 1.7717717717717718, |
| "grad_norm": 0.6162258596946204, |
| "learning_rate": 3.722360212091703e-05, |
| "loss": 0.3093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32241833209991455, |
| "step": 1180, |
| "valid_targets_mean": 3718.6, |
| "valid_targets_min": 466 |
| }, |
| { |
| "epoch": 1.7792792792792793, |
| "grad_norm": 0.664703409023323, |
| "learning_rate": 3.7185415401782434e-05, |
| "loss": 0.2791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33108675479888916, |
| "step": 1185, |
| "valid_targets_mean": 5692.8, |
| "valid_targets_min": 702 |
| }, |
| { |
| "epoch": 1.7867867867867868, |
| "grad_norm": 0.5138638922358946, |
| "learning_rate": 3.7146987727976354e-05, |
| "loss": 0.2819, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30338913202285767, |
| "step": 1190, |
| "valid_targets_mean": 5333.4, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 1.7942942942942943, |
| "grad_norm": 0.4986654846084407, |
| "learning_rate": 3.7108319638288654e-05, |
| "loss": 0.2899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2863334119319916, |
| "step": 1195, |
| "valid_targets_mean": 4185.2, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 1.8018018018018018, |
| "grad_norm": 0.514824462976426, |
| "learning_rate": 3.706941167488002e-05, |
| "loss": 0.305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3966107666492462, |
| "step": 1200, |
| "valid_targets_mean": 4997.3, |
| "valid_targets_min": 583 |
| }, |
| { |
| "epoch": 1.8093093093093093, |
| "grad_norm": 0.5002026479937768, |
| "learning_rate": 3.70302643832744e-05, |
| "loss": 0.3046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3028540015220642, |
| "step": 1205, |
| "valid_targets_mean": 4384.4, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 1.8168168168168168, |
| "grad_norm": 0.5733662063497278, |
| "learning_rate": 3.699087831235133e-05, |
| "loss": 0.271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28234004974365234, |
| "step": 1210, |
| "valid_targets_mean": 3882.9, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 1.8243243243243243, |
| "grad_norm": 0.49934816295444895, |
| "learning_rate": 3.6951254014338236e-05, |
| "loss": 0.2656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27083009481430054, |
| "step": 1215, |
| "valid_targets_mean": 4725.4, |
| "valid_targets_min": 497 |
| }, |
| { |
| "epoch": 1.8318318318318318, |
| "grad_norm": 0.732103811366184, |
| "learning_rate": 3.69113920448027e-05, |
| "loss": 0.2718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3054293394088745, |
| "step": 1220, |
| "valid_targets_mean": 2746.9, |
| "valid_targets_min": 478 |
| }, |
| { |
| "epoch": 1.8393393393393394, |
| "grad_norm": 0.6337417424539031, |
| "learning_rate": 3.687129296264468e-05, |
| "loss": 0.2591, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26185324788093567, |
| "step": 1225, |
| "valid_targets_mean": 4788.4, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 1.8468468468468469, |
| "grad_norm": 0.5621683788362308, |
| "learning_rate": 3.683095733008864e-05, |
| "loss": 0.2693, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2606724202632904, |
| "step": 1230, |
| "valid_targets_mean": 3237.6, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 1.8543543543543544, |
| "grad_norm": 0.5288214426455534, |
| "learning_rate": 3.6790385712675705e-05, |
| "loss": 0.2837, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3149155378341675, |
| "step": 1235, |
| "valid_targets_mean": 3973.2, |
| "valid_targets_min": 572 |
| }, |
| { |
| "epoch": 1.8618618618618619, |
| "grad_norm": 0.4813442560130786, |
| "learning_rate": 3.6749578679255715e-05, |
| "loss": 0.2996, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2811282277107239, |
| "step": 1240, |
| "valid_targets_mean": 5313.8, |
| "valid_targets_min": 420 |
| }, |
| { |
| "epoch": 1.8693693693693694, |
| "grad_norm": 0.6170835431330234, |
| "learning_rate": 3.6708536801979246e-05, |
| "loss": 0.2905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32795318961143494, |
| "step": 1245, |
| "valid_targets_mean": 3692.1, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 1.8768768768768769, |
| "grad_norm": 0.5375710532679772, |
| "learning_rate": 3.666726065628959e-05, |
| "loss": 0.2688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23410853743553162, |
| "step": 1250, |
| "valid_targets_mean": 3626.6, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 1.8843843843843844, |
| "grad_norm": 0.5400535513286914, |
| "learning_rate": 3.6625750820914694e-05, |
| "loss": 0.2569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3105897903442383, |
| "step": 1255, |
| "valid_targets_mean": 3530.0, |
| "valid_targets_min": 400 |
| }, |
| { |
| "epoch": 1.8918918918918919, |
| "grad_norm": 0.7192704328062035, |
| "learning_rate": 3.658400787785903e-05, |
| "loss": 0.2711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31259477138519287, |
| "step": 1260, |
| "valid_targets_mean": 2492.8, |
| "valid_targets_min": 367 |
| }, |
| { |
| "epoch": 1.8993993993993994, |
| "grad_norm": 0.5689420833987145, |
| "learning_rate": 3.654203241239546e-05, |
| "loss": 0.2752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2669737935066223, |
| "step": 1265, |
| "valid_targets_mean": 5125.1, |
| "valid_targets_min": 766 |
| }, |
| { |
| "epoch": 1.906906906906907, |
| "grad_norm": 0.6991606704570577, |
| "learning_rate": 3.649982501305701e-05, |
| "loss": 0.2681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3605828285217285, |
| "step": 1270, |
| "valid_targets_mean": 2681.3, |
| "valid_targets_min": 603 |
| }, |
| { |
| "epoch": 1.9144144144144144, |
| "grad_norm": 0.5136360235806671, |
| "learning_rate": 3.6457386271628615e-05, |
| "loss": 0.2815, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2559846043586731, |
| "step": 1275, |
| "valid_targets_mean": 4230.4, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 1.921921921921922, |
| "grad_norm": 0.5755425636039267, |
| "learning_rate": 3.641471678313883e-05, |
| "loss": 0.2629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32143378257751465, |
| "step": 1280, |
| "valid_targets_mean": 4531.5, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 1.9294294294294294, |
| "grad_norm": 0.5172980766220905, |
| "learning_rate": 3.6371817145851514e-05, |
| "loss": 0.2902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3124349117279053, |
| "step": 1285, |
| "valid_targets_mean": 5154.6, |
| "valid_targets_min": 690 |
| }, |
| { |
| "epoch": 1.936936936936937, |
| "grad_norm": 0.5579160547269432, |
| "learning_rate": 3.6328687961257374e-05, |
| "loss": 0.2863, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23261310160160065, |
| "step": 1290, |
| "valid_targets_mean": 3315.2, |
| "valid_targets_min": 432 |
| }, |
| { |
| "epoch": 1.9444444444444444, |
| "grad_norm": 0.471485760499144, |
| "learning_rate": 3.62853298340656e-05, |
| "loss": 0.2875, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23489312827587128, |
| "step": 1295, |
| "valid_targets_mean": 4736.7, |
| "valid_targets_min": 689 |
| }, |
| { |
| "epoch": 1.951951951951952, |
| "grad_norm": 0.45892772148849675, |
| "learning_rate": 3.624174337219536e-05, |
| "loss": 0.2919, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23488348722457886, |
| "step": 1300, |
| "valid_targets_mean": 4925.0, |
| "valid_targets_min": 602 |
| }, |
| { |
| "epoch": 1.9594594594594594, |
| "grad_norm": 0.6569352257148999, |
| "learning_rate": 3.6197929186767255e-05, |
| "loss": 0.2827, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26401716470718384, |
| "step": 1305, |
| "valid_targets_mean": 3648.6, |
| "valid_targets_min": 358 |
| }, |
| { |
| "epoch": 1.966966966966967, |
| "grad_norm": 0.47233655136122743, |
| "learning_rate": 3.6153887892094786e-05, |
| "loss": 0.292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2689140737056732, |
| "step": 1310, |
| "valid_targets_mean": 4251.4, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 1.9744744744744744, |
| "grad_norm": 0.4937344312534394, |
| "learning_rate": 3.6109620105675734e-05, |
| "loss": 0.2502, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2564142346382141, |
| "step": 1315, |
| "valid_targets_mean": 4050.1, |
| "valid_targets_min": 846 |
| }, |
| { |
| "epoch": 1.981981981981982, |
| "grad_norm": 0.5040985465764987, |
| "learning_rate": 3.606512644818347e-05, |
| "loss": 0.2959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27598607540130615, |
| "step": 1320, |
| "valid_targets_mean": 5606.7, |
| "valid_targets_min": 561 |
| }, |
| { |
| "epoch": 1.9894894894894894, |
| "grad_norm": 0.503656514625708, |
| "learning_rate": 3.6020407543458295e-05, |
| "loss": 0.2656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24646782875061035, |
| "step": 1325, |
| "valid_targets_mean": 4084.1, |
| "valid_targets_min": 542 |
| }, |
| { |
| "epoch": 1.996996996996997, |
| "grad_norm": 0.48663621599509704, |
| "learning_rate": 3.597546401849866e-05, |
| "loss": 0.2877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3501949608325958, |
| "step": 1330, |
| "valid_targets_mean": 6161.8, |
| "valid_targets_min": 829 |
| }, |
| { |
| "epoch": 2.0045045045045047, |
| "grad_norm": 0.4886145150612323, |
| "learning_rate": 3.593029650345242e-05, |
| "loss": 0.248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2267410159111023, |
| "step": 1335, |
| "valid_targets_mean": 4201.8, |
| "valid_targets_min": 585 |
| }, |
| { |
| "epoch": 2.012012012012012, |
| "grad_norm": 0.918223183885553, |
| "learning_rate": 3.588490563160793e-05, |
| "loss": 0.263, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20230059325695038, |
| "step": 1340, |
| "valid_targets_mean": 3759.8, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 2.0195195195195197, |
| "grad_norm": 0.41635246230968925, |
| "learning_rate": 3.583929203938523e-05, |
| "loss": 0.2647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20971567928791046, |
| "step": 1345, |
| "valid_targets_mean": 6513.2, |
| "valid_targets_min": 506 |
| }, |
| { |
| "epoch": 2.027027027027027, |
| "grad_norm": 0.5324224076323132, |
| "learning_rate": 3.5793456366327074e-05, |
| "loss": 0.2579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2577601969242096, |
| "step": 1350, |
| "valid_targets_mean": 4199.0, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 2.0345345345345347, |
| "grad_norm": 0.666399334701293, |
| "learning_rate": 3.5747399255090016e-05, |
| "loss": 0.2532, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25944650173187256, |
| "step": 1355, |
| "valid_targets_mean": 3050.4, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 2.042042042042042, |
| "grad_norm": 0.5560230204936001, |
| "learning_rate": 3.5701121351435346e-05, |
| "loss": 0.2565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30907580256462097, |
| "step": 1360, |
| "valid_targets_mean": 4342.1, |
| "valid_targets_min": 483 |
| }, |
| { |
| "epoch": 2.0495495495495497, |
| "grad_norm": 0.5093455715924559, |
| "learning_rate": 3.565462330422006e-05, |
| "loss": 0.2366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23613181710243225, |
| "step": 1365, |
| "valid_targets_mean": 4160.1, |
| "valid_targets_min": 624 |
| }, |
| { |
| "epoch": 2.057057057057057, |
| "grad_norm": 0.5143252526017971, |
| "learning_rate": 3.560790576538777e-05, |
| "loss": 0.2441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28200429677963257, |
| "step": 1370, |
| "valid_targets_mean": 5243.5, |
| "valid_targets_min": 529 |
| }, |
| { |
| "epoch": 2.0645645645645647, |
| "grad_norm": 0.6420496487933931, |
| "learning_rate": 3.556096938995953e-05, |
| "loss": 0.2644, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3083629906177521, |
| "step": 1375, |
| "valid_targets_mean": 3444.8, |
| "valid_targets_min": 474 |
| }, |
| { |
| "epoch": 2.0720720720720722, |
| "grad_norm": 0.6041025909633767, |
| "learning_rate": 3.551381483602472e-05, |
| "loss": 0.3043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34277862310409546, |
| "step": 1380, |
| "valid_targets_mean": 5168.2, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 2.0795795795795797, |
| "grad_norm": 0.5065151180208464, |
| "learning_rate": 3.546644276473174e-05, |
| "loss": 0.2703, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22405189275741577, |
| "step": 1385, |
| "valid_targets_mean": 4451.1, |
| "valid_targets_min": 653 |
| }, |
| { |
| "epoch": 2.0870870870870872, |
| "grad_norm": 0.4653600091882295, |
| "learning_rate": 3.541885384027877e-05, |
| "loss": 0.2867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23494037985801697, |
| "step": 1390, |
| "valid_targets_mean": 4773.1, |
| "valid_targets_min": 515 |
| }, |
| { |
| "epoch": 2.0945945945945947, |
| "grad_norm": 0.4737552542155004, |
| "learning_rate": 3.53710487299045e-05, |
| "loss": 0.2301, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20185862481594086, |
| "step": 1395, |
| "valid_targets_mean": 4372.3, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 2.1021021021021022, |
| "grad_norm": 0.618244462622168, |
| "learning_rate": 3.5323028103878695e-05, |
| "loss": 0.2647, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28137439489364624, |
| "step": 1400, |
| "valid_targets_mean": 3066.6, |
| "valid_targets_min": 558 |
| }, |
| { |
| "epoch": 2.1096096096096097, |
| "grad_norm": 0.6276854706539091, |
| "learning_rate": 3.527479263549287e-05, |
| "loss": 0.2567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24222517013549805, |
| "step": 1405, |
| "valid_targets_mean": 3623.4, |
| "valid_targets_min": 562 |
| }, |
| { |
| "epoch": 2.1171171171171173, |
| "grad_norm": 0.5119888962756797, |
| "learning_rate": 3.52263430010508e-05, |
| "loss": 0.2456, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24120667576789856, |
| "step": 1410, |
| "valid_targets_mean": 4184.2, |
| "valid_targets_min": 571 |
| }, |
| { |
| "epoch": 2.1246246246246248, |
| "grad_norm": 0.40193152670779986, |
| "learning_rate": 3.517767987985906e-05, |
| "loss": 0.2543, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21013514697551727, |
| "step": 1415, |
| "valid_targets_mean": 7112.9, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 2.1321321321321323, |
| "grad_norm": 0.6042469303834141, |
| "learning_rate": 3.5128803954217516e-05, |
| "loss": 0.245, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24615558981895447, |
| "step": 1420, |
| "valid_targets_mean": 3546.8, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 2.1396396396396398, |
| "grad_norm": 0.517598650535331, |
| "learning_rate": 3.507971590940972e-05, |
| "loss": 0.2361, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2518162727355957, |
| "step": 1425, |
| "valid_targets_mean": 4095.2, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 2.1471471471471473, |
| "grad_norm": 0.5314103976572915, |
| "learning_rate": 3.503041643369332e-05, |
| "loss": 0.2657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29391518235206604, |
| "step": 1430, |
| "valid_targets_mean": 4662.9, |
| "valid_targets_min": 673 |
| }, |
| { |
| "epoch": 2.1546546546546548, |
| "grad_norm": 0.7994874645886633, |
| "learning_rate": 3.4980906218290425e-05, |
| "loss": 0.2778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24668291211128235, |
| "step": 1435, |
| "valid_targets_mean": 4393.5, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 2.1621621621621623, |
| "grad_norm": 0.5508650913511237, |
| "learning_rate": 3.493118595737789e-05, |
| "loss": 0.2655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26784124970436096, |
| "step": 1440, |
| "valid_targets_mean": 3928.2, |
| "valid_targets_min": 482 |
| }, |
| { |
| "epoch": 2.16966966966967, |
| "grad_norm": 0.48256368285307105, |
| "learning_rate": 3.4881256348077606e-05, |
| "loss": 0.2493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2078143209218979, |
| "step": 1445, |
| "valid_targets_mean": 4895.9, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 2.1771771771771773, |
| "grad_norm": 0.5518092824723564, |
| "learning_rate": 3.4831118090446695e-05, |
| "loss": 0.2614, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27934592962265015, |
| "step": 1450, |
| "valid_targets_mean": 4175.9, |
| "valid_targets_min": 557 |
| }, |
| { |
| "epoch": 2.184684684684685, |
| "grad_norm": 0.6510442042007786, |
| "learning_rate": 3.478077188746774e-05, |
| "loss": 0.2825, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25130707025527954, |
| "step": 1455, |
| "valid_targets_mean": 2940.2, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 2.1921921921921923, |
| "grad_norm": 0.6653821572090174, |
| "learning_rate": 3.473021844503885e-05, |
| "loss": 0.2915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29144030809402466, |
| "step": 1460, |
| "valid_targets_mean": 3176.5, |
| "valid_targets_min": 466 |
| }, |
| { |
| "epoch": 2.1996996996997, |
| "grad_norm": 0.5835363387672817, |
| "learning_rate": 3.4679458471963876e-05, |
| "loss": 0.2609, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2668296694755554, |
| "step": 1465, |
| "valid_targets_mean": 3661.9, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 2.2072072072072073, |
| "grad_norm": 0.473510630048058, |
| "learning_rate": 3.462849267994237e-05, |
| "loss": 0.2391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2349366545677185, |
| "step": 1470, |
| "valid_targets_mean": 4610.1, |
| "valid_targets_min": 583 |
| }, |
| { |
| "epoch": 2.214714714714715, |
| "grad_norm": 0.5034796149297331, |
| "learning_rate": 3.457732178355966e-05, |
| "loss": 0.2786, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22843249142169952, |
| "step": 1475, |
| "valid_targets_mean": 4560.3, |
| "valid_targets_min": 870 |
| }, |
| { |
| "epoch": 2.2222222222222223, |
| "grad_norm": 0.6628701647407635, |
| "learning_rate": 3.4525946500276815e-05, |
| "loss": 0.2524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33600878715515137, |
| "step": 1480, |
| "valid_targets_mean": 4715.0, |
| "valid_targets_min": 409 |
| }, |
| { |
| "epoch": 2.22972972972973, |
| "grad_norm": 0.4438069409661387, |
| "learning_rate": 3.447436755042059e-05, |
| "loss": 0.2579, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23582454025745392, |
| "step": 1485, |
| "valid_targets_mean": 6454.2, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 2.2372372372372373, |
| "grad_norm": 0.5589297614395898, |
| "learning_rate": 3.442258565717333e-05, |
| "loss": 0.2906, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3400152325630188, |
| "step": 1490, |
| "valid_targets_mean": 5422.4, |
| "valid_targets_min": 928 |
| }, |
| { |
| "epoch": 2.244744744744745, |
| "grad_norm": 0.5331121771902878, |
| "learning_rate": 3.437060154656281e-05, |
| "loss": 0.2911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31767523288726807, |
| "step": 1495, |
| "valid_targets_mean": 4458.2, |
| "valid_targets_min": 291 |
| }, |
| { |
| "epoch": 2.2522522522522523, |
| "grad_norm": 0.40712934057436334, |
| "learning_rate": 3.4318415947452085e-05, |
| "loss": 0.252, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28288692235946655, |
| "step": 1500, |
| "valid_targets_mean": 6532.0, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 2.25975975975976, |
| "grad_norm": 0.45673386040732317, |
| "learning_rate": 3.4266029591529246e-05, |
| "loss": 0.2864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2521343529224396, |
| "step": 1505, |
| "valid_targets_mean": 5607.8, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 2.2672672672672673, |
| "grad_norm": 0.6013211253935284, |
| "learning_rate": 3.421344321329719e-05, |
| "loss": 0.2529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28024786710739136, |
| "step": 1510, |
| "valid_targets_mean": 3546.8, |
| "valid_targets_min": 515 |
| }, |
| { |
| "epoch": 2.274774774774775, |
| "grad_norm": 0.9210774515682121, |
| "learning_rate": 3.4160657550063286e-05, |
| "loss": 0.262, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2434246838092804, |
| "step": 1515, |
| "valid_targets_mean": 3957.6, |
| "valid_targets_min": 444 |
| }, |
| { |
| "epoch": 2.2822822822822824, |
| "grad_norm": 0.5034622925230656, |
| "learning_rate": 3.410767334192905e-05, |
| "loss": 0.2519, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2538553476333618, |
| "step": 1520, |
| "valid_targets_mean": 4692.2, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 2.28978978978979, |
| "grad_norm": 0.6140827528489169, |
| "learning_rate": 3.40544913317798e-05, |
| "loss": 0.2476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2580946087837219, |
| "step": 1525, |
| "valid_targets_mean": 3429.3, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 2.2972972972972974, |
| "grad_norm": 0.4522744249612033, |
| "learning_rate": 3.400111226527417e-05, |
| "loss": 0.2326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22649413347244263, |
| "step": 1530, |
| "valid_targets_mean": 5068.2, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 2.304804804804805, |
| "grad_norm": 0.49640935192095975, |
| "learning_rate": 3.3947536890833744e-05, |
| "loss": 0.2507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2515903115272522, |
| "step": 1535, |
| "valid_targets_mean": 4226.1, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 2.3123123123123124, |
| "grad_norm": 1.016722378855143, |
| "learning_rate": 3.389376595963248e-05, |
| "loss": 0.2882, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40263426303863525, |
| "step": 1540, |
| "valid_targets_mean": 3808.3, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 2.31981981981982, |
| "grad_norm": 0.520047683970159, |
| "learning_rate": 3.3839800225586233e-05, |
| "loss": 0.2725, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24709469079971313, |
| "step": 1545, |
| "valid_targets_mean": 4321.6, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 2.3273273273273274, |
| "grad_norm": 0.4955591390887456, |
| "learning_rate": 3.378564044534216e-05, |
| "loss": 0.2218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24357634782791138, |
| "step": 1550, |
| "valid_targets_mean": 4470.6, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 2.334834834834835, |
| "grad_norm": 0.5304638752162832, |
| "learning_rate": 3.373128737826812e-05, |
| "loss": 0.2625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27869170904159546, |
| "step": 1555, |
| "valid_targets_mean": 3793.8, |
| "valid_targets_min": 252 |
| }, |
| { |
| "epoch": 2.3423423423423424, |
| "grad_norm": 0.6052044405674071, |
| "learning_rate": 3.367674178644201e-05, |
| "loss": 0.2578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2955855429172516, |
| "step": 1560, |
| "valid_targets_mean": 3434.8, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 2.34984984984985, |
| "grad_norm": 0.45641925043102494, |
| "learning_rate": 3.362200443464112e-05, |
| "loss": 0.2572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25648972392082214, |
| "step": 1565, |
| "valid_targets_mean": 5664.2, |
| "valid_targets_min": 487 |
| }, |
| { |
| "epoch": 2.3573573573573574, |
| "grad_norm": 0.4104470454624804, |
| "learning_rate": 3.356707609033136e-05, |
| "loss": 0.2382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1871146857738495, |
| "step": 1570, |
| "valid_targets_mean": 5469.4, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 2.364864864864865, |
| "grad_norm": 0.5305663319530391, |
| "learning_rate": 3.351195752365654e-05, |
| "loss": 0.2546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20778313279151917, |
| "step": 1575, |
| "valid_targets_mean": 3653.4, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 2.3723723723723724, |
| "grad_norm": 0.952177731638365, |
| "learning_rate": 3.3456649507427537e-05, |
| "loss": 0.2785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30603039264678955, |
| "step": 1580, |
| "valid_targets_mean": 3391.8, |
| "valid_targets_min": 541 |
| }, |
| { |
| "epoch": 2.37987987987988, |
| "grad_norm": 0.625558644174225, |
| "learning_rate": 3.340115281711149e-05, |
| "loss": 0.2578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2915250360965729, |
| "step": 1585, |
| "valid_targets_mean": 3354.9, |
| "valid_targets_min": 376 |
| }, |
| { |
| "epoch": 2.3873873873873874, |
| "grad_norm": 0.4383965531441897, |
| "learning_rate": 3.3345468230820924e-05, |
| "loss": 0.2545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20519056916236877, |
| "step": 1590, |
| "valid_targets_mean": 5249.9, |
| "valid_targets_min": 576 |
| }, |
| { |
| "epoch": 2.394894894894895, |
| "grad_norm": 0.7263449171228276, |
| "learning_rate": 3.32895965293028e-05, |
| "loss": 0.2629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24948550760746002, |
| "step": 1595, |
| "valid_targets_mean": 3813.8, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 2.4024024024024024, |
| "grad_norm": 0.7704936140888641, |
| "learning_rate": 3.323353849592764e-05, |
| "loss": 0.27, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3838420808315277, |
| "step": 1600, |
| "valid_targets_mean": 4764.8, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 2.40990990990991, |
| "grad_norm": 0.5262208670623167, |
| "learning_rate": 3.317729491667848e-05, |
| "loss": 0.2854, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26990848779678345, |
| "step": 1605, |
| "valid_targets_mean": 4314.4, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 2.4174174174174174, |
| "grad_norm": 0.4905094743952616, |
| "learning_rate": 3.3120866580139856e-05, |
| "loss": 0.2678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24697014689445496, |
| "step": 1610, |
| "valid_targets_mean": 5779.1, |
| "valid_targets_min": 863 |
| }, |
| { |
| "epoch": 2.424924924924925, |
| "grad_norm": 0.5795672522700869, |
| "learning_rate": 3.306425427748681e-05, |
| "loss": 0.2753, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3122454881668091, |
| "step": 1615, |
| "valid_targets_mean": 4678.4, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 2.4324324324324325, |
| "grad_norm": 0.5127623781647497, |
| "learning_rate": 3.3007458802473705e-05, |
| "loss": 0.2418, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2780628502368927, |
| "step": 1620, |
| "valid_targets_mean": 5270.1, |
| "valid_targets_min": 408 |
| }, |
| { |
| "epoch": 2.43993993993994, |
| "grad_norm": 0.6000042814068866, |
| "learning_rate": 3.2950480951423166e-05, |
| "loss": 0.2492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26539573073387146, |
| "step": 1625, |
| "valid_targets_mean": 2969.9, |
| "valid_targets_min": 292 |
| }, |
| { |
| "epoch": 2.4474474474474475, |
| "grad_norm": 0.5601820602459276, |
| "learning_rate": 3.289332152321489e-05, |
| "loss": 0.2744, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34554967284202576, |
| "step": 1630, |
| "valid_targets_mean": 4328.4, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 2.454954954954955, |
| "grad_norm": 0.5017335839364364, |
| "learning_rate": 3.2835981319274436e-05, |
| "loss": 0.3016, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31424376368522644, |
| "step": 1635, |
| "valid_targets_mean": 4981.0, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 2.4624624624624625, |
| "grad_norm": 0.5989444157971933, |
| "learning_rate": 3.277846114356201e-05, |
| "loss": 0.2812, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29167452454566956, |
| "step": 1640, |
| "valid_targets_mean": 4280.9, |
| "valid_targets_min": 583 |
| }, |
| { |
| "epoch": 2.46996996996997, |
| "grad_norm": 0.4818252524686284, |
| "learning_rate": 3.272076180256117e-05, |
| "loss": 0.2503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2451312243938446, |
| "step": 1645, |
| "valid_targets_mean": 5266.5, |
| "valid_targets_min": 456 |
| }, |
| { |
| "epoch": 2.4774774774774775, |
| "grad_norm": 0.5474083922971454, |
| "learning_rate": 3.2662884105267545e-05, |
| "loss": 0.2802, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28529974818229675, |
| "step": 1650, |
| "valid_targets_mean": 4656.7, |
| "valid_targets_min": 323 |
| }, |
| { |
| "epoch": 2.484984984984985, |
| "grad_norm": 0.3927761927981878, |
| "learning_rate": 3.260482886317745e-05, |
| "loss": 0.2586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2354969084262848, |
| "step": 1655, |
| "valid_targets_mean": 6819.5, |
| "valid_targets_min": 769 |
| }, |
| { |
| "epoch": 2.4924924924924925, |
| "grad_norm": 0.5095139881585496, |
| "learning_rate": 3.254659689027656e-05, |
| "loss": 0.2822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25443506240844727, |
| "step": 1660, |
| "valid_targets_mean": 4691.8, |
| "valid_targets_min": 754 |
| }, |
| { |
| "epoch": 2.5, |
| "grad_norm": 0.48122470806496775, |
| "learning_rate": 3.2488189003028456e-05, |
| "loss": 0.2512, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25341033935546875, |
| "step": 1665, |
| "valid_targets_mean": 5473.4, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 2.5075075075075075, |
| "grad_norm": 0.535101793490416, |
| "learning_rate": 3.24296060203632e-05, |
| "loss": 0.2725, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29341810941696167, |
| "step": 1670, |
| "valid_targets_mean": 4545.0, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 2.515015015015015, |
| "grad_norm": 0.5407510878775967, |
| "learning_rate": 3.2370848763665854e-05, |
| "loss": 0.2631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.298563152551651, |
| "step": 1675, |
| "valid_targets_mean": 4343.1, |
| "valid_targets_min": 487 |
| }, |
| { |
| "epoch": 2.5225225225225225, |
| "grad_norm": 0.7328443730397846, |
| "learning_rate": 3.231191805676494e-05, |
| "loss": 0.2687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24576136469841003, |
| "step": 1680, |
| "valid_targets_mean": 4246.7, |
| "valid_targets_min": 381 |
| }, |
| { |
| "epoch": 2.53003003003003, |
| "grad_norm": 0.4953608748768144, |
| "learning_rate": 3.22528147259209e-05, |
| "loss": 0.2894, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3240085542201996, |
| "step": 1685, |
| "valid_targets_mean": 5762.2, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 2.5375375375375375, |
| "grad_norm": 0.6439990940182198, |
| "learning_rate": 3.2193539599814546e-05, |
| "loss": 0.2563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2948322892189026, |
| "step": 1690, |
| "valid_targets_mean": 3211.7, |
| "valid_targets_min": 785 |
| }, |
| { |
| "epoch": 2.545045045045045, |
| "grad_norm": 0.5649997969615153, |
| "learning_rate": 3.213409350953539e-05, |
| "loss": 0.2763, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2883799374103546, |
| "step": 1695, |
| "valid_targets_mean": 3863.2, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 2.5525525525525525, |
| "grad_norm": 0.6654178682497041, |
| "learning_rate": 3.207447728857e-05, |
| "loss": 0.2697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2643584907054901, |
| "step": 1700, |
| "valid_targets_mean": 3119.7, |
| "valid_targets_min": 557 |
| }, |
| { |
| "epoch": 2.56006006006006, |
| "grad_norm": 0.6865303086852059, |
| "learning_rate": 3.201469177279036e-05, |
| "loss": 0.2489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27196943759918213, |
| "step": 1705, |
| "valid_targets_mean": 2167.2, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 2.5675675675675675, |
| "grad_norm": 0.5565838052443746, |
| "learning_rate": 3.195473780044208e-05, |
| "loss": 0.2622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2557700276374817, |
| "step": 1710, |
| "valid_targets_mean": 3659.3, |
| "valid_targets_min": 446 |
| }, |
| { |
| "epoch": 2.575075075075075, |
| "grad_norm": 0.5197442676457078, |
| "learning_rate": 3.189461621213271e-05, |
| "loss": 0.2617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2678113579750061, |
| "step": 1715, |
| "valid_targets_mean": 4663.4, |
| "valid_targets_min": 609 |
| }, |
| { |
| "epoch": 2.5825825825825826, |
| "grad_norm": 0.5166944613990696, |
| "learning_rate": 3.18343278508199e-05, |
| "loss": 0.2584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24757936596870422, |
| "step": 1720, |
| "valid_targets_mean": 4511.7, |
| "valid_targets_min": 460 |
| }, |
| { |
| "epoch": 2.59009009009009, |
| "grad_norm": 0.4761985812024692, |
| "learning_rate": 3.177387356179962e-05, |
| "loss": 0.2292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20293045043945312, |
| "step": 1725, |
| "valid_targets_mean": 4317.4, |
| "valid_targets_min": 477 |
| }, |
| { |
| "epoch": 2.5975975975975976, |
| "grad_norm": 0.5529954148422914, |
| "learning_rate": 3.1713254192694284e-05, |
| "loss": 0.2407, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24401406943798065, |
| "step": 1730, |
| "valid_targets_mean": 3834.1, |
| "valid_targets_min": 610 |
| }, |
| { |
| "epoch": 2.605105105105105, |
| "grad_norm": 0.4955364019562657, |
| "learning_rate": 3.1652470593440885e-05, |
| "loss": 0.2746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22095078229904175, |
| "step": 1735, |
| "valid_targets_mean": 5501.8, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 2.6126126126126126, |
| "grad_norm": 0.45641687982187235, |
| "learning_rate": 3.1591523616279055e-05, |
| "loss": 0.2507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20338258147239685, |
| "step": 1740, |
| "valid_targets_mean": 4772.7, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 2.62012012012012, |
| "grad_norm": 0.6226280659286444, |
| "learning_rate": 3.153041411573914e-05, |
| "loss": 0.2552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3405519723892212, |
| "step": 1745, |
| "valid_targets_mean": 4217.1, |
| "valid_targets_min": 518 |
| }, |
| { |
| "epoch": 2.6276276276276276, |
| "grad_norm": 0.6357283334230661, |
| "learning_rate": 3.1469142948630194e-05, |
| "loss": 0.2552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27663713693618774, |
| "step": 1750, |
| "valid_targets_mean": 3277.6, |
| "valid_targets_min": 416 |
| }, |
| { |
| "epoch": 2.635135135135135, |
| "grad_norm": 0.5459413685496709, |
| "learning_rate": 3.140771097402798e-05, |
| "loss": 0.2528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.257800430059433, |
| "step": 1755, |
| "valid_targets_mean": 4285.2, |
| "valid_targets_min": 485 |
| }, |
| { |
| "epoch": 2.6426426426426426, |
| "grad_norm": 0.5121436251283435, |
| "learning_rate": 3.134611905326295e-05, |
| "loss": 0.2374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2595219910144806, |
| "step": 1760, |
| "valid_targets_mean": 4998.1, |
| "valid_targets_min": 900 |
| }, |
| { |
| "epoch": 2.65015015015015, |
| "grad_norm": 0.5290785372037086, |
| "learning_rate": 3.12843680499081e-05, |
| "loss": 0.2823, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.380996972322464, |
| "step": 1765, |
| "valid_targets_mean": 5265.2, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 2.6576576576576576, |
| "grad_norm": 0.7048181374115327, |
| "learning_rate": 3.122245882976693e-05, |
| "loss": 0.2989, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2908703684806824, |
| "step": 1770, |
| "valid_targets_mean": 2736.2, |
| "valid_targets_min": 909 |
| }, |
| { |
| "epoch": 2.665165165165165, |
| "grad_norm": 0.47236135012538977, |
| "learning_rate": 3.116039226086128e-05, |
| "loss": 0.2746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30878859758377075, |
| "step": 1775, |
| "valid_targets_mean": 5567.8, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 2.6726726726726726, |
| "grad_norm": 0.5445102500932314, |
| "learning_rate": 3.1098169213419155e-05, |
| "loss": 0.2366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2582714259624481, |
| "step": 1780, |
| "valid_targets_mean": 3773.7, |
| "valid_targets_min": 376 |
| }, |
| { |
| "epoch": 2.68018018018018, |
| "grad_norm": 0.4265129001988632, |
| "learning_rate": 3.103579055986251e-05, |
| "loss": 0.2629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2143097072839737, |
| "step": 1785, |
| "valid_targets_mean": 5390.5, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 2.6876876876876876, |
| "grad_norm": 0.5312743639290497, |
| "learning_rate": 3.0973257174795074e-05, |
| "loss": 0.2788, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3563080430030823, |
| "step": 1790, |
| "valid_targets_mean": 4896.1, |
| "valid_targets_min": 666 |
| }, |
| { |
| "epoch": 2.695195195195195, |
| "grad_norm": 0.46913349560934214, |
| "learning_rate": 3.0910569934990004e-05, |
| "loss": 0.2995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22366014122962952, |
| "step": 1795, |
| "valid_targets_mean": 5595.9, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 2.7027027027027026, |
| "grad_norm": 0.4542845059111592, |
| "learning_rate": 3.084772971937766e-05, |
| "loss": 0.2346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.238237202167511, |
| "step": 1800, |
| "valid_targets_mean": 4653.6, |
| "valid_targets_min": 745 |
| }, |
| { |
| "epoch": 2.71021021021021, |
| "grad_norm": 0.5378230783334604, |
| "learning_rate": 3.078473740903325e-05, |
| "loss": 0.2585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30502867698669434, |
| "step": 1805, |
| "valid_targets_mean": 4299.5, |
| "valid_targets_min": 755 |
| }, |
| { |
| "epoch": 2.7177177177177176, |
| "grad_norm": 0.5591431243642122, |
| "learning_rate": 3.07215938871645e-05, |
| "loss": 0.2414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.232755646109581, |
| "step": 1810, |
| "valid_targets_mean": 3461.2, |
| "valid_targets_min": 744 |
| }, |
| { |
| "epoch": 2.725225225225225, |
| "grad_norm": 0.6091187770028943, |
| "learning_rate": 3.0658300039099235e-05, |
| "loss": 0.2612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2591820955276489, |
| "step": 1815, |
| "valid_targets_mean": 3384.4, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 2.7327327327327327, |
| "grad_norm": 0.6447111768897391, |
| "learning_rate": 3.0594856752272987e-05, |
| "loss": 0.2546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25599902868270874, |
| "step": 1820, |
| "valid_targets_mean": 3581.4, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 2.74024024024024, |
| "grad_norm": 0.44894238539094306, |
| "learning_rate": 3.053126491621657e-05, |
| "loss": 0.2745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2371259331703186, |
| "step": 1825, |
| "valid_targets_mean": 4889.4, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 2.7477477477477477, |
| "grad_norm": 0.5214275290965238, |
| "learning_rate": 3.046752542254357e-05, |
| "loss": 0.2397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22412139177322388, |
| "step": 1830, |
| "valid_targets_mean": 3863.1, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 2.755255255255255, |
| "grad_norm": 0.5573497856924043, |
| "learning_rate": 3.0403639164937865e-05, |
| "loss": 0.2636, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24575021862983704, |
| "step": 1835, |
| "valid_targets_mean": 3198.3, |
| "valid_targets_min": 461 |
| }, |
| { |
| "epoch": 2.7627627627627627, |
| "grad_norm": 0.47880699639373114, |
| "learning_rate": 3.0339607039141107e-05, |
| "loss": 0.2303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25173407793045044, |
| "step": 1840, |
| "valid_targets_mean": 4396.7, |
| "valid_targets_min": 277 |
| }, |
| { |
| "epoch": 2.77027027027027, |
| "grad_norm": 0.5293345660103224, |
| "learning_rate": 3.027542994294013e-05, |
| "loss": 0.2464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24035535752773285, |
| "step": 1845, |
| "valid_targets_mean": 3506.6, |
| "valid_targets_min": 562 |
| }, |
| { |
| "epoch": 2.7777777777777777, |
| "grad_norm": 0.5030154656400301, |
| "learning_rate": 3.0211108776154394e-05, |
| "loss": 0.27, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24871063232421875, |
| "step": 1850, |
| "valid_targets_mean": 4511.1, |
| "valid_targets_min": 654 |
| }, |
| { |
| "epoch": 2.785285285285285, |
| "grad_norm": 0.4172382663816932, |
| "learning_rate": 3.0146644440623355e-05, |
| "loss": 0.2676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22848474979400635, |
| "step": 1855, |
| "valid_targets_mean": 5617.8, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 2.7927927927927927, |
| "grad_norm": 0.6045475468870822, |
| "learning_rate": 3.0082037840193812e-05, |
| "loss": 0.2434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26820242404937744, |
| "step": 1860, |
| "valid_targets_mean": 3179.9, |
| "valid_targets_min": 612 |
| }, |
| { |
| "epoch": 2.8003003003003, |
| "grad_norm": 0.5418178665003754, |
| "learning_rate": 3.001728988070724e-05, |
| "loss": 0.3025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3145066499710083, |
| "step": 1865, |
| "valid_targets_mean": 4837.1, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 2.8078078078078077, |
| "grad_norm": 0.5134558903404736, |
| "learning_rate": 2.995240146998712e-05, |
| "loss": 0.2523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21890783309936523, |
| "step": 1870, |
| "valid_targets_mean": 4246.1, |
| "valid_targets_min": 536 |
| }, |
| { |
| "epoch": 2.815315315315315, |
| "grad_norm": 0.583571397927643, |
| "learning_rate": 2.9887373517826153e-05, |
| "loss": 0.2692, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27330344915390015, |
| "step": 1875, |
| "valid_targets_mean": 3632.4, |
| "valid_targets_min": 630 |
| }, |
| { |
| "epoch": 2.8228228228228227, |
| "grad_norm": 0.47961940508462947, |
| "learning_rate": 2.9822206935973548e-05, |
| "loss": 0.2635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2063194215297699, |
| "step": 1880, |
| "valid_targets_mean": 4621.7, |
| "valid_targets_min": 492 |
| }, |
| { |
| "epoch": 2.83033033033033, |
| "grad_norm": 0.5920736352732671, |
| "learning_rate": 2.9756902638122213e-05, |
| "loss": 0.2319, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23864233493804932, |
| "step": 1885, |
| "valid_targets_mean": 4123.9, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 2.8378378378378377, |
| "grad_norm": 0.5565272788823533, |
| "learning_rate": 2.969146153989598e-05, |
| "loss": 0.2509, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22772765159606934, |
| "step": 1890, |
| "valid_targets_mean": 3277.6, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 2.8453453453453452, |
| "grad_norm": 0.6239789579469722, |
| "learning_rate": 2.9625884558836716e-05, |
| "loss": 0.2457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26187804341316223, |
| "step": 1895, |
| "valid_targets_mean": 2902.2, |
| "valid_targets_min": 503 |
| }, |
| { |
| "epoch": 2.8528528528528527, |
| "grad_norm": 0.5680461426104465, |
| "learning_rate": 2.95601726143915e-05, |
| "loss": 0.2528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3167528510093689, |
| "step": 1900, |
| "valid_targets_mean": 4054.1, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 2.8603603603603602, |
| "grad_norm": 0.45456838507650504, |
| "learning_rate": 2.949432662789971e-05, |
| "loss": 0.2483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29696983098983765, |
| "step": 1905, |
| "valid_targets_mean": 6072.6, |
| "valid_targets_min": 598 |
| }, |
| { |
| "epoch": 2.8678678678678677, |
| "grad_norm": 0.496183629571747, |
| "learning_rate": 2.942834752258012e-05, |
| "loss": 0.2392, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21913406252861023, |
| "step": 1910, |
| "valid_targets_mean": 4109.5, |
| "valid_targets_min": 879 |
| }, |
| { |
| "epoch": 2.8753753753753752, |
| "grad_norm": 0.5334630488557025, |
| "learning_rate": 2.936223622351794e-05, |
| "loss": 0.2325, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31040453910827637, |
| "step": 1915, |
| "valid_targets_mean": 4864.2, |
| "valid_targets_min": 328 |
| }, |
| { |
| "epoch": 2.8828828828828827, |
| "grad_norm": 0.5005858977972606, |
| "learning_rate": 2.929599365765185e-05, |
| "loss": 0.2493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31291884183883667, |
| "step": 1920, |
| "valid_targets_mean": 5317.4, |
| "valid_targets_min": 547 |
| }, |
| { |
| "epoch": 2.8903903903903903, |
| "grad_norm": 0.4974443542961955, |
| "learning_rate": 2.9229620753761013e-05, |
| "loss": 0.2473, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.301303505897522, |
| "step": 1925, |
| "valid_targets_mean": 4499.8, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 2.8978978978978978, |
| "grad_norm": 0.5691190427521686, |
| "learning_rate": 2.9163118442452046e-05, |
| "loss": 0.2449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27089810371398926, |
| "step": 1930, |
| "valid_targets_mean": 4097.7, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 2.9054054054054053, |
| "grad_norm": 0.4198119186033015, |
| "learning_rate": 2.9096487656145968e-05, |
| "loss": 0.2596, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24759484827518463, |
| "step": 1935, |
| "valid_targets_mean": 6335.4, |
| "valid_targets_min": 564 |
| }, |
| { |
| "epoch": 2.9129129129129128, |
| "grad_norm": 0.5531720093912547, |
| "learning_rate": 2.9029729329065134e-05, |
| "loss": 0.2598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23836839199066162, |
| "step": 1940, |
| "valid_targets_mean": 3271.4, |
| "valid_targets_min": 510 |
| }, |
| { |
| "epoch": 2.9204204204204203, |
| "grad_norm": 0.4289864597777698, |
| "learning_rate": 2.896284439722013e-05, |
| "loss": 0.2767, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2916072607040405, |
| "step": 1945, |
| "valid_targets_mean": 6052.6, |
| "valid_targets_min": 466 |
| }, |
| { |
| "epoch": 2.9279279279279278, |
| "grad_norm": 0.47685929908340674, |
| "learning_rate": 2.8895833798396657e-05, |
| "loss": 0.2414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22440025210380554, |
| "step": 1950, |
| "valid_targets_mean": 4654.8, |
| "valid_targets_min": 550 |
| }, |
| { |
| "epoch": 2.9354354354354353, |
| "grad_norm": 0.4511746235008368, |
| "learning_rate": 2.882869847214237e-05, |
| "loss": 0.2683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2768084406852722, |
| "step": 1955, |
| "valid_targets_mean": 6411.6, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 2.942942942942943, |
| "grad_norm": 0.3897834130570682, |
| "learning_rate": 2.876143935975373e-05, |
| "loss": 0.2327, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23787030577659607, |
| "step": 1960, |
| "valid_targets_mean": 6063.3, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 2.9504504504504503, |
| "grad_norm": 0.5645744222530638, |
| "learning_rate": 2.8694057404262757e-05, |
| "loss": 0.2618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26880699396133423, |
| "step": 1965, |
| "valid_targets_mean": 3741.8, |
| "valid_targets_min": 651 |
| }, |
| { |
| "epoch": 2.957957957957958, |
| "grad_norm": 0.48669690646418146, |
| "learning_rate": 2.862655355042387e-05, |
| "loss": 0.261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33517420291900635, |
| "step": 1970, |
| "valid_targets_mean": 5469.8, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 2.9654654654654653, |
| "grad_norm": 0.4988811225771945, |
| "learning_rate": 2.85589287447006e-05, |
| "loss": 0.2573, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2532571256160736, |
| "step": 1975, |
| "valid_targets_mean": 4500.7, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 2.972972972972973, |
| "grad_norm": 0.5067859361295777, |
| "learning_rate": 2.849118393525233e-05, |
| "loss": 0.2958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22295460104942322, |
| "step": 1980, |
| "valid_targets_mean": 4019.2, |
| "valid_targets_min": 439 |
| }, |
| { |
| "epoch": 2.9804804804804803, |
| "grad_norm": 0.5614437078904748, |
| "learning_rate": 2.8423320071920986e-05, |
| "loss": 0.2496, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25288334488868713, |
| "step": 1985, |
| "valid_targets_mean": 3232.5, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 2.987987987987988, |
| "grad_norm": 0.4074367928471507, |
| "learning_rate": 2.835533810621777e-05, |
| "loss": 0.2508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22124746441841125, |
| "step": 1990, |
| "valid_targets_mean": 6511.8, |
| "valid_targets_min": 610 |
| }, |
| { |
| "epoch": 2.9954954954954953, |
| "grad_norm": 0.4746388334736856, |
| "learning_rate": 2.8287238991309746e-05, |
| "loss": 0.2591, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22991371154785156, |
| "step": 1995, |
| "valid_targets_mean": 4459.8, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 3.003003003003003, |
| "grad_norm": 0.5433525185386173, |
| "learning_rate": 2.8219023682006533e-05, |
| "loss": 0.261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2538215219974518, |
| "step": 2000, |
| "valid_targets_mean": 3868.6, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 3.0105105105105103, |
| "grad_norm": 0.6522092709294501, |
| "learning_rate": 2.8150693134746895e-05, |
| "loss": 0.2505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25473958253860474, |
| "step": 2005, |
| "valid_targets_mean": 4023.8, |
| "valid_targets_min": 939 |
| }, |
| { |
| "epoch": 3.018018018018018, |
| "grad_norm": 0.4893307325525604, |
| "learning_rate": 2.8082248307585332e-05, |
| "loss": 0.2284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20237843692302704, |
| "step": 2010, |
| "valid_targets_mean": 4555.2, |
| "valid_targets_min": 590 |
| }, |
| { |
| "epoch": 3.0255255255255253, |
| "grad_norm": 0.4667369885254396, |
| "learning_rate": 2.801369016017865e-05, |
| "loss": 0.2271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18705838918685913, |
| "step": 2015, |
| "valid_targets_mean": 4288.2, |
| "valid_targets_min": 690 |
| }, |
| { |
| "epoch": 3.033033033033033, |
| "grad_norm": 0.49033218061993816, |
| "learning_rate": 2.7945019653772504e-05, |
| "loss": 0.2433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2408279925584793, |
| "step": 2020, |
| "valid_targets_mean": 5262.1, |
| "valid_targets_min": 515 |
| }, |
| { |
| "epoch": 3.0405405405405403, |
| "grad_norm": 0.5391107334148109, |
| "learning_rate": 2.7876237751187917e-05, |
| "loss": 0.2436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21394947171211243, |
| "step": 2025, |
| "valid_targets_mean": 3897.1, |
| "valid_targets_min": 1733 |
| }, |
| { |
| "epoch": 3.048048048048048, |
| "grad_norm": 0.6193116901994394, |
| "learning_rate": 2.7807345416807793e-05, |
| "loss": 0.2442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23730601370334625, |
| "step": 2030, |
| "valid_targets_mean": 3262.4, |
| "valid_targets_min": 439 |
| }, |
| { |
| "epoch": 3.0555555555555554, |
| "grad_norm": 0.5319064047511843, |
| "learning_rate": 2.773834361656339e-05, |
| "loss": 0.2363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2560746669769287, |
| "step": 2035, |
| "valid_targets_mean": 4626.2, |
| "valid_targets_min": 550 |
| }, |
| { |
| "epoch": 3.063063063063063, |
| "grad_norm": 0.7633521135620636, |
| "learning_rate": 2.766923331792075e-05, |
| "loss": 0.2507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30914023518562317, |
| "step": 2040, |
| "valid_targets_mean": 3140.8, |
| "valid_targets_min": 595 |
| }, |
| { |
| "epoch": 3.0705705705705704, |
| "grad_norm": 1.0068010745411222, |
| "learning_rate": 2.7600015489867188e-05, |
| "loss": 0.2413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2271232008934021, |
| "step": 2045, |
| "valid_targets_mean": 4060.6, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 3.078078078078078, |
| "grad_norm": 0.5451000708994922, |
| "learning_rate": 2.753069110289766e-05, |
| "loss": 0.2459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22742116451263428, |
| "step": 2050, |
| "valid_targets_mean": 3681.6, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 3.0855855855855854, |
| "grad_norm": 0.5547733055241225, |
| "learning_rate": 2.7461261129001174e-05, |
| "loss": 0.2353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24244071543216705, |
| "step": 2055, |
| "valid_targets_mean": 3975.5, |
| "valid_targets_min": 495 |
| }, |
| { |
| "epoch": 3.093093093093093, |
| "grad_norm": 0.42158312641460743, |
| "learning_rate": 2.7391726541647163e-05, |
| "loss": 0.2154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1724860966205597, |
| "step": 2060, |
| "valid_targets_mean": 5298.3, |
| "valid_targets_min": 423 |
| }, |
| { |
| "epoch": 3.1006006006006004, |
| "grad_norm": 0.5499035304566007, |
| "learning_rate": 2.7322088315771834e-05, |
| "loss": 0.2427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24446254968643188, |
| "step": 2065, |
| "valid_targets_mean": 3607.4, |
| "valid_targets_min": 478 |
| }, |
| { |
| "epoch": 3.108108108108108, |
| "grad_norm": 0.5590055107325951, |
| "learning_rate": 2.725234742776448e-05, |
| "loss": 0.2278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23849673569202423, |
| "step": 2070, |
| "valid_targets_mean": 5030.8, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 3.1156156156156154, |
| "grad_norm": 0.478630517596832, |
| "learning_rate": 2.7182504855453834e-05, |
| "loss": 0.2499, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20381265878677368, |
| "step": 2075, |
| "valid_targets_mean": 4702.2, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 3.123123123123123, |
| "grad_norm": 0.5451665017950299, |
| "learning_rate": 2.7112561578094327e-05, |
| "loss": 0.224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2420223355293274, |
| "step": 2080, |
| "valid_targets_mean": 5865.1, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 3.1306306306306304, |
| "grad_norm": 0.5244203768707708, |
| "learning_rate": 2.704251857635234e-05, |
| "loss": 0.2323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20124025642871857, |
| "step": 2085, |
| "valid_targets_mean": 3856.1, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 3.138138138138138, |
| "grad_norm": 0.553596247360053, |
| "learning_rate": 2.69723768322925e-05, |
| "loss": 0.2429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2544230818748474, |
| "step": 2090, |
| "valid_targets_mean": 3771.1, |
| "valid_targets_min": 479 |
| }, |
| { |
| "epoch": 3.1456456456456454, |
| "grad_norm": 0.5826774718951724, |
| "learning_rate": 2.6902137329363892e-05, |
| "loss": 0.2476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27420639991760254, |
| "step": 2095, |
| "valid_targets_mean": 3996.2, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 3.153153153153153, |
| "grad_norm": 0.6143348318690984, |
| "learning_rate": 2.683180105238625e-05, |
| "loss": 0.2307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2823088765144348, |
| "step": 2100, |
| "valid_targets_mean": 3603.2, |
| "valid_targets_min": 664 |
| }, |
| { |
| "epoch": 3.1606606606606604, |
| "grad_norm": 0.5590576178147459, |
| "learning_rate": 2.676136898753617e-05, |
| "loss": 0.2448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25955310463905334, |
| "step": 2105, |
| "valid_targets_mean": 3985.4, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 3.1681681681681684, |
| "grad_norm": 0.596190398717275, |
| "learning_rate": 2.6690842122333286e-05, |
| "loss": 0.2255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24386368691921234, |
| "step": 2110, |
| "valid_targets_mean": 3912.7, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 3.175675675675676, |
| "grad_norm": 0.6071315295064825, |
| "learning_rate": 2.6620221445626416e-05, |
| "loss": 0.2096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23695698380470276, |
| "step": 2115, |
| "valid_targets_mean": 3008.4, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 3.1831831831831834, |
| "grad_norm": 0.6533097039267628, |
| "learning_rate": 2.6549507947579685e-05, |
| "loss": 0.2575, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2619466185569763, |
| "step": 2120, |
| "valid_targets_mean": 5412.9, |
| "valid_targets_min": 491 |
| }, |
| { |
| "epoch": 3.190690690690691, |
| "grad_norm": 0.49336937759151656, |
| "learning_rate": 2.6478702619658672e-05, |
| "loss": 0.2538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23457828164100647, |
| "step": 2125, |
| "valid_targets_mean": 4639.4, |
| "valid_targets_min": 456 |
| }, |
| { |
| "epoch": 3.1981981981981984, |
| "grad_norm": 0.48643384497808734, |
| "learning_rate": 2.6407806454616472e-05, |
| "loss": 0.2368, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18629509210586548, |
| "step": 2130, |
| "valid_targets_mean": 3978.7, |
| "valid_targets_min": 815 |
| }, |
| { |
| "epoch": 3.205705705705706, |
| "grad_norm": 0.7137473060732604, |
| "learning_rate": 2.633682044647982e-05, |
| "loss": 0.2492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34111836552619934, |
| "step": 2135, |
| "valid_targets_mean": 2986.7, |
| "valid_targets_min": 211 |
| }, |
| { |
| "epoch": 3.2132132132132134, |
| "grad_norm": 0.4960650096175783, |
| "learning_rate": 2.626574559053512e-05, |
| "loss": 0.254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2693920433521271, |
| "step": 2140, |
| "valid_targets_mean": 6290.2, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 3.220720720720721, |
| "grad_norm": 0.543711754415262, |
| "learning_rate": 2.619458288331449e-05, |
| "loss": 0.2648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34854060411453247, |
| "step": 2145, |
| "valid_targets_mean": 4955.6, |
| "valid_targets_min": 273 |
| }, |
| { |
| "epoch": 3.2282282282282284, |
| "grad_norm": 0.4118913840003615, |
| "learning_rate": 2.6123333322581806e-05, |
| "loss": 0.2272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22846825420856476, |
| "step": 2150, |
| "valid_targets_mean": 6945.4, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 3.235735735735736, |
| "grad_norm": 0.6226838119580127, |
| "learning_rate": 2.6051997907318724e-05, |
| "loss": 0.2492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2525981664657593, |
| "step": 2155, |
| "valid_targets_mean": 3692.9, |
| "valid_targets_min": 649 |
| }, |
| { |
| "epoch": 3.2432432432432434, |
| "grad_norm": 0.4814778903119386, |
| "learning_rate": 2.5980577637710632e-05, |
| "loss": 0.2397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21874025464057922, |
| "step": 2160, |
| "valid_targets_mean": 5269.8, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 3.250750750750751, |
| "grad_norm": 0.48643926272296106, |
| "learning_rate": 2.5909073515132667e-05, |
| "loss": 0.2508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23266538977622986, |
| "step": 2165, |
| "valid_targets_mean": 4732.6, |
| "valid_targets_min": 898 |
| }, |
| { |
| "epoch": 3.2582582582582584, |
| "grad_norm": 0.5108891449221944, |
| "learning_rate": 2.5837486542135648e-05, |
| "loss": 0.2329, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2183685451745987, |
| "step": 2170, |
| "valid_targets_mean": 4184.6, |
| "valid_targets_min": 659 |
| }, |
| { |
| "epoch": 3.265765765765766, |
| "grad_norm": 0.5625875087588166, |
| "learning_rate": 2.576581772243204e-05, |
| "loss": 0.2766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21907004714012146, |
| "step": 2175, |
| "valid_targets_mean": 5702.3, |
| "valid_targets_min": 447 |
| }, |
| { |
| "epoch": 3.2732732732732734, |
| "grad_norm": 0.44524330986567173, |
| "learning_rate": 2.5694068060881856e-05, |
| "loss": 0.2347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2379521131515503, |
| "step": 2180, |
| "valid_targets_mean": 5613.1, |
| "valid_targets_min": 444 |
| }, |
| { |
| "epoch": 3.280780780780781, |
| "grad_norm": 0.41557044227218803, |
| "learning_rate": 2.5622238563478603e-05, |
| "loss": 0.2161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1911526620388031, |
| "step": 2185, |
| "valid_targets_mean": 6414.1, |
| "valid_targets_min": 926 |
| }, |
| { |
| "epoch": 3.2882882882882885, |
| "grad_norm": 0.6461866697440014, |
| "learning_rate": 2.555033023733514e-05, |
| "loss": 0.2227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2639209032058716, |
| "step": 2190, |
| "valid_targets_mean": 3629.4, |
| "valid_targets_min": 580 |
| }, |
| { |
| "epoch": 3.295795795795796, |
| "grad_norm": 0.5159050633898964, |
| "learning_rate": 2.547834409066958e-05, |
| "loss": 0.2363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27777135372161865, |
| "step": 2195, |
| "valid_targets_mean": 5053.3, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 3.3033033033033035, |
| "grad_norm": 0.477902570867691, |
| "learning_rate": 2.540628113279116e-05, |
| "loss": 0.2412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3054026961326599, |
| "step": 2200, |
| "valid_targets_mean": 6047.9, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 3.310810810810811, |
| "grad_norm": 0.45215264311766057, |
| "learning_rate": 2.5334142374086053e-05, |
| "loss": 0.2229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22195221483707428, |
| "step": 2205, |
| "valid_targets_mean": 5648.2, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 3.3183183183183185, |
| "grad_norm": 0.8158948988984059, |
| "learning_rate": 2.5261928826003246e-05, |
| "loss": 0.2694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3665313720703125, |
| "step": 2210, |
| "valid_targets_mean": 4771.2, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 3.325825825825826, |
| "grad_norm": 0.6202523003371706, |
| "learning_rate": 2.518964150104034e-05, |
| "loss": 0.242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22199711203575134, |
| "step": 2215, |
| "valid_targets_mean": 2897.6, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 3.3333333333333335, |
| "grad_norm": 0.6530333048449412, |
| "learning_rate": 2.511728141272934e-05, |
| "loss": 0.2304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24529844522476196, |
| "step": 2220, |
| "valid_targets_mean": 3370.7, |
| "valid_targets_min": 503 |
| }, |
| { |
| "epoch": 3.340840840840841, |
| "grad_norm": 0.5905198582269967, |
| "learning_rate": 2.5044849575622458e-05, |
| "loss": 0.2272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2153581976890564, |
| "step": 2225, |
| "valid_targets_mean": 4749.2, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 3.3483483483483485, |
| "grad_norm": 0.4868966063934165, |
| "learning_rate": 2.4972347005277903e-05, |
| "loss": 0.2831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2968922257423401, |
| "step": 2230, |
| "valid_targets_mean": 5965.1, |
| "valid_targets_min": 498 |
| }, |
| { |
| "epoch": 3.355855855855856, |
| "grad_norm": 0.8961039788278082, |
| "learning_rate": 2.489977471824561e-05, |
| "loss": 0.2348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23392842710018158, |
| "step": 2235, |
| "valid_targets_mean": 3846.9, |
| "valid_targets_min": 368 |
| }, |
| { |
| "epoch": 3.3633633633633635, |
| "grad_norm": 0.6752840687920286, |
| "learning_rate": 2.4827133732053014e-05, |
| "loss": 0.2576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25479578971862793, |
| "step": 2240, |
| "valid_targets_mean": 3281.4, |
| "valid_targets_min": 291 |
| }, |
| { |
| "epoch": 3.370870870870871, |
| "grad_norm": 0.5573523830693498, |
| "learning_rate": 2.475442506519077e-05, |
| "loss": 0.2353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20670834183692932, |
| "step": 2245, |
| "valid_targets_mean": 3441.7, |
| "valid_targets_min": 637 |
| }, |
| { |
| "epoch": 3.3783783783783785, |
| "grad_norm": 0.47716647459061995, |
| "learning_rate": 2.468164973709847e-05, |
| "loss": 0.2249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21283169090747833, |
| "step": 2250, |
| "valid_targets_mean": 4464.2, |
| "valid_targets_min": 910 |
| }, |
| { |
| "epoch": 3.385885885885886, |
| "grad_norm": 0.5064998483360107, |
| "learning_rate": 2.4608808768150357e-05, |
| "loss": 0.2216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19695068895816803, |
| "step": 2255, |
| "valid_targets_mean": 3949.1, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 3.3933933933933935, |
| "grad_norm": 0.5175599454597674, |
| "learning_rate": 2.4535903179641026e-05, |
| "loss": 0.2265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2480076104402542, |
| "step": 2260, |
| "valid_targets_mean": 5609.1, |
| "valid_targets_min": 1410 |
| }, |
| { |
| "epoch": 3.400900900900901, |
| "grad_norm": 0.42240678217071037, |
| "learning_rate": 2.4462933993771088e-05, |
| "loss": 0.2399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26719754934310913, |
| "step": 2265, |
| "valid_targets_mean": 6515.5, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 3.4084084084084085, |
| "grad_norm": 0.506514863267876, |
| "learning_rate": 2.438990223363284e-05, |
| "loss": 0.2589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25513604283332825, |
| "step": 2270, |
| "valid_targets_mean": 4471.0, |
| "valid_targets_min": 732 |
| }, |
| { |
| "epoch": 3.415915915915916, |
| "grad_norm": 0.5367632072440157, |
| "learning_rate": 2.4316808923195926e-05, |
| "loss": 0.2387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22310830652713776, |
| "step": 2275, |
| "valid_targets_mean": 4361.2, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 3.4234234234234235, |
| "grad_norm": 0.44852402801221397, |
| "learning_rate": 2.4243655087293e-05, |
| "loss": 0.2582, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26332229375839233, |
| "step": 2280, |
| "valid_targets_mean": 6653.6, |
| "valid_targets_min": 583 |
| }, |
| { |
| "epoch": 3.430930930930931, |
| "grad_norm": 0.48402583907149443, |
| "learning_rate": 2.4170441751605308e-05, |
| "loss": 0.2328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24115243554115295, |
| "step": 2285, |
| "valid_targets_mean": 4474.8, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 3.4384384384384385, |
| "grad_norm": 0.58593699094807, |
| "learning_rate": 2.4097169942648356e-05, |
| "loss": 0.2145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16966642439365387, |
| "step": 2290, |
| "valid_targets_mean": 5481.7, |
| "valid_targets_min": 1177 |
| }, |
| { |
| "epoch": 3.445945945945946, |
| "grad_norm": 0.4710415176014163, |
| "learning_rate": 2.4023840687757476e-05, |
| "loss": 0.2432, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20201632380485535, |
| "step": 2295, |
| "valid_targets_mean": 5250.4, |
| "valid_targets_min": 717 |
| }, |
| { |
| "epoch": 3.4534534534534536, |
| "grad_norm": 0.5084005135734221, |
| "learning_rate": 2.395045501507347e-05, |
| "loss": 0.2254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20893435180187225, |
| "step": 2300, |
| "valid_targets_mean": 4357.3, |
| "valid_targets_min": 489 |
| }, |
| { |
| "epoch": 3.460960960960961, |
| "grad_norm": 0.619899875868498, |
| "learning_rate": 2.387701395352815e-05, |
| "loss": 0.227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21758192777633667, |
| "step": 2305, |
| "valid_targets_mean": 2881.0, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 3.4684684684684686, |
| "grad_norm": 0.48471567383203296, |
| "learning_rate": 2.380351853282992e-05, |
| "loss": 0.2445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24553707242012024, |
| "step": 2310, |
| "valid_targets_mean": 5598.6, |
| "valid_targets_min": 552 |
| }, |
| { |
| "epoch": 3.475975975975976, |
| "grad_norm": 0.6056696323887422, |
| "learning_rate": 2.372996978344937e-05, |
| "loss": 0.2255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26694750785827637, |
| "step": 2315, |
| "valid_targets_mean": 3924.4, |
| "valid_targets_min": 523 |
| }, |
| { |
| "epoch": 3.4834834834834836, |
| "grad_norm": 0.601885827026815, |
| "learning_rate": 2.3656368736604786e-05, |
| "loss": 0.2568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28267890214920044, |
| "step": 2320, |
| "valid_targets_mean": 3601.5, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 3.490990990990991, |
| "grad_norm": 0.6254412393703039, |
| "learning_rate": 2.3582716424247728e-05, |
| "loss": 0.2711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2540096044540405, |
| "step": 2325, |
| "valid_targets_mean": 2951.5, |
| "valid_targets_min": 537 |
| }, |
| { |
| "epoch": 3.4984984984984986, |
| "grad_norm": 0.5798449489473179, |
| "learning_rate": 2.3509013879048526e-05, |
| "loss": 0.2484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30426591634750366, |
| "step": 2330, |
| "valid_targets_mean": 4265.3, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 3.506006006006006, |
| "grad_norm": 0.4923122631477329, |
| "learning_rate": 2.3435262134381823e-05, |
| "loss": 0.2068, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1547277569770813, |
| "step": 2335, |
| "valid_targets_mean": 4490.8, |
| "valid_targets_min": 620 |
| }, |
| { |
| "epoch": 3.5135135135135136, |
| "grad_norm": 0.49204973031276056, |
| "learning_rate": 2.3361462224312094e-05, |
| "loss": 0.2224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1860155165195465, |
| "step": 2340, |
| "valid_targets_mean": 4172.9, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 3.521021021021021, |
| "grad_norm": 0.5430832529381092, |
| "learning_rate": 2.3287615183579126e-05, |
| "loss": 0.2485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23752620816230774, |
| "step": 2345, |
| "valid_targets_mean": 3755.6, |
| "valid_targets_min": 762 |
| }, |
| { |
| "epoch": 3.5285285285285286, |
| "grad_norm": 0.47304505139451253, |
| "learning_rate": 2.3213722047583517e-05, |
| "loss": 0.2238, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21495875716209412, |
| "step": 2350, |
| "valid_targets_mean": 5194.9, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 3.536036036036036, |
| "grad_norm": 0.5593072985053018, |
| "learning_rate": 2.3139783852372157e-05, |
| "loss": 0.2415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32621026039123535, |
| "step": 2355, |
| "valid_targets_mean": 5330.6, |
| "valid_targets_min": 483 |
| }, |
| { |
| "epoch": 3.5435435435435436, |
| "grad_norm": 0.5133771865366825, |
| "learning_rate": 2.306580163462373e-05, |
| "loss": 0.2152, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24318471550941467, |
| "step": 2360, |
| "valid_targets_mean": 5257.0, |
| "valid_targets_min": 850 |
| }, |
| { |
| "epoch": 3.551051051051051, |
| "grad_norm": 0.7096881143231963, |
| "learning_rate": 2.299177643163413e-05, |
| "loss": 0.2412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24741387367248535, |
| "step": 2365, |
| "valid_targets_mean": 2511.2, |
| "valid_targets_min": 508 |
| }, |
| { |
| "epoch": 3.5585585585585586, |
| "grad_norm": 0.5184545440577579, |
| "learning_rate": 2.2917709281301946e-05, |
| "loss": 0.2377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28968262672424316, |
| "step": 2370, |
| "valid_targets_mean": 4808.0, |
| "valid_targets_min": 628 |
| }, |
| { |
| "epoch": 3.566066066066066, |
| "grad_norm": 0.5497412004652409, |
| "learning_rate": 2.2843601222113915e-05, |
| "loss": 0.2846, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24640163779258728, |
| "step": 2375, |
| "valid_targets_mean": 4700.1, |
| "valid_targets_min": 418 |
| }, |
| { |
| "epoch": 3.5735735735735736, |
| "grad_norm": 0.543092075993824, |
| "learning_rate": 2.2769453293130345e-05, |
| "loss": 0.2377, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2757692039012909, |
| "step": 2380, |
| "valid_targets_mean": 3818.9, |
| "valid_targets_min": 423 |
| }, |
| { |
| "epoch": 3.581081081081081, |
| "grad_norm": 0.4756311989207704, |
| "learning_rate": 2.2695266533970556e-05, |
| "loss": 0.242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2674590051174164, |
| "step": 2385, |
| "valid_targets_mean": 5847.6, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 3.5885885885885886, |
| "grad_norm": 0.7040802634858209, |
| "learning_rate": 2.2621041984798304e-05, |
| "loss": 0.2401, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27846670150756836, |
| "step": 2390, |
| "valid_targets_mean": 2509.4, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 3.596096096096096, |
| "grad_norm": 0.6323033311574447, |
| "learning_rate": 2.2546780686307183e-05, |
| "loss": 0.2495, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23559826612472534, |
| "step": 2395, |
| "valid_targets_mean": 4216.6, |
| "valid_targets_min": 608 |
| }, |
| { |
| "epoch": 3.6036036036036037, |
| "grad_norm": 0.5439419831820919, |
| "learning_rate": 2.2472483679706067e-05, |
| "loss": 0.2578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.271353542804718, |
| "step": 2400, |
| "valid_targets_mean": 4691.6, |
| "valid_targets_min": 755 |
| }, |
| { |
| "epoch": 3.611111111111111, |
| "grad_norm": 0.657338134532918, |
| "learning_rate": 2.2398152006704463e-05, |
| "loss": 0.2602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26753100752830505, |
| "step": 2405, |
| "valid_targets_mean": 3173.4, |
| "valid_targets_min": 404 |
| }, |
| { |
| "epoch": 3.6186186186186187, |
| "grad_norm": 0.45053072622125706, |
| "learning_rate": 2.232378670949795e-05, |
| "loss": 0.2137, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18780098855495453, |
| "step": 2410, |
| "valid_targets_mean": 5203.4, |
| "valid_targets_min": 1334 |
| }, |
| { |
| "epoch": 3.626126126126126, |
| "grad_norm": 0.4023749713359982, |
| "learning_rate": 2.2249388830753534e-05, |
| "loss": 0.2321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17731866240501404, |
| "step": 2415, |
| "valid_targets_mean": 5612.2, |
| "valid_targets_min": 480 |
| }, |
| { |
| "epoch": 3.6336336336336337, |
| "grad_norm": 0.5062285511706474, |
| "learning_rate": 2.217495941359506e-05, |
| "loss": 0.2514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23712016642093658, |
| "step": 2420, |
| "valid_targets_mean": 4567.2, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 3.641141141141141, |
| "grad_norm": 0.5407394227692897, |
| "learning_rate": 2.2100499501588558e-05, |
| "loss": 0.2402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25140225887298584, |
| "step": 2425, |
| "valid_targets_mean": 4480.6, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 3.6486486486486487, |
| "grad_norm": 0.5432137809783814, |
| "learning_rate": 2.2026010138727628e-05, |
| "loss": 0.2364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23100072145462036, |
| "step": 2430, |
| "valid_targets_mean": 4535.2, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 3.656156156156156, |
| "grad_norm": 0.5702741738198654, |
| "learning_rate": 2.1951492369418786e-05, |
| "loss": 0.2448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24533988535404205, |
| "step": 2435, |
| "valid_targets_mean": 4315.2, |
| "valid_targets_min": 571 |
| }, |
| { |
| "epoch": 3.6636636636636637, |
| "grad_norm": 0.6650337977127149, |
| "learning_rate": 2.1876947238466838e-05, |
| "loss": 0.256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2869791090488434, |
| "step": 2440, |
| "valid_targets_mean": 3385.6, |
| "valid_targets_min": 557 |
| }, |
| { |
| "epoch": 3.671171171171171, |
| "grad_norm": 0.473867504379004, |
| "learning_rate": 2.1802375791060232e-05, |
| "loss": 0.2315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18947833776474, |
| "step": 2445, |
| "valid_targets_mean": 5216.6, |
| "valid_targets_min": 742 |
| }, |
| { |
| "epoch": 3.6786786786786787, |
| "grad_norm": 0.7199290550127364, |
| "learning_rate": 2.1727779072756388e-05, |
| "loss": 0.2197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30827030539512634, |
| "step": 2450, |
| "valid_targets_mean": 4398.8, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 3.686186186186186, |
| "grad_norm": 0.6169439986122458, |
| "learning_rate": 2.1653158129467048e-05, |
| "loss": 0.281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2743998169898987, |
| "step": 2455, |
| "valid_targets_mean": 3159.7, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 3.6936936936936937, |
| "grad_norm": 0.630068337186312, |
| "learning_rate": 2.1578514007443602e-05, |
| "loss": 0.2446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2756376266479492, |
| "step": 2460, |
| "valid_targets_mean": 3321.1, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 3.701201201201201, |
| "grad_norm": 8.40963413100615, |
| "learning_rate": 2.1503847753262447e-05, |
| "loss": 0.2376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21705785393714905, |
| "step": 2465, |
| "valid_targets_mean": 5065.1, |
| "valid_targets_min": 1345 |
| }, |
| { |
| "epoch": 3.7087087087087087, |
| "grad_norm": 0.8840964089151675, |
| "learning_rate": 2.1429160413810268e-05, |
| "loss": 0.2268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2861403822898865, |
| "step": 2470, |
| "valid_targets_mean": 5522.8, |
| "valid_targets_min": 991 |
| }, |
| { |
| "epoch": 3.7162162162162162, |
| "grad_norm": 0.47904088821045393, |
| "learning_rate": 2.1354453036269397e-05, |
| "loss": 0.2283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.182481050491333, |
| "step": 2475, |
| "valid_targets_mean": 3823.9, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 3.7237237237237237, |
| "grad_norm": 0.6350177279756045, |
| "learning_rate": 2.1279726668103112e-05, |
| "loss": 0.2235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.289498507976532, |
| "step": 2480, |
| "valid_targets_mean": 3174.9, |
| "valid_targets_min": 597 |
| }, |
| { |
| "epoch": 3.7312312312312312, |
| "grad_norm": 0.5475085951271096, |
| "learning_rate": 2.1204982357040974e-05, |
| "loss": 0.2321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2232646644115448, |
| "step": 2485, |
| "valid_targets_mean": 3746.9, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 3.7387387387387387, |
| "grad_norm": 0.5721638552098921, |
| "learning_rate": 2.1130221151064095e-05, |
| "loss": 0.2408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2669849693775177, |
| "step": 2490, |
| "valid_targets_mean": 4861.1, |
| "valid_targets_min": 469 |
| }, |
| { |
| "epoch": 3.7462462462462462, |
| "grad_norm": 0.46167196232037994, |
| "learning_rate": 2.105544409839048e-05, |
| "loss": 0.2249, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1929030418395996, |
| "step": 2495, |
| "valid_targets_mean": 4768.8, |
| "valid_targets_min": 888 |
| }, |
| { |
| "epoch": 3.7537537537537538, |
| "grad_norm": 0.5709387953688929, |
| "learning_rate": 2.098065224746031e-05, |
| "loss": 0.2465, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26624026894569397, |
| "step": 2500, |
| "valid_targets_mean": 3260.7, |
| "valid_targets_min": 788 |
| }, |
| { |
| "epoch": 3.7612612612612613, |
| "grad_norm": 0.5636970256534266, |
| "learning_rate": 2.0905846646921266e-05, |
| "loss": 0.2595, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29653650522232056, |
| "step": 2505, |
| "valid_targets_mean": 3569.1, |
| "valid_targets_min": 856 |
| }, |
| { |
| "epoch": 3.7687687687687688, |
| "grad_norm": 0.4293486036135388, |
| "learning_rate": 2.0831028345613807e-05, |
| "loss": 0.2521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22826270759105682, |
| "step": 2510, |
| "valid_targets_mean": 5393.5, |
| "valid_targets_min": 404 |
| }, |
| { |
| "epoch": 3.7762762762762763, |
| "grad_norm": 0.5914611642027671, |
| "learning_rate": 2.0756198392556458e-05, |
| "loss": 0.2313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22963778674602509, |
| "step": 2515, |
| "valid_targets_mean": 2932.8, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 3.7837837837837838, |
| "grad_norm": 0.5163134230928269, |
| "learning_rate": 2.0681357836931114e-05, |
| "loss": 0.224, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.207438126206398, |
| "step": 2520, |
| "valid_targets_mean": 4660.4, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 3.7912912912912913, |
| "grad_norm": 0.7190308106564102, |
| "learning_rate": 2.0606507728068338e-05, |
| "loss": 0.2276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2699480652809143, |
| "step": 2525, |
| "valid_targets_mean": 2463.4, |
| "valid_targets_min": 475 |
| }, |
| { |
| "epoch": 3.798798798798799, |
| "grad_norm": 0.6346404271383566, |
| "learning_rate": 2.0531649115432626e-05, |
| "loss": 0.2426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26241040229797363, |
| "step": 2530, |
| "valid_targets_mean": 3470.4, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 3.8063063063063063, |
| "grad_norm": 0.5405574803276272, |
| "learning_rate": 2.0456783048607708e-05, |
| "loss": 0.234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2565130591392517, |
| "step": 2535, |
| "valid_targets_mean": 4024.1, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 3.813813813813814, |
| "grad_norm": 0.604890803793606, |
| "learning_rate": 2.038191057728183e-05, |
| "loss": 0.2225, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2380007952451706, |
| "step": 2540, |
| "valid_targets_mean": 3456.8, |
| "valid_targets_min": 662 |
| }, |
| { |
| "epoch": 3.8213213213213213, |
| "grad_norm": 0.6793469587756615, |
| "learning_rate": 2.0307032751233038e-05, |
| "loss": 0.2593, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2839970290660858, |
| "step": 2545, |
| "valid_targets_mean": 4329.7, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 3.828828828828829, |
| "grad_norm": 0.5213037499939942, |
| "learning_rate": 2.023215062031445e-05, |
| "loss": 0.247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2534673511981964, |
| "step": 2550, |
| "valid_targets_mean": 4234.5, |
| "valid_targets_min": 437 |
| }, |
| { |
| "epoch": 3.8363363363363363, |
| "grad_norm": 0.48716095297652656, |
| "learning_rate": 2.0157265234439545e-05, |
| "loss": 0.2399, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17926955223083496, |
| "step": 2555, |
| "valid_targets_mean": 4508.6, |
| "valid_targets_min": 404 |
| }, |
| { |
| "epoch": 3.843843843843844, |
| "grad_norm": 0.45658767125521904, |
| "learning_rate": 2.0082377643567427e-05, |
| "loss": 0.2135, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16734261810779572, |
| "step": 2560, |
| "valid_targets_mean": 4532.5, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 3.8513513513513513, |
| "grad_norm": 0.5887721035383384, |
| "learning_rate": 2.0007488897688145e-05, |
| "loss": 0.2469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2615935802459717, |
| "step": 2565, |
| "valid_targets_mean": 3602.4, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 3.858858858858859, |
| "grad_norm": 0.5556930711337941, |
| "learning_rate": 1.9932600046807914e-05, |
| "loss": 0.2355, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1911911964416504, |
| "step": 2570, |
| "valid_targets_mean": 3493.8, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 3.8663663663663663, |
| "grad_norm": 0.4918999956248638, |
| "learning_rate": 1.985771214093444e-05, |
| "loss": 0.2162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19995930790901184, |
| "step": 2575, |
| "valid_targets_mean": 4204.2, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 3.873873873873874, |
| "grad_norm": 0.52841578647817, |
| "learning_rate": 1.9782826230062155e-05, |
| "loss": 0.2705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28531813621520996, |
| "step": 2580, |
| "valid_targets_mean": 4070.0, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 3.8813813813813813, |
| "grad_norm": 0.5040983553316225, |
| "learning_rate": 1.9707943364157552e-05, |
| "loss": 0.2039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18574920296669006, |
| "step": 2585, |
| "valid_targets_mean": 3998.8, |
| "valid_targets_min": 416 |
| }, |
| { |
| "epoch": 3.888888888888889, |
| "grad_norm": 0.49554889736984387, |
| "learning_rate": 1.9633064593144408e-05, |
| "loss": 0.217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20392203330993652, |
| "step": 2590, |
| "valid_targets_mean": 4092.8, |
| "valid_targets_min": 638 |
| }, |
| { |
| "epoch": 3.8963963963963963, |
| "grad_norm": 0.4727254866083527, |
| "learning_rate": 1.9558190966889093e-05, |
| "loss": 0.2598, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21000804007053375, |
| "step": 2595, |
| "valid_targets_mean": 5088.9, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 3.903903903903904, |
| "grad_norm": 0.43824564462204646, |
| "learning_rate": 1.9483323535185838e-05, |
| "loss": 0.2129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1834757924079895, |
| "step": 2600, |
| "valid_targets_mean": 4795.2, |
| "valid_targets_min": 852 |
| }, |
| { |
| "epoch": 3.9114114114114114, |
| "grad_norm": 0.4414256886221553, |
| "learning_rate": 1.940846334774203e-05, |
| "loss": 0.2198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1729404479265213, |
| "step": 2605, |
| "valid_targets_mean": 4699.6, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 3.918918918918919, |
| "grad_norm": 0.5060621091961622, |
| "learning_rate": 1.933361145416348e-05, |
| "loss": 0.2215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2322886735200882, |
| "step": 2610, |
| "valid_targets_mean": 6213.0, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 3.9264264264264264, |
| "grad_norm": 0.593672866808795, |
| "learning_rate": 1.9258768903939706e-05, |
| "loss": 0.2432, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24251478910446167, |
| "step": 2615, |
| "valid_targets_mean": 3359.5, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 3.933933933933934, |
| "grad_norm": 0.4404905443315122, |
| "learning_rate": 1.9183936746429234e-05, |
| "loss": 0.2666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2132512629032135, |
| "step": 2620, |
| "valid_targets_mean": 5353.2, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 3.9414414414414414, |
| "grad_norm": 0.5116438369388818, |
| "learning_rate": 1.9109116030844874e-05, |
| "loss": 0.2318, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27721619606018066, |
| "step": 2625, |
| "valid_targets_mean": 4330.2, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 3.948948948948949, |
| "grad_norm": 0.5905044794050749, |
| "learning_rate": 1.9034307806239004e-05, |
| "loss": 0.2603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33162492513656616, |
| "step": 2630, |
| "valid_targets_mean": 4979.0, |
| "valid_targets_min": 434 |
| }, |
| { |
| "epoch": 3.9564564564564564, |
| "grad_norm": 0.5353633419703424, |
| "learning_rate": 1.8959513121488868e-05, |
| "loss": 0.2544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23549598455429077, |
| "step": 2635, |
| "valid_targets_mean": 4418.6, |
| "valid_targets_min": 858 |
| }, |
| { |
| "epoch": 3.963963963963964, |
| "grad_norm": 0.47963900371966894, |
| "learning_rate": 1.8884733025281876e-05, |
| "loss": 0.244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1948413848876953, |
| "step": 2640, |
| "valid_targets_mean": 4141.8, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 3.9714714714714714, |
| "grad_norm": 0.44606918683200836, |
| "learning_rate": 1.880996856610088e-05, |
| "loss": 0.2417, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21382328867912292, |
| "step": 2645, |
| "valid_targets_mean": 5472.8, |
| "valid_targets_min": 745 |
| }, |
| { |
| "epoch": 3.978978978978979, |
| "grad_norm": 0.5149587332986721, |
| "learning_rate": 1.8735220792209513e-05, |
| "loss": 0.228, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19594892859458923, |
| "step": 2650, |
| "valid_targets_mean": 4153.9, |
| "valid_targets_min": 598 |
| }, |
| { |
| "epoch": 3.9864864864864864, |
| "grad_norm": 0.5874287195534135, |
| "learning_rate": 1.8660490751637435e-05, |
| "loss": 0.2352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22586959600448608, |
| "step": 2655, |
| "valid_targets_mean": 3378.9, |
| "valid_targets_min": 506 |
| }, |
| { |
| "epoch": 3.993993993993994, |
| "grad_norm": 0.46189741004980345, |
| "learning_rate": 1.858577949216569e-05, |
| "loss": 0.2134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2193407416343689, |
| "step": 2660, |
| "valid_targets_mean": 4348.1, |
| "valid_targets_min": 447 |
| }, |
| { |
| "epoch": 4.001501501501502, |
| "grad_norm": 0.5233378328639746, |
| "learning_rate": 1.8511088061311982e-05, |
| "loss": 0.2246, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2248275727033615, |
| "step": 2665, |
| "valid_targets_mean": 3952.7, |
| "valid_targets_min": 671 |
| }, |
| { |
| "epoch": 4.009009009009009, |
| "grad_norm": 0.6071971400069938, |
| "learning_rate": 1.8436417506316013e-05, |
| "loss": 0.2354, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23917962610721588, |
| "step": 2670, |
| "valid_targets_mean": 3420.5, |
| "valid_targets_min": 429 |
| }, |
| { |
| "epoch": 4.016516516516517, |
| "grad_norm": 0.5914162200350297, |
| "learning_rate": 1.8361768874124778e-05, |
| "loss": 0.2518, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2445971816778183, |
| "step": 2675, |
| "valid_targets_mean": 4843.9, |
| "valid_targets_min": 471 |
| }, |
| { |
| "epoch": 4.024024024024024, |
| "grad_norm": 0.547907620188072, |
| "learning_rate": 1.8287143211377893e-05, |
| "loss": 0.2157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1973641812801361, |
| "step": 2680, |
| "valid_targets_mean": 4041.2, |
| "valid_targets_min": 418 |
| }, |
| { |
| "epoch": 4.031531531531532, |
| "grad_norm": 0.5133198173072647, |
| "learning_rate": 1.8212541564392924e-05, |
| "loss": 0.2281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17949888110160828, |
| "step": 2685, |
| "valid_targets_mean": 3785.6, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 4.039039039039039, |
| "grad_norm": 0.47846466241843566, |
| "learning_rate": 1.813796497915073e-05, |
| "loss": 0.2478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2564462423324585, |
| "step": 2690, |
| "valid_targets_mean": 5844.4, |
| "valid_targets_min": 506 |
| }, |
| { |
| "epoch": 4.046546546546547, |
| "grad_norm": 0.569435583148903, |
| "learning_rate": 1.806341450128076e-05, |
| "loss": 0.2314, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22870904207229614, |
| "step": 2695, |
| "valid_targets_mean": 4163.9, |
| "valid_targets_min": 699 |
| }, |
| { |
| "epoch": 4.054054054054054, |
| "grad_norm": 0.5070243213845931, |
| "learning_rate": 1.798889117604643e-05, |
| "loss": 0.2164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23002973198890686, |
| "step": 2700, |
| "valid_targets_mean": 4445.3, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 4.061561561561562, |
| "grad_norm": 0.4867044644660382, |
| "learning_rate": 1.7914396048330428e-05, |
| "loss": 0.1903, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19053609669208527, |
| "step": 2705, |
| "valid_targets_mean": 4508.4, |
| "valid_targets_min": 569 |
| }, |
| { |
| "epoch": 4.069069069069069, |
| "grad_norm": 0.5805381784749756, |
| "learning_rate": 1.7839930162620128e-05, |
| "loss": 0.2136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1698979139328003, |
| "step": 2710, |
| "valid_targets_mean": 3140.1, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 4.076576576576577, |
| "grad_norm": 0.602504277734938, |
| "learning_rate": 1.7765494562992878e-05, |
| "loss": 0.2122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18390074372291565, |
| "step": 2715, |
| "valid_targets_mean": 3297.9, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 4.084084084084084, |
| "grad_norm": 0.6470125645401709, |
| "learning_rate": 1.7691090293101386e-05, |
| "loss": 0.2572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28710392117500305, |
| "step": 2720, |
| "valid_targets_mean": 3918.4, |
| "valid_targets_min": 437 |
| }, |
| { |
| "epoch": 4.091591591591592, |
| "grad_norm": 0.5066063002958375, |
| "learning_rate": 1.76167183961591e-05, |
| "loss": 0.2266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2291889488697052, |
| "step": 2725, |
| "valid_targets_mean": 5055.3, |
| "valid_targets_min": 388 |
| }, |
| { |
| "epoch": 4.099099099099099, |
| "grad_norm": 0.6455258191217119, |
| "learning_rate": 1.7542379914925575e-05, |
| "loss": 0.2079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23442783951759338, |
| "step": 2730, |
| "valid_targets_mean": 2962.8, |
| "valid_targets_min": 666 |
| }, |
| { |
| "epoch": 4.106606606606607, |
| "grad_norm": 0.7386040382747444, |
| "learning_rate": 1.7468075891691832e-05, |
| "loss": 0.2052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21252450346946716, |
| "step": 2735, |
| "valid_targets_mean": 3100.8, |
| "valid_targets_min": 518 |
| }, |
| { |
| "epoch": 4.114114114114114, |
| "grad_norm": 0.48445294014230816, |
| "learning_rate": 1.7393807368265777e-05, |
| "loss": 0.208, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22077061235904694, |
| "step": 2740, |
| "valid_targets_mean": 5577.0, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 4.121621621621622, |
| "grad_norm": 0.48865023064949326, |
| "learning_rate": 1.731957538595756e-05, |
| "loss": 0.22, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19657564163208008, |
| "step": 2745, |
| "valid_targets_mean": 4633.6, |
| "valid_targets_min": 542 |
| }, |
| { |
| "epoch": 4.129129129129129, |
| "grad_norm": 0.6690952004993063, |
| "learning_rate": 1.7245380985565014e-05, |
| "loss": 0.2026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18894386291503906, |
| "step": 2750, |
| "valid_targets_mean": 3604.8, |
| "valid_targets_min": 437 |
| }, |
| { |
| "epoch": 4.136636636636637, |
| "grad_norm": 0.7195870104883615, |
| "learning_rate": 1.7171225207359023e-05, |
| "loss": 0.2258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27104708552360535, |
| "step": 2755, |
| "valid_targets_mean": 3011.1, |
| "valid_targets_min": 948 |
| }, |
| { |
| "epoch": 4.1441441441441444, |
| "grad_norm": 0.5379416037342353, |
| "learning_rate": 1.7097109091068965e-05, |
| "loss": 0.2531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3290520906448364, |
| "step": 2760, |
| "valid_targets_mean": 6327.2, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 4.151651651651652, |
| "grad_norm": 0.4819288545219707, |
| "learning_rate": 1.7023033675868107e-05, |
| "loss": 0.2337, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19341519474983215, |
| "step": 2765, |
| "valid_targets_mean": 5650.7, |
| "valid_targets_min": 1052 |
| }, |
| { |
| "epoch": 4.1591591591591595, |
| "grad_norm": 0.4339406422217775, |
| "learning_rate": 1.694900000035907e-05, |
| "loss": 0.1945, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18829095363616943, |
| "step": 2770, |
| "valid_targets_mean": 5408.4, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 4.166666666666667, |
| "grad_norm": 0.5494279815313058, |
| "learning_rate": 1.687500910255924e-05, |
| "loss": 0.2345, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29033520817756653, |
| "step": 2775, |
| "valid_targets_mean": 4524.4, |
| "valid_targets_min": 660 |
| }, |
| { |
| "epoch": 4.1741741741741745, |
| "grad_norm": 0.4489742319836925, |
| "learning_rate": 1.6801062019886216e-05, |
| "loss": 0.2443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2034509927034378, |
| "step": 2780, |
| "valid_targets_mean": 4920.3, |
| "valid_targets_min": 427 |
| }, |
| { |
| "epoch": 4.181681681681682, |
| "grad_norm": 0.5280057369516138, |
| "learning_rate": 1.6727159789143276e-05, |
| "loss": 0.2251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25000298023223877, |
| "step": 2785, |
| "valid_targets_mean": 6445.3, |
| "valid_targets_min": 460 |
| }, |
| { |
| "epoch": 4.1891891891891895, |
| "grad_norm": 0.570852623942594, |
| "learning_rate": 1.665330344650484e-05, |
| "loss": 0.2091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23752200603485107, |
| "step": 2790, |
| "valid_targets_mean": 4025.2, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 4.196696696696697, |
| "grad_norm": 0.5022860617467421, |
| "learning_rate": 1.6579494027501926e-05, |
| "loss": 0.2702, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25862377882003784, |
| "step": 2795, |
| "valid_targets_mean": 5591.9, |
| "valid_targets_min": 1079 |
| }, |
| { |
| "epoch": 4.2042042042042045, |
| "grad_norm": 0.5808638456409436, |
| "learning_rate": 1.6505732567007644e-05, |
| "loss": 0.2144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2629520297050476, |
| "step": 2800, |
| "valid_targets_mean": 4279.3, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 4.211711711711712, |
| "grad_norm": 0.5011677067782193, |
| "learning_rate": 1.6432020099222686e-05, |
| "loss": 0.2239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17377246916294098, |
| "step": 2805, |
| "valid_targets_mean": 4540.3, |
| "valid_targets_min": 506 |
| }, |
| { |
| "epoch": 4.2192192192192195, |
| "grad_norm": 0.6312221103561748, |
| "learning_rate": 1.635835765766082e-05, |
| "loss": 0.1895, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1711842268705368, |
| "step": 2810, |
| "valid_targets_mean": 4152.6, |
| "valid_targets_min": 576 |
| }, |
| { |
| "epoch": 4.226726726726727, |
| "grad_norm": 0.5455241347866726, |
| "learning_rate": 1.6284746275134413e-05, |
| "loss": 0.2123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2519665062427521, |
| "step": 2815, |
| "valid_targets_mean": 4392.9, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 4.2342342342342345, |
| "grad_norm": 0.544839041978784, |
| "learning_rate": 1.621118698373992e-05, |
| "loss": 0.2643, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22317945957183838, |
| "step": 2820, |
| "valid_targets_mean": 4256.4, |
| "valid_targets_min": 508 |
| }, |
| { |
| "epoch": 4.241741741741742, |
| "grad_norm": 0.5207115855205976, |
| "learning_rate": 1.6137680814843447e-05, |
| "loss": 0.2287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26101672649383545, |
| "step": 2825, |
| "valid_targets_mean": 4533.8, |
| "valid_targets_min": 702 |
| }, |
| { |
| "epoch": 4.2492492492492495, |
| "grad_norm": 0.7554547871541064, |
| "learning_rate": 1.6064228799066272e-05, |
| "loss": 0.2369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2488705813884735, |
| "step": 2830, |
| "valid_targets_mean": 3717.3, |
| "valid_targets_min": 599 |
| }, |
| { |
| "epoch": 4.256756756756757, |
| "grad_norm": 0.5076882374389426, |
| "learning_rate": 1.5990831966270396e-05, |
| "loss": 0.2121, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20610791444778442, |
| "step": 2835, |
| "valid_targets_mean": 5082.6, |
| "valid_targets_min": 660 |
| }, |
| { |
| "epoch": 4.2642642642642645, |
| "grad_norm": 0.563842648058139, |
| "learning_rate": 1.5917491345544113e-05, |
| "loss": 0.2136, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18700063228607178, |
| "step": 2840, |
| "valid_targets_mean": 4268.7, |
| "valid_targets_min": 596 |
| }, |
| { |
| "epoch": 4.271771771771772, |
| "grad_norm": 0.5630065305626606, |
| "learning_rate": 1.584420796518756e-05, |
| "loss": 0.244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2228190302848816, |
| "step": 2845, |
| "valid_targets_mean": 3847.0, |
| "valid_targets_min": 865 |
| }, |
| { |
| "epoch": 4.2792792792792795, |
| "grad_norm": 0.5990679311909958, |
| "learning_rate": 1.5770982852698337e-05, |
| "loss": 0.2485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2809998095035553, |
| "step": 2850, |
| "valid_targets_mean": 3885.7, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 4.286786786786787, |
| "grad_norm": 0.5512552937482088, |
| "learning_rate": 1.5697817034757052e-05, |
| "loss": 0.2027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1838597059249878, |
| "step": 2855, |
| "valid_targets_mean": 3917.1, |
| "valid_targets_min": 550 |
| }, |
| { |
| "epoch": 4.2942942942942945, |
| "grad_norm": 0.560081521292376, |
| "learning_rate": 1.5624711537212967e-05, |
| "loss": 0.2265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20176030695438385, |
| "step": 2860, |
| "valid_targets_mean": 3504.7, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 4.301801801801802, |
| "grad_norm": 0.7258528593213625, |
| "learning_rate": 1.5551667385069593e-05, |
| "loss": 0.2005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22372370958328247, |
| "step": 2865, |
| "valid_targets_mean": 2295.4, |
| "valid_targets_min": 423 |
| }, |
| { |
| "epoch": 4.3093093093093096, |
| "grad_norm": 0.7471444365279868, |
| "learning_rate": 1.5478685602470324e-05, |
| "loss": 0.2511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24615955352783203, |
| "step": 2870, |
| "valid_targets_mean": 3811.6, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 4.316816816816817, |
| "grad_norm": 0.6829203066694415, |
| "learning_rate": 1.5405767212684078e-05, |
| "loss": 0.2372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21476216614246368, |
| "step": 2875, |
| "valid_targets_mean": 3288.6, |
| "valid_targets_min": 535 |
| }, |
| { |
| "epoch": 4.324324324324325, |
| "grad_norm": 0.5733535380374483, |
| "learning_rate": 1.5332913238090962e-05, |
| "loss": 0.2276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2381066530942917, |
| "step": 2880, |
| "valid_targets_mean": 3251.5, |
| "valid_targets_min": 697 |
| }, |
| { |
| "epoch": 4.331831831831832, |
| "grad_norm": 0.6499639228286483, |
| "learning_rate": 1.52601247001679e-05, |
| "loss": 0.2267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23366223275661469, |
| "step": 2885, |
| "valid_targets_mean": 2987.1, |
| "valid_targets_min": 539 |
| }, |
| { |
| "epoch": 4.33933933933934, |
| "grad_norm": 0.6285744664120035, |
| "learning_rate": 1.5187402619474361e-05, |
| "loss": 0.2083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.195681631565094, |
| "step": 2890, |
| "valid_targets_mean": 4077.1, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 4.346846846846847, |
| "grad_norm": 0.6210882117570284, |
| "learning_rate": 1.5114748015638013e-05, |
| "loss": 0.2127, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21708352863788605, |
| "step": 2895, |
| "valid_targets_mean": 4107.8, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 4.354354354354355, |
| "grad_norm": 0.5855096649034774, |
| "learning_rate": 1.5042161907340438e-05, |
| "loss": 0.2292, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25563323497772217, |
| "step": 2900, |
| "valid_targets_mean": 3565.5, |
| "valid_targets_min": 562 |
| }, |
| { |
| "epoch": 4.361861861861862, |
| "grad_norm": 0.5300025815920703, |
| "learning_rate": 1.4969645312302851e-05, |
| "loss": 0.2197, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22752434015274048, |
| "step": 2905, |
| "valid_targets_mean": 4113.8, |
| "valid_targets_min": 381 |
| }, |
| { |
| "epoch": 4.36936936936937, |
| "grad_norm": 0.5804189010231626, |
| "learning_rate": 1.4897199247271842e-05, |
| "loss": 0.2025, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1874658167362213, |
| "step": 2910, |
| "valid_targets_mean": 3798.9, |
| "valid_targets_min": 452 |
| }, |
| { |
| "epoch": 4.376876876876877, |
| "grad_norm": 0.48760141515061334, |
| "learning_rate": 1.4824824728005092e-05, |
| "loss": 0.2434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.257068395614624, |
| "step": 2915, |
| "valid_targets_mean": 5025.7, |
| "valid_targets_min": 584 |
| }, |
| { |
| "epoch": 4.384384384384385, |
| "grad_norm": 0.658477050968013, |
| "learning_rate": 1.4752522769257152e-05, |
| "loss": 0.2147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22656235098838806, |
| "step": 2920, |
| "valid_targets_mean": 3549.4, |
| "valid_targets_min": 624 |
| }, |
| { |
| "epoch": 4.391891891891892, |
| "grad_norm": 0.7492347794498558, |
| "learning_rate": 1.468029438476521e-05, |
| "loss": 0.2305, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22716817259788513, |
| "step": 2925, |
| "valid_targets_mean": 2520.4, |
| "valid_targets_min": 536 |
| }, |
| { |
| "epoch": 4.3993993993994, |
| "grad_norm": 0.5532580940259121, |
| "learning_rate": 1.4608140587234887e-05, |
| "loss": 0.2064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20708701014518738, |
| "step": 2930, |
| "valid_targets_mean": 3850.1, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 4.406906906906907, |
| "grad_norm": 0.4546505507730152, |
| "learning_rate": 1.453606238832602e-05, |
| "loss": 0.2218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21117320656776428, |
| "step": 2935, |
| "valid_targets_mean": 6005.3, |
| "valid_targets_min": 813 |
| }, |
| { |
| "epoch": 4.414414414414415, |
| "grad_norm": 0.7252302746614107, |
| "learning_rate": 1.4464060798638484e-05, |
| "loss": 0.2291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18549787998199463, |
| "step": 2940, |
| "valid_targets_mean": 3605.3, |
| "valid_targets_min": 847 |
| }, |
| { |
| "epoch": 4.421921921921922, |
| "grad_norm": 0.43525814011469965, |
| "learning_rate": 1.4392136827698032e-05, |
| "loss": 0.1929, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16544996201992035, |
| "step": 2945, |
| "valid_targets_mean": 5133.1, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 4.42942942942943, |
| "grad_norm": 0.6290052391762472, |
| "learning_rate": 1.4320291483942135e-05, |
| "loss": 0.2245, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21728135645389557, |
| "step": 2950, |
| "valid_targets_mean": 3071.6, |
| "valid_targets_min": 601 |
| }, |
| { |
| "epoch": 4.436936936936937, |
| "grad_norm": 0.568290272425125, |
| "learning_rate": 1.424852577470584e-05, |
| "loss": 0.2298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18296922743320465, |
| "step": 2955, |
| "valid_targets_mean": 5362.2, |
| "valid_targets_min": 803 |
| }, |
| { |
| "epoch": 4.444444444444445, |
| "grad_norm": 0.603259783928807, |
| "learning_rate": 1.417684070620764e-05, |
| "loss": 0.2261, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23192979395389557, |
| "step": 2960, |
| "valid_targets_mean": 3260.2, |
| "valid_targets_min": 713 |
| }, |
| { |
| "epoch": 4.451951951951952, |
| "grad_norm": 0.5712898946994219, |
| "learning_rate": 1.4105237283535376e-05, |
| "loss": 0.207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2266012728214264, |
| "step": 2965, |
| "valid_targets_mean": 4215.6, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 4.45945945945946, |
| "grad_norm": 0.6445579585402789, |
| "learning_rate": 1.403371651063216e-05, |
| "loss": 0.2363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24278521537780762, |
| "step": 2970, |
| "valid_targets_mean": 3313.9, |
| "valid_targets_min": 374 |
| }, |
| { |
| "epoch": 4.466966966966967, |
| "grad_norm": 0.5733027694106058, |
| "learning_rate": 1.3962279390282261e-05, |
| "loss": 0.243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2066403329372406, |
| "step": 2975, |
| "valid_targets_mean": 4162.3, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 4.474474474474475, |
| "grad_norm": 0.613924525173538, |
| "learning_rate": 1.3890926924097071e-05, |
| "loss": 0.1938, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20435193181037903, |
| "step": 2980, |
| "valid_targets_mean": 3513.4, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 4.481981981981982, |
| "grad_norm": 0.5403888711125328, |
| "learning_rate": 1.3819660112501054e-05, |
| "loss": 0.2242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20203976333141327, |
| "step": 2985, |
| "valid_targets_mean": 4108.9, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 4.48948948948949, |
| "grad_norm": 0.5594472556122174, |
| "learning_rate": 1.3748479954717735e-05, |
| "loss": 0.2462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20039498805999756, |
| "step": 2990, |
| "valid_targets_mean": 3769.4, |
| "valid_targets_min": 504 |
| }, |
| { |
| "epoch": 4.496996996996997, |
| "grad_norm": 0.5426786497323537, |
| "learning_rate": 1.3677387448755657e-05, |
| "loss": 0.2068, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21668657660484314, |
| "step": 2995, |
| "valid_targets_mean": 3945.2, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 4.504504504504505, |
| "grad_norm": 0.4470248026304529, |
| "learning_rate": 1.360638359139442e-05, |
| "loss": 0.2203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2280035763978958, |
| "step": 3000, |
| "valid_targets_mean": 5678.4, |
| "valid_targets_min": 1551 |
| }, |
| { |
| "epoch": 4.512012012012012, |
| "grad_norm": 0.609794314414809, |
| "learning_rate": 1.3535469378170683e-05, |
| "loss": 0.239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2744963467121124, |
| "step": 3005, |
| "valid_targets_mean": 3750.4, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 4.51951951951952, |
| "grad_norm": 0.4627448347366898, |
| "learning_rate": 1.3464645803364228e-05, |
| "loss": 0.2439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21215581893920898, |
| "step": 3010, |
| "valid_targets_mean": 5590.1, |
| "valid_targets_min": 528 |
| }, |
| { |
| "epoch": 4.527027027027027, |
| "grad_norm": 0.6035357299819745, |
| "learning_rate": 1.3393913859983996e-05, |
| "loss": 0.2138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2198573499917984, |
| "step": 3015, |
| "valid_targets_mean": 6302.9, |
| "valid_targets_min": 789 |
| }, |
| { |
| "epoch": 4.534534534534535, |
| "grad_norm": 0.5643676209847303, |
| "learning_rate": 1.3323274539754177e-05, |
| "loss": 0.2198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25696855783462524, |
| "step": 3020, |
| "valid_targets_mean": 4303.8, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 4.542042042042042, |
| "grad_norm": 0.570048922978165, |
| "learning_rate": 1.3252728833100296e-05, |
| "loss": 0.2203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19746547937393188, |
| "step": 3025, |
| "valid_targets_mean": 3560.8, |
| "valid_targets_min": 598 |
| }, |
| { |
| "epoch": 4.54954954954955, |
| "grad_norm": 0.4464417263684137, |
| "learning_rate": 1.3182277729135358e-05, |
| "loss": 0.2287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19879616796970367, |
| "step": 3030, |
| "valid_targets_mean": 7131.6, |
| "valid_targets_min": 460 |
| }, |
| { |
| "epoch": 4.557057057057057, |
| "grad_norm": 0.5089601591681008, |
| "learning_rate": 1.3111922215645922e-05, |
| "loss": 0.2126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23360319435596466, |
| "step": 3035, |
| "valid_targets_mean": 4634.0, |
| "valid_targets_min": 654 |
| }, |
| { |
| "epoch": 4.564564564564565, |
| "grad_norm": 0.6823720809640251, |
| "learning_rate": 1.3041663279078311e-05, |
| "loss": 0.2104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2097683995962143, |
| "step": 3040, |
| "valid_targets_mean": 2433.6, |
| "valid_targets_min": 562 |
| }, |
| { |
| "epoch": 4.572072072072072, |
| "grad_norm": 0.6700606322768459, |
| "learning_rate": 1.297150190452473e-05, |
| "loss": 0.2051, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2061670869588852, |
| "step": 3045, |
| "valid_targets_mean": 2720.6, |
| "valid_targets_min": 529 |
| }, |
| { |
| "epoch": 4.57957957957958, |
| "grad_norm": 0.6228866174244457, |
| "learning_rate": 1.2901439075709506e-05, |
| "loss": 0.2165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18749915063381195, |
| "step": 3050, |
| "valid_targets_mean": 3271.4, |
| "valid_targets_min": 416 |
| }, |
| { |
| "epoch": 4.587087087087087, |
| "grad_norm": 0.600075319444778, |
| "learning_rate": 1.2831475774975247e-05, |
| "loss": 0.2088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24314680695533752, |
| "step": 3055, |
| "valid_targets_mean": 4222.2, |
| "valid_targets_min": 520 |
| }, |
| { |
| "epoch": 4.594594594594595, |
| "grad_norm": 0.4219894648635082, |
| "learning_rate": 1.2761612983269094e-05, |
| "loss": 0.2195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18051698803901672, |
| "step": 3060, |
| "valid_targets_mean": 6413.9, |
| "valid_targets_min": 703 |
| }, |
| { |
| "epoch": 4.602102102102102, |
| "grad_norm": 0.5430062852225149, |
| "learning_rate": 1.2691851680128966e-05, |
| "loss": 0.2119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18320244550704956, |
| "step": 3065, |
| "valid_targets_mean": 3880.8, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 4.60960960960961, |
| "grad_norm": 0.4910324433811435, |
| "learning_rate": 1.2622192843669826e-05, |
| "loss": 0.2111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1959684193134308, |
| "step": 3070, |
| "valid_targets_mean": 5296.5, |
| "valid_targets_min": 512 |
| }, |
| { |
| "epoch": 4.617117117117117, |
| "grad_norm": 0.5134831494706088, |
| "learning_rate": 1.255263745056996e-05, |
| "loss": 0.2051, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21355494856834412, |
| "step": 3075, |
| "valid_targets_mean": 5030.8, |
| "valid_targets_min": 469 |
| }, |
| { |
| "epoch": 4.624624624624625, |
| "grad_norm": 0.5527873198315599, |
| "learning_rate": 1.2483186476057281e-05, |
| "loss": 0.2181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1989469826221466, |
| "step": 3080, |
| "valid_targets_mean": 3602.9, |
| "valid_targets_min": 630 |
| }, |
| { |
| "epoch": 4.632132132132132, |
| "grad_norm": 0.7003658441849595, |
| "learning_rate": 1.2413840893895668e-05, |
| "loss": 0.1931, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20069898664951324, |
| "step": 3085, |
| "valid_targets_mean": 3747.1, |
| "valid_targets_min": 474 |
| }, |
| { |
| "epoch": 4.63963963963964, |
| "grad_norm": 0.5774616260959406, |
| "learning_rate": 1.2344601676371312e-05, |
| "loss": 0.2107, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2032512128353119, |
| "step": 3090, |
| "valid_targets_mean": 5143.7, |
| "valid_targets_min": 1085 |
| }, |
| { |
| "epoch": 4.647147147147147, |
| "grad_norm": 0.609625942880746, |
| "learning_rate": 1.2275469794279068e-05, |
| "loss": 0.2376, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24463210999965668, |
| "step": 3095, |
| "valid_targets_mean": 3302.1, |
| "valid_targets_min": 211 |
| }, |
| { |
| "epoch": 4.654654654654655, |
| "grad_norm": 0.5539889957775487, |
| "learning_rate": 1.220644621690885e-05, |
| "loss": 0.2184, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19467709958553314, |
| "step": 3100, |
| "valid_targets_mean": 3723.1, |
| "valid_targets_min": 637 |
| }, |
| { |
| "epoch": 4.662162162162162, |
| "grad_norm": 0.5324494392088087, |
| "learning_rate": 1.2137531912032058e-05, |
| "loss": 0.2179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2482069581747055, |
| "step": 3105, |
| "valid_targets_mean": 4753.6, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 4.66966966966967, |
| "grad_norm": 0.5048180559075982, |
| "learning_rate": 1.2068727845887995e-05, |
| "loss": 0.2118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24020060896873474, |
| "step": 3110, |
| "valid_targets_mean": 5051.0, |
| "valid_targets_min": 462 |
| }, |
| { |
| "epoch": 4.677177177177177, |
| "grad_norm": 0.4832724873118443, |
| "learning_rate": 1.2000034983170305e-05, |
| "loss": 0.2357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22151488065719604, |
| "step": 3115, |
| "valid_targets_mean": 5193.5, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 4.684684684684685, |
| "grad_norm": 0.5679523589750985, |
| "learning_rate": 1.193145428701347e-05, |
| "loss": 0.1978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2017378807067871, |
| "step": 3120, |
| "valid_targets_mean": 4752.9, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 4.692192192192192, |
| "grad_norm": 0.8966754020165514, |
| "learning_rate": 1.18629867189793e-05, |
| "loss": 0.2302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24184086918830872, |
| "step": 3125, |
| "valid_targets_mean": 2982.5, |
| "valid_targets_min": 515 |
| }, |
| { |
| "epoch": 4.6996996996997, |
| "grad_norm": 0.49411819508382815, |
| "learning_rate": 1.1794633239043449e-05, |
| "loss": 0.2028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2202903926372528, |
| "step": 3130, |
| "valid_targets_mean": 4615.9, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 4.707207207207207, |
| "grad_norm": 0.4928998645668594, |
| "learning_rate": 1.1726394805581957e-05, |
| "loss": 0.2398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21853674948215485, |
| "step": 3135, |
| "valid_targets_mean": 5042.8, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 4.714714714714715, |
| "grad_norm": 0.5803190883509034, |
| "learning_rate": 1.1658272375357797e-05, |
| "loss": 0.2426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24375799298286438, |
| "step": 3140, |
| "valid_targets_mean": 4044.2, |
| "valid_targets_min": 525 |
| }, |
| { |
| "epoch": 4.722222222222222, |
| "grad_norm": 0.5795814998007034, |
| "learning_rate": 1.1590266903507499e-05, |
| "loss": 0.2371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2230663299560547, |
| "step": 3145, |
| "valid_targets_mean": 4489.6, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 4.72972972972973, |
| "grad_norm": 0.6742257430638947, |
| "learning_rate": 1.1522379343527708e-05, |
| "loss": 0.2535, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23786276578903198, |
| "step": 3150, |
| "valid_targets_mean": 4348.9, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 4.737237237237237, |
| "grad_norm": 0.49627665219198364, |
| "learning_rate": 1.1454610647261859e-05, |
| "loss": 0.2174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2170691192150116, |
| "step": 3155, |
| "valid_targets_mean": 4579.3, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 4.744744744744745, |
| "grad_norm": 0.4965773011218609, |
| "learning_rate": 1.1386961764886806e-05, |
| "loss": 0.2299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21680960059165955, |
| "step": 3160, |
| "valid_targets_mean": 4751.6, |
| "valid_targets_min": 970 |
| }, |
| { |
| "epoch": 4.752252252252252, |
| "grad_norm": 0.46564876478736006, |
| "learning_rate": 1.1319433644899496e-05, |
| "loss": 0.2346, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20024517178535461, |
| "step": 3165, |
| "valid_targets_mean": 5608.7, |
| "valid_targets_min": 565 |
| }, |
| { |
| "epoch": 4.75975975975976, |
| "grad_norm": 0.8219903727111237, |
| "learning_rate": 1.1252027234103709e-05, |
| "loss": 0.2175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21334412693977356, |
| "step": 3170, |
| "valid_targets_mean": 3558.3, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 4.767267267267267, |
| "grad_norm": 0.5331331638771257, |
| "learning_rate": 1.118474347759673e-05, |
| "loss": 0.2032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23813585937023163, |
| "step": 3175, |
| "valid_targets_mean": 4562.6, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 4.774774774774775, |
| "grad_norm": 0.7204879070632291, |
| "learning_rate": 1.1117583318756128e-05, |
| "loss": 0.2218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21081534028053284, |
| "step": 3180, |
| "valid_targets_mean": 4559.9, |
| "valid_targets_min": 347 |
| }, |
| { |
| "epoch": 4.782282282282282, |
| "grad_norm": 0.6342862982793008, |
| "learning_rate": 1.1050547699226522e-05, |
| "loss": 0.2234, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21464157104492188, |
| "step": 3185, |
| "valid_targets_mean": 4187.8, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 4.78978978978979, |
| "grad_norm": 0.5094911353991051, |
| "learning_rate": 1.09836375589064e-05, |
| "loss": 0.2126, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21020804345607758, |
| "step": 3190, |
| "valid_targets_mean": 5157.7, |
| "valid_targets_min": 1150 |
| }, |
| { |
| "epoch": 4.797297297297297, |
| "grad_norm": 0.47526721126268623, |
| "learning_rate": 1.0916853835934891e-05, |
| "loss": 0.2157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22524023056030273, |
| "step": 3195, |
| "valid_targets_mean": 5497.2, |
| "valid_targets_min": 714 |
| }, |
| { |
| "epoch": 4.804804804804805, |
| "grad_norm": 0.7451217907444951, |
| "learning_rate": 1.0850197466678662e-05, |
| "loss": 0.232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20764270424842834, |
| "step": 3200, |
| "valid_targets_mean": 4149.2, |
| "valid_targets_min": 628 |
| }, |
| { |
| "epoch": 4.812312312312312, |
| "grad_norm": 0.4957698184650846, |
| "learning_rate": 1.0783669385718762e-05, |
| "loss": 0.2371, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21627801656723022, |
| "step": 3205, |
| "valid_targets_mean": 5803.0, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 4.81981981981982, |
| "grad_norm": 0.5309967929446427, |
| "learning_rate": 1.0717270525837523e-05, |
| "loss": 0.2449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2549176514148712, |
| "step": 3210, |
| "valid_targets_mean": 5175.2, |
| "valid_targets_min": 558 |
| }, |
| { |
| "epoch": 4.827327327327327, |
| "grad_norm": 0.6675846311975975, |
| "learning_rate": 1.0651001818005487e-05, |
| "loss": 0.2157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2339574694633484, |
| "step": 3215, |
| "valid_targets_mean": 3242.3, |
| "valid_targets_min": 499 |
| }, |
| { |
| "epoch": 4.834834834834835, |
| "grad_norm": 0.5348472304451167, |
| "learning_rate": 1.0584864191368345e-05, |
| "loss": 0.2287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2503393888473511, |
| "step": 3220, |
| "valid_targets_mean": 5664.9, |
| "valid_targets_min": 487 |
| }, |
| { |
| "epoch": 4.842342342342342, |
| "grad_norm": 0.5338144959827715, |
| "learning_rate": 1.0518858573233911e-05, |
| "loss": 0.2171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21501460671424866, |
| "step": 3225, |
| "valid_targets_mean": 4275.4, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 4.84984984984985, |
| "grad_norm": 0.583867201837148, |
| "learning_rate": 1.0452985889059151e-05, |
| "loss": 0.2321, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2584874629974365, |
| "step": 3230, |
| "valid_targets_mean": 3758.3, |
| "valid_targets_min": 367 |
| }, |
| { |
| "epoch": 4.857357357357357, |
| "grad_norm": 0.4704381431905369, |
| "learning_rate": 1.0387247062437144e-05, |
| "loss": 0.2159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2556239068508148, |
| "step": 3235, |
| "valid_targets_mean": 5887.3, |
| "valid_targets_min": 489 |
| }, |
| { |
| "epoch": 4.864864864864865, |
| "grad_norm": 0.6249528070324213, |
| "learning_rate": 1.0321643015084187e-05, |
| "loss": 0.2111, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23891428112983704, |
| "step": 3240, |
| "valid_targets_mean": 3309.9, |
| "valid_targets_min": 301 |
| }, |
| { |
| "epoch": 4.872372372372372, |
| "grad_norm": 0.44764920429718186, |
| "learning_rate": 1.0256174666826841e-05, |
| "loss": 0.213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19511452317237854, |
| "step": 3245, |
| "valid_targets_mean": 5169.8, |
| "valid_targets_min": 980 |
| }, |
| { |
| "epoch": 4.87987987987988, |
| "grad_norm": 0.5340956174536189, |
| "learning_rate": 1.0190842935589065e-05, |
| "loss": 0.206, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18626420199871063, |
| "step": 3250, |
| "valid_targets_mean": 3967.4, |
| "valid_targets_min": 798 |
| }, |
| { |
| "epoch": 4.887387387387387, |
| "grad_norm": 0.56288269038886, |
| "learning_rate": 1.0125648737379307e-05, |
| "loss": 0.2185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20922933518886566, |
| "step": 3255, |
| "valid_targets_mean": 4145.1, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 4.894894894894895, |
| "grad_norm": 0.4659624202841574, |
| "learning_rate": 1.0060592986277693e-05, |
| "loss": 0.2216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18871676921844482, |
| "step": 3260, |
| "valid_targets_mean": 5421.9, |
| "valid_targets_min": 2150 |
| }, |
| { |
| "epoch": 4.902402402402402, |
| "grad_norm": 0.5691277577002785, |
| "learning_rate": 9.995676594423186e-06, |
| "loss": 0.2241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22213050723075867, |
| "step": 3265, |
| "valid_targets_mean": 4555.8, |
| "valid_targets_min": 839 |
| }, |
| { |
| "epoch": 4.90990990990991, |
| "grad_norm": 0.6445683801786387, |
| "learning_rate": 9.930900472000834e-06, |
| "loss": 0.1918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20591846108436584, |
| "step": 3270, |
| "valid_targets_mean": 3039.4, |
| "valid_targets_min": 574 |
| }, |
| { |
| "epoch": 4.9174174174174174, |
| "grad_norm": 0.48632405588473493, |
| "learning_rate": 9.866265527228961e-06, |
| "loss": 0.2047, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.224864199757576, |
| "step": 3275, |
| "valid_targets_mean": 5041.8, |
| "valid_targets_min": 562 |
| }, |
| { |
| "epoch": 4.924924924924925, |
| "grad_norm": 0.4551299572592259, |
| "learning_rate": 9.801772666346462e-06, |
| "loss": 0.2383, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17636257410049438, |
| "step": 3280, |
| "valid_targets_mean": 5264.3, |
| "valid_targets_min": 260 |
| }, |
| { |
| "epoch": 4.9324324324324325, |
| "grad_norm": 0.5303503051433811, |
| "learning_rate": 9.737422793600092e-06, |
| "loss": 0.2529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2605491876602173, |
| "step": 3285, |
| "valid_targets_mean": 4923.2, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 4.93993993993994, |
| "grad_norm": 0.5619328215648045, |
| "learning_rate": 9.67321681123179e-06, |
| "loss": 0.2219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21425651013851166, |
| "step": 3290, |
| "valid_targets_mean": 4545.6, |
| "valid_targets_min": 515 |
| }, |
| { |
| "epoch": 4.9474474474474475, |
| "grad_norm": 0.4969814195952852, |
| "learning_rate": 9.609155619466016e-06, |
| "loss": 0.202, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19319353997707367, |
| "step": 3295, |
| "valid_targets_mean": 4383.9, |
| "valid_targets_min": 711 |
| }, |
| { |
| "epoch": 4.954954954954955, |
| "grad_norm": 0.6244151395343142, |
| "learning_rate": 9.545240116497143e-06, |
| "loss": 0.2181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18449707329273224, |
| "step": 3300, |
| "valid_targets_mean": 3211.4, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 4.9624624624624625, |
| "grad_norm": 0.5893223235253725, |
| "learning_rate": 9.481471198476855e-06, |
| "loss": 0.2294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22556568682193756, |
| "step": 3305, |
| "valid_targets_mean": 5031.6, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 4.96996996996997, |
| "grad_norm": 0.4915902916242456, |
| "learning_rate": 9.417849759501603e-06, |
| "loss": 0.2226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2357444167137146, |
| "step": 3310, |
| "valid_targets_mean": 5379.2, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 4.9774774774774775, |
| "grad_norm": 0.5245483991646102, |
| "learning_rate": 9.354376691600034e-06, |
| "loss": 0.2091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18305274844169617, |
| "step": 3315, |
| "valid_targets_mean": 4195.8, |
| "valid_targets_min": 388 |
| }, |
| { |
| "epoch": 4.984984984984985, |
| "grad_norm": 0.49053726456598334, |
| "learning_rate": 9.2910528847205e-06, |
| "loss": 0.2419, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23515072464942932, |
| "step": 3320, |
| "valid_targets_mean": 4802.1, |
| "valid_targets_min": 666 |
| }, |
| { |
| "epoch": 4.9924924924924925, |
| "grad_norm": 0.5458070078892359, |
| "learning_rate": 9.227879226718595e-06, |
| "loss": 0.2204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2729540467262268, |
| "step": 3325, |
| "valid_targets_mean": 4229.2, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.4617612878592164, |
| "learning_rate": 9.164856603344681e-06, |
| "loss": 0.2209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19838783144950867, |
| "step": 3330, |
| "valid_targets_mean": 5383.6, |
| "valid_targets_min": 1005 |
| }, |
| { |
| "epoch": 5.0075075075075075, |
| "grad_norm": 0.5006372512661854, |
| "learning_rate": 9.10198589823149e-06, |
| "loss": 0.2043, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21871143579483032, |
| "step": 3335, |
| "valid_targets_mean": 4899.0, |
| "valid_targets_min": 478 |
| }, |
| { |
| "epoch": 5.015015015015015, |
| "grad_norm": 0.493071836759497, |
| "learning_rate": 9.039267992881724e-06, |
| "loss": 0.1867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15860621631145477, |
| "step": 3340, |
| "valid_targets_mean": 4637.3, |
| "valid_targets_min": 539 |
| }, |
| { |
| "epoch": 5.0225225225225225, |
| "grad_norm": 0.5942000008682329, |
| "learning_rate": 8.97670376665569e-06, |
| "loss": 0.212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21339187026023865, |
| "step": 3345, |
| "valid_targets_mean": 4111.1, |
| "valid_targets_min": 482 |
| }, |
| { |
| "epoch": 5.03003003003003, |
| "grad_norm": 0.5098653931776418, |
| "learning_rate": 8.914294096758995e-06, |
| "loss": 0.2524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21369382739067078, |
| "step": 3350, |
| "valid_targets_mean": 5529.7, |
| "valid_targets_min": 571 |
| }, |
| { |
| "epoch": 5.0375375375375375, |
| "grad_norm": 0.48801798277011926, |
| "learning_rate": 8.852039858230217e-06, |
| "loss": 0.2076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16710881888866425, |
| "step": 3355, |
| "valid_targets_mean": 4623.7, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 5.045045045045045, |
| "grad_norm": 0.5406142033120225, |
| "learning_rate": 8.78994192392865e-06, |
| "loss": 0.1969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18688131868839264, |
| "step": 3360, |
| "valid_targets_mean": 3961.8, |
| "valid_targets_min": 529 |
| }, |
| { |
| "epoch": 5.0525525525525525, |
| "grad_norm": 0.49064863606657333, |
| "learning_rate": 8.728001164522068e-06, |
| "loss": 0.2054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19211602210998535, |
| "step": 3365, |
| "valid_targets_mean": 5132.5, |
| "valid_targets_min": 557 |
| }, |
| { |
| "epoch": 5.06006006006006, |
| "grad_norm": 0.5428647141950651, |
| "learning_rate": 8.666218448474517e-06, |
| "loss": 0.2235, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19043126702308655, |
| "step": 3370, |
| "valid_targets_mean": 4518.9, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 5.0675675675675675, |
| "grad_norm": 0.5285735991494391, |
| "learning_rate": 8.604594642034126e-06, |
| "loss": 0.2093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22566662728786469, |
| "step": 3375, |
| "valid_targets_mean": 4554.3, |
| "valid_targets_min": 628 |
| }, |
| { |
| "epoch": 5.075075075075075, |
| "grad_norm": 0.6397497283612681, |
| "learning_rate": 8.543130609220982e-06, |
| "loss": 0.1913, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17037567496299744, |
| "step": 3380, |
| "valid_targets_mean": 3197.0, |
| "valid_targets_min": 631 |
| }, |
| { |
| "epoch": 5.0825825825825826, |
| "grad_norm": 0.5624772140252701, |
| "learning_rate": 8.481827211814991e-06, |
| "loss": 0.2315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2726784348487854, |
| "step": 3385, |
| "valid_targets_mean": 4160.6, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 5.09009009009009, |
| "grad_norm": 0.5877366129284431, |
| "learning_rate": 8.420685309343835e-06, |
| "loss": 0.2131, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20283541083335876, |
| "step": 3390, |
| "valid_targets_mean": 3707.2, |
| "valid_targets_min": 663 |
| }, |
| { |
| "epoch": 5.097597597597598, |
| "grad_norm": 0.6489090565754443, |
| "learning_rate": 8.35970575907087e-06, |
| "loss": 0.2123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2192349135875702, |
| "step": 3395, |
| "valid_targets_mean": 5407.1, |
| "valid_targets_min": 672 |
| }, |
| { |
| "epoch": 5.105105105105105, |
| "grad_norm": 0.5565202403018633, |
| "learning_rate": 8.298889415983142e-06, |
| "loss": 0.2057, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1590254306793213, |
| "step": 3400, |
| "valid_targets_mean": 3583.3, |
| "valid_targets_min": 735 |
| }, |
| { |
| "epoch": 5.112612612612613, |
| "grad_norm": 0.41960211523789304, |
| "learning_rate": 8.23823713277938e-06, |
| "loss": 0.2056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14446228742599487, |
| "step": 3405, |
| "valid_targets_mean": 5082.1, |
| "valid_targets_min": 276 |
| }, |
| { |
| "epoch": 5.12012012012012, |
| "grad_norm": 0.6517049110770983, |
| "learning_rate": 8.17774975985806e-06, |
| "loss": 0.207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23023463785648346, |
| "step": 3410, |
| "valid_targets_mean": 4596.8, |
| "valid_targets_min": 786 |
| }, |
| { |
| "epoch": 5.127627627627628, |
| "grad_norm": 0.8256063611735115, |
| "learning_rate": 8.117428145305464e-06, |
| "loss": 0.1705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19371360540390015, |
| "step": 3415, |
| "valid_targets_mean": 3733.1, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 5.135135135135135, |
| "grad_norm": 0.47817908036094603, |
| "learning_rate": 8.057273134883794e-06, |
| "loss": 0.2065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20559421181678772, |
| "step": 3420, |
| "valid_targets_mean": 5914.1, |
| "valid_targets_min": 746 |
| }, |
| { |
| "epoch": 5.142642642642643, |
| "grad_norm": 0.6404035798093046, |
| "learning_rate": 7.997285572019316e-06, |
| "loss": 0.2294, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19509994983673096, |
| "step": 3425, |
| "valid_targets_mean": 3609.6, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 5.15015015015015, |
| "grad_norm": 0.7814615076086997, |
| "learning_rate": 7.937466297790542e-06, |
| "loss": 0.2033, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17219263315200806, |
| "step": 3430, |
| "valid_targets_mean": 4124.9, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 5.157657657657658, |
| "grad_norm": 0.5711178140418124, |
| "learning_rate": 7.877816150916422e-06, |
| "loss": 0.2186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20192334055900574, |
| "step": 3435, |
| "valid_targets_mean": 4497.1, |
| "valid_targets_min": 673 |
| }, |
| { |
| "epoch": 5.165165165165165, |
| "grad_norm": 0.6605000045012411, |
| "learning_rate": 7.81833596774459e-06, |
| "loss": 0.1922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21957352757453918, |
| "step": 3440, |
| "valid_targets_mean": 3223.1, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 5.172672672672673, |
| "grad_norm": 1.2228952471867771, |
| "learning_rate": 7.759026582239639e-06, |
| "loss": 0.1919, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2631041407585144, |
| "step": 3445, |
| "valid_targets_mean": 4348.8, |
| "valid_targets_min": 574 |
| }, |
| { |
| "epoch": 5.18018018018018, |
| "grad_norm": 0.858620752436695, |
| "learning_rate": 7.699888825971433e-06, |
| "loss": 0.2026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.162127286195755, |
| "step": 3450, |
| "valid_targets_mean": 6938.4, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 5.187687687687688, |
| "grad_norm": 0.6070759956430632, |
| "learning_rate": 7.640923528103441e-06, |
| "loss": 0.2168, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2934483289718628, |
| "step": 3455, |
| "valid_targets_mean": 4662.9, |
| "valid_targets_min": 739 |
| }, |
| { |
| "epoch": 5.195195195195195, |
| "grad_norm": 0.5186921298999412, |
| "learning_rate": 7.582131515381108e-06, |
| "loss": 0.203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2093011438846588, |
| "step": 3460, |
| "valid_targets_mean": 4782.7, |
| "valid_targets_min": 492 |
| }, |
| { |
| "epoch": 5.202702702702703, |
| "grad_norm": 0.5661778349613429, |
| "learning_rate": 7.5235136121202675e-06, |
| "loss": 0.2171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24795249104499817, |
| "step": 3465, |
| "valid_targets_mean": 4599.2, |
| "valid_targets_min": 324 |
| }, |
| { |
| "epoch": 5.21021021021021, |
| "grad_norm": 0.5360911975296877, |
| "learning_rate": 7.465070640195606e-06, |
| "loss": 0.2068, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26138007640838623, |
| "step": 3470, |
| "valid_targets_mean": 4960.6, |
| "valid_targets_min": 376 |
| }, |
| { |
| "epoch": 5.217717717717718, |
| "grad_norm": 0.5642393094183789, |
| "learning_rate": 7.406803419029094e-06, |
| "loss": 0.2323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24130575358867645, |
| "step": 3475, |
| "valid_targets_mean": 4966.7, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 5.225225225225225, |
| "grad_norm": 0.4550076790955841, |
| "learning_rate": 7.3487127655785295e-06, |
| "loss": 0.2106, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1952485740184784, |
| "step": 3480, |
| "valid_targets_mean": 5512.1, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 5.232732732732733, |
| "grad_norm": 0.6885372734490723, |
| "learning_rate": 7.290799494326077e-06, |
| "loss": 0.2016, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16893789172172546, |
| "step": 3485, |
| "valid_targets_mean": 4656.0, |
| "valid_targets_min": 477 |
| }, |
| { |
| "epoch": 5.24024024024024, |
| "grad_norm": 0.5045869253443142, |
| "learning_rate": 7.233064417266846e-06, |
| "loss": 0.231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16010183095932007, |
| "step": 3490, |
| "valid_targets_mean": 3909.6, |
| "valid_targets_min": 609 |
| }, |
| { |
| "epoch": 5.247747747747748, |
| "grad_norm": 0.6679277663347103, |
| "learning_rate": 7.1755083438975056e-06, |
| "loss": 0.22, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2579156756401062, |
| "step": 3495, |
| "valid_targets_mean": 3035.2, |
| "valid_targets_min": 410 |
| }, |
| { |
| "epoch": 5.255255255255255, |
| "grad_norm": 0.48166787337419537, |
| "learning_rate": 7.118132081204936e-06, |
| "loss": 0.2034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17768923938274384, |
| "step": 3500, |
| "valid_targets_mean": 4611.5, |
| "valid_targets_min": 540 |
| }, |
| { |
| "epoch": 5.262762762762763, |
| "grad_norm": 0.6437356623831512, |
| "learning_rate": 7.060936433654901e-06, |
| "loss": 0.2106, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22873665392398834, |
| "step": 3505, |
| "valid_targets_mean": 4224.2, |
| "valid_targets_min": 1214 |
| }, |
| { |
| "epoch": 5.27027027027027, |
| "grad_norm": 0.5041184297812231, |
| "learning_rate": 7.003922203180813e-06, |
| "loss": 0.1829, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17131251096725464, |
| "step": 3510, |
| "valid_targets_mean": 4996.4, |
| "valid_targets_min": 762 |
| }, |
| { |
| "epoch": 5.277777777777778, |
| "grad_norm": 0.42636959404581054, |
| "learning_rate": 6.947090189172425e-06, |
| "loss": 0.1905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17408744990825653, |
| "step": 3515, |
| "valid_targets_mean": 6548.1, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 5.285285285285285, |
| "grad_norm": 0.7004634661839949, |
| "learning_rate": 6.89044118846467e-06, |
| "loss": 0.1871, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21478641033172607, |
| "step": 3520, |
| "valid_targets_mean": 3402.0, |
| "valid_targets_min": 534 |
| }, |
| { |
| "epoch": 5.292792792792793, |
| "grad_norm": 0.6584020869113968, |
| "learning_rate": 6.833975995326465e-06, |
| "loss": 0.2226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17992106080055237, |
| "step": 3525, |
| "valid_targets_mean": 3046.6, |
| "valid_targets_min": 592 |
| }, |
| { |
| "epoch": 5.3003003003003, |
| "grad_norm": 0.505387458907387, |
| "learning_rate": 6.777695401449591e-06, |
| "loss": 0.1905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20670431852340698, |
| "step": 3530, |
| "valid_targets_mean": 5285.2, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 5.307807807807808, |
| "grad_norm": 0.5767720272580488, |
| "learning_rate": 6.721600195937578e-06, |
| "loss": 0.1898, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18273615837097168, |
| "step": 3535, |
| "valid_targets_mean": 3702.8, |
| "valid_targets_min": 877 |
| }, |
| { |
| "epoch": 5.315315315315315, |
| "grad_norm": 0.5468384364940457, |
| "learning_rate": 6.665691165294654e-06, |
| "loss": 0.2308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2389727234840393, |
| "step": 3540, |
| "valid_targets_mean": 4842.5, |
| "valid_targets_min": 1056 |
| }, |
| { |
| "epoch": 5.322822822822823, |
| "grad_norm": 0.5417666029457835, |
| "learning_rate": 6.609969093414699e-06, |
| "loss": 0.2186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2088838666677475, |
| "step": 3545, |
| "valid_targets_mean": 4254.4, |
| "valid_targets_min": 367 |
| }, |
| { |
| "epoch": 5.33033033033033, |
| "grad_norm": 0.5649058281181645, |
| "learning_rate": 6.55443476157029e-06, |
| "loss": 0.1991, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1812952756881714, |
| "step": 3550, |
| "valid_targets_mean": 4252.7, |
| "valid_targets_min": 673 |
| }, |
| { |
| "epoch": 5.337837837837838, |
| "grad_norm": 0.5452388205148444, |
| "learning_rate": 6.4990889484017e-06, |
| "loss": 0.2067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1796906590461731, |
| "step": 3555, |
| "valid_targets_mean": 3792.6, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 5.345345345345345, |
| "grad_norm": 0.5732225965401323, |
| "learning_rate": 6.443932429906013e-06, |
| "loss": 0.2323, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2930184006690979, |
| "step": 3560, |
| "valid_targets_mean": 4310.6, |
| "valid_targets_min": 541 |
| }, |
| { |
| "epoch": 5.352852852852853, |
| "grad_norm": 0.6028750589087655, |
| "learning_rate": 6.3889659794262334e-06, |
| "loss": 0.2129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21735335886478424, |
| "step": 3565, |
| "valid_targets_mean": 3685.1, |
| "valid_targets_min": 583 |
| }, |
| { |
| "epoch": 5.36036036036036, |
| "grad_norm": 0.602478347893381, |
| "learning_rate": 6.334190367640449e-06, |
| "loss": 0.1793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18190817534923553, |
| "step": 3570, |
| "valid_targets_mean": 4439.8, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 5.367867867867868, |
| "grad_norm": 0.5557346424426345, |
| "learning_rate": 6.279606362551016e-06, |
| "loss": 0.2101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1880781054496765, |
| "step": 3575, |
| "valid_targets_mean": 4198.0, |
| "valid_targets_min": 456 |
| }, |
| { |
| "epoch": 5.375375375375375, |
| "grad_norm": 0.4806991447402713, |
| "learning_rate": 6.225214729473794e-06, |
| "loss": 0.2637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22571183741092682, |
| "step": 3580, |
| "valid_targets_mean": 5347.3, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 5.382882882882883, |
| "grad_norm": 0.6189915178471305, |
| "learning_rate": 6.171016231027418e-06, |
| "loss": 0.2266, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22540658712387085, |
| "step": 3585, |
| "valid_targets_mean": 3396.4, |
| "valid_targets_min": 619 |
| }, |
| { |
| "epoch": 5.39039039039039, |
| "grad_norm": 0.4781145702083429, |
| "learning_rate": 6.117011627122617e-06, |
| "loss": 0.2178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22122199833393097, |
| "step": 3590, |
| "valid_targets_mean": 5498.2, |
| "valid_targets_min": 407 |
| }, |
| { |
| "epoch": 5.397897897897898, |
| "grad_norm": 0.501236643073855, |
| "learning_rate": 6.063201674951535e-06, |
| "loss": 0.2113, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19432801008224487, |
| "step": 3595, |
| "valid_targets_mean": 4399.0, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 5.405405405405405, |
| "grad_norm": 0.5083333895430631, |
| "learning_rate": 6.009587128977128e-06, |
| "loss": 0.1969, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21600385010242462, |
| "step": 3600, |
| "valid_targets_mean": 4527.8, |
| "valid_targets_min": 441 |
| }, |
| { |
| "epoch": 5.412912912912913, |
| "grad_norm": 0.43801311222355105, |
| "learning_rate": 5.956168740922592e-06, |
| "loss": 0.2232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17686530947685242, |
| "step": 3605, |
| "valid_targets_mean": 5968.8, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 5.42042042042042, |
| "grad_norm": 0.5142170347253675, |
| "learning_rate": 5.902947259760805e-06, |
| "loss": 0.2163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16562317311763763, |
| "step": 3610, |
| "valid_targets_mean": 4170.2, |
| "valid_targets_min": 562 |
| }, |
| { |
| "epoch": 5.427927927927928, |
| "grad_norm": 0.57494822664475, |
| "learning_rate": 5.84992343170385e-06, |
| "loss": 0.2344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19728896021842957, |
| "step": 3615, |
| "valid_targets_mean": 3665.9, |
| "valid_targets_min": 602 |
| }, |
| { |
| "epoch": 5.435435435435435, |
| "grad_norm": 0.6682604390565138, |
| "learning_rate": 5.797098000192527e-06, |
| "loss": 0.194, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18809694051742554, |
| "step": 3620, |
| "valid_targets_mean": 5038.7, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 5.442942942942943, |
| "grad_norm": 0.5420242165199347, |
| "learning_rate": 5.744471705885946e-06, |
| "loss": 0.2203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19964119791984558, |
| "step": 3625, |
| "valid_targets_mean": 4113.4, |
| "valid_targets_min": 400 |
| }, |
| { |
| "epoch": 5.45045045045045, |
| "grad_norm": 0.4897694331671357, |
| "learning_rate": 5.692045286651145e-06, |
| "loss": 0.2233, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21164345741271973, |
| "step": 3630, |
| "valid_targets_mean": 5133.8, |
| "valid_targets_min": 842 |
| }, |
| { |
| "epoch": 5.457957957957958, |
| "grad_norm": 0.5130796784439051, |
| "learning_rate": 5.6398194775527305e-06, |
| "loss": 0.2175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1640782356262207, |
| "step": 3635, |
| "valid_targets_mean": 4620.8, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 5.465465465465465, |
| "grad_norm": 0.7096256538606244, |
| "learning_rate": 5.587795010842578e-06, |
| "loss": 0.2188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.229142963886261, |
| "step": 3640, |
| "valid_targets_mean": 3584.5, |
| "valid_targets_min": 291 |
| }, |
| { |
| "epoch": 5.472972972972973, |
| "grad_norm": 0.45320281126185963, |
| "learning_rate": 5.535972615949565e-06, |
| "loss": 0.1955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15912821888923645, |
| "step": 3645, |
| "valid_targets_mean": 6046.6, |
| "valid_targets_min": 565 |
| }, |
| { |
| "epoch": 5.48048048048048, |
| "grad_norm": 0.6580766138686164, |
| "learning_rate": 5.484353019469344e-06, |
| "loss": 0.2385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24230948090553284, |
| "step": 3650, |
| "valid_targets_mean": 3922.4, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 5.487987987987988, |
| "grad_norm": 0.560301246319454, |
| "learning_rate": 5.432936945154159e-06, |
| "loss": 0.2035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18417420983314514, |
| "step": 3655, |
| "valid_targets_mean": 4271.6, |
| "valid_targets_min": 590 |
| }, |
| { |
| "epoch": 5.495495495495495, |
| "grad_norm": 0.6206056063840636, |
| "learning_rate": 5.381725113902689e-06, |
| "loss": 0.1936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17472167313098907, |
| "step": 3660, |
| "valid_targets_mean": 3848.2, |
| "valid_targets_min": 581 |
| }, |
| { |
| "epoch": 5.503003003003003, |
| "grad_norm": 0.4966662168616601, |
| "learning_rate": 5.330718243749942e-06, |
| "loss": 0.1978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.191782146692276, |
| "step": 3665, |
| "valid_targets_mean": 4883.6, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 5.51051051051051, |
| "grad_norm": 0.5471645413638431, |
| "learning_rate": 5.279917049857209e-06, |
| "loss": 0.1937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17728394269943237, |
| "step": 3670, |
| "valid_targets_mean": 3883.9, |
| "valid_targets_min": 531 |
| }, |
| { |
| "epoch": 5.518018018018018, |
| "grad_norm": 0.49020284035840306, |
| "learning_rate": 5.229322244501996e-06, |
| "loss": 0.1986, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2151007056236267, |
| "step": 3675, |
| "valid_targets_mean": 5625.6, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 5.525525525525525, |
| "grad_norm": 0.502623769306998, |
| "learning_rate": 5.1789345370680726e-06, |
| "loss": 0.2007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18778328597545624, |
| "step": 3680, |
| "valid_targets_mean": 5465.0, |
| "valid_targets_min": 604 |
| }, |
| { |
| "epoch": 5.533033033033033, |
| "grad_norm": 0.6082538279267172, |
| "learning_rate": 5.128754634035509e-06, |
| "loss": 0.2006, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2307537943124771, |
| "step": 3685, |
| "valid_targets_mean": 3897.9, |
| "valid_targets_min": 475 |
| }, |
| { |
| "epoch": 5.54054054054054, |
| "grad_norm": 0.4677087975060976, |
| "learning_rate": 5.078783238970775e-06, |
| "loss": 0.1746, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1452668309211731, |
| "step": 3690, |
| "valid_targets_mean": 4697.0, |
| "valid_targets_min": 820 |
| }, |
| { |
| "epoch": 5.548048048048048, |
| "grad_norm": 0.5258809236597033, |
| "learning_rate": 5.029021052516874e-06, |
| "loss": 0.2364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1686006635427475, |
| "step": 3695, |
| "valid_targets_mean": 5070.6, |
| "valid_targets_min": 874 |
| }, |
| { |
| "epoch": 5.555555555555555, |
| "grad_norm": 0.5418543854859791, |
| "learning_rate": 4.979468772383525e-06, |
| "loss": 0.2528, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23895879089832306, |
| "step": 3700, |
| "valid_targets_mean": 4703.9, |
| "valid_targets_min": 799 |
| }, |
| { |
| "epoch": 5.563063063063063, |
| "grad_norm": 0.5580957987554833, |
| "learning_rate": 4.93012709333736e-06, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18779677152633667, |
| "step": 3705, |
| "valid_targets_mean": 3780.4, |
| "valid_targets_min": 700 |
| }, |
| { |
| "epoch": 5.57057057057057, |
| "grad_norm": 0.5796418427811311, |
| "learning_rate": 4.880996707192227e-06, |
| "loss": 0.2076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18160055577754974, |
| "step": 3710, |
| "valid_targets_mean": 3617.5, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 5.578078078078078, |
| "grad_norm": 0.625613489620117, |
| "learning_rate": 4.832078302799437e-06, |
| "loss": 0.231, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2596314549446106, |
| "step": 3715, |
| "valid_targets_mean": 4067.5, |
| "valid_targets_min": 928 |
| }, |
| { |
| "epoch": 5.585585585585585, |
| "grad_norm": 0.4752383217997911, |
| "learning_rate": 4.7833725660381356e-06, |
| "loss": 0.21, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15992337465286255, |
| "step": 3720, |
| "valid_targets_mean": 4770.9, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 5.593093093093093, |
| "grad_norm": 0.5779722936684374, |
| "learning_rate": 4.734880179805685e-06, |
| "loss": 0.2091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18457244336605072, |
| "step": 3725, |
| "valid_targets_mean": 3342.9, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 5.6006006006006, |
| "grad_norm": 0.550075630002128, |
| "learning_rate": 4.686601824008079e-06, |
| "loss": 0.2177, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18044841289520264, |
| "step": 3730, |
| "valid_targets_mean": 4945.1, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 5.608108108108108, |
| "grad_norm": 0.631353153629254, |
| "learning_rate": 4.638538175550422e-06, |
| "loss": 0.195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21107108891010284, |
| "step": 3735, |
| "valid_targets_mean": 3289.5, |
| "valid_targets_min": 552 |
| }, |
| { |
| "epoch": 5.615615615615615, |
| "grad_norm": 0.7558092942754301, |
| "learning_rate": 4.590689908327428e-06, |
| "loss": 0.2214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20774057507514954, |
| "step": 3740, |
| "valid_targets_mean": 2326.2, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 5.623123123123123, |
| "grad_norm": 0.6050928606517935, |
| "learning_rate": 4.543057693213973e-06, |
| "loss": 0.2071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.230237677693367, |
| "step": 3745, |
| "valid_targets_mean": 3875.2, |
| "valid_targets_min": 504 |
| }, |
| { |
| "epoch": 5.63063063063063, |
| "grad_norm": 0.5844617202863044, |
| "learning_rate": 4.495642198055707e-06, |
| "loss": 0.2215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2029937505722046, |
| "step": 3750, |
| "valid_targets_mean": 4027.4, |
| "valid_targets_min": 536 |
| }, |
| { |
| "epoch": 5.638138138138138, |
| "grad_norm": 0.7169568097777915, |
| "learning_rate": 4.4484440876596625e-06, |
| "loss": 0.2364, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22157275676727295, |
| "step": 3755, |
| "valid_targets_mean": 2619.1, |
| "valid_targets_min": 657 |
| }, |
| { |
| "epoch": 5.645645645645645, |
| "grad_norm": 0.5563696214524937, |
| "learning_rate": 4.401464023784945e-06, |
| "loss": 0.2007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1895512342453003, |
| "step": 3760, |
| "valid_targets_mean": 4033.1, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 5.653153153153153, |
| "grad_norm": 0.7184497569373026, |
| "learning_rate": 4.354702665133457e-06, |
| "loss": 0.2035, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17378777265548706, |
| "step": 3765, |
| "valid_targets_mean": 4711.1, |
| "valid_targets_min": 460 |
| }, |
| { |
| "epoch": 5.66066066066066, |
| "grad_norm": 0.672562372546706, |
| "learning_rate": 4.308160667340671e-06, |
| "loss": 0.22, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23928751051425934, |
| "step": 3770, |
| "valid_targets_mean": 2964.8, |
| "valid_targets_min": 402 |
| }, |
| { |
| "epoch": 5.668168168168168, |
| "grad_norm": 0.4887664405970491, |
| "learning_rate": 4.261838682966413e-06, |
| "loss": 0.2001, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19159993529319763, |
| "step": 3775, |
| "valid_targets_mean": 5129.8, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 5.675675675675675, |
| "grad_norm": 0.5457059516129726, |
| "learning_rate": 4.215737361485737e-06, |
| "loss": 0.2193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21986320614814758, |
| "step": 3780, |
| "valid_targets_mean": 5641.1, |
| "valid_targets_min": 915 |
| }, |
| { |
| "epoch": 5.683183183183183, |
| "grad_norm": 0.5115604631418055, |
| "learning_rate": 4.1698573492798e-06, |
| "loss": 0.198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1333058923482895, |
| "step": 3785, |
| "valid_targets_mean": 3278.0, |
| "valid_targets_min": 647 |
| }, |
| { |
| "epoch": 5.6906906906906904, |
| "grad_norm": 0.7200821505353998, |
| "learning_rate": 4.124199289626818e-06, |
| "loss": 0.2007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22922024130821228, |
| "step": 3790, |
| "valid_targets_mean": 2683.2, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 5.698198198198198, |
| "grad_norm": 0.42145237729701907, |
| "learning_rate": 4.078763822693021e-06, |
| "loss": 0.206, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18455691635608673, |
| "step": 3795, |
| "valid_targets_mean": 6690.8, |
| "valid_targets_min": 920 |
| }, |
| { |
| "epoch": 5.7057057057057055, |
| "grad_norm": 0.5325975126541347, |
| "learning_rate": 4.033551585523716e-06, |
| "loss": 0.2049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19546617567539215, |
| "step": 3800, |
| "valid_targets_mean": 5228.1, |
| "valid_targets_min": 594 |
| }, |
| { |
| "epoch": 5.713213213213213, |
| "grad_norm": 0.6601846614023362, |
| "learning_rate": 3.988563212034315e-06, |
| "loss": 0.2511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15158836543560028, |
| "step": 3805, |
| "valid_targets_mean": 3667.6, |
| "valid_targets_min": 358 |
| }, |
| { |
| "epoch": 5.7207207207207205, |
| "grad_norm": 0.6027115950409477, |
| "learning_rate": 3.943799333001466e-06, |
| "loss": 0.2164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19812247157096863, |
| "step": 3810, |
| "valid_targets_mean": 3187.2, |
| "valid_targets_min": 542 |
| }, |
| { |
| "epoch": 5.728228228228228, |
| "grad_norm": 0.7999468435844861, |
| "learning_rate": 3.899260576054209e-06, |
| "loss": 0.2164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24161022901535034, |
| "step": 3815, |
| "valid_targets_mean": 2608.4, |
| "valid_targets_min": 416 |
| }, |
| { |
| "epoch": 5.7357357357357355, |
| "grad_norm": 0.6197457192371475, |
| "learning_rate": 3.854947565665172e-06, |
| "loss": 0.2337, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20346400141716003, |
| "step": 3820, |
| "valid_targets_mean": 3887.9, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 5.743243243243243, |
| "grad_norm": 0.5811299922570492, |
| "learning_rate": 3.810860923141824e-06, |
| "loss": 0.2173, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2590106129646301, |
| "step": 3825, |
| "valid_targets_mean": 4175.2, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 5.7507507507507505, |
| "grad_norm": 0.6108735444142156, |
| "learning_rate": 3.767001266617747e-06, |
| "loss": 0.2198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21409021317958832, |
| "step": 3830, |
| "valid_targets_mean": 3856.4, |
| "valid_targets_min": 504 |
| }, |
| { |
| "epoch": 5.758258258258258, |
| "grad_norm": 0.5427297235952976, |
| "learning_rate": 3.7233692110439814e-06, |
| "loss": 0.2104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20367692410945892, |
| "step": 3835, |
| "valid_targets_mean": 4545.9, |
| "valid_targets_min": 666 |
| }, |
| { |
| "epoch": 5.7657657657657655, |
| "grad_norm": 0.4682965132065941, |
| "learning_rate": 3.679965368180416e-06, |
| "loss": 0.1959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1938939094543457, |
| "step": 3840, |
| "valid_targets_mean": 5888.4, |
| "valid_targets_min": 915 |
| }, |
| { |
| "epoch": 5.773273273273273, |
| "grad_norm": 0.5399446918848115, |
| "learning_rate": 3.6367903465871755e-06, |
| "loss": 0.2268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24548377096652985, |
| "step": 3845, |
| "valid_targets_mean": 5109.5, |
| "valid_targets_min": 602 |
| }, |
| { |
| "epoch": 5.7807807807807805, |
| "grad_norm": 0.4864834575204545, |
| "learning_rate": 3.59384475161612e-06, |
| "loss": 0.2163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21027377247810364, |
| "step": 3850, |
| "valid_targets_mean": 4894.0, |
| "valid_targets_min": 636 |
| }, |
| { |
| "epoch": 5.788288288288288, |
| "grad_norm": 0.5438912695013488, |
| "learning_rate": 3.5511291854023466e-06, |
| "loss": 0.2059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23461908102035522, |
| "step": 3855, |
| "valid_targets_mean": 4590.5, |
| "valid_targets_min": 666 |
| }, |
| { |
| "epoch": 5.7957957957957955, |
| "grad_norm": 0.5232434234880898, |
| "learning_rate": 3.508644246855739e-06, |
| "loss": 0.2097, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20156699419021606, |
| "step": 3860, |
| "valid_targets_mean": 4557.0, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 5.803303303303303, |
| "grad_norm": 0.5868070563906084, |
| "learning_rate": 3.466390531652588e-06, |
| "loss": 0.2079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19073697924613953, |
| "step": 3865, |
| "valid_targets_mean": 4407.1, |
| "valid_targets_min": 259 |
| }, |
| { |
| "epoch": 5.8108108108108105, |
| "grad_norm": 0.5169034481605863, |
| "learning_rate": 3.4243686322272195e-06, |
| "loss": 0.2133, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2452038675546646, |
| "step": 3870, |
| "valid_targets_mean": 5199.6, |
| "valid_targets_min": 564 |
| }, |
| { |
| "epoch": 5.818318318318318, |
| "grad_norm": 0.5384261747880087, |
| "learning_rate": 3.3825791377636998e-06, |
| "loss": 0.1954, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2101140320301056, |
| "step": 3875, |
| "valid_targets_mean": 4844.0, |
| "valid_targets_min": 427 |
| }, |
| { |
| "epoch": 5.8258258258258255, |
| "grad_norm": 0.7881322308404421, |
| "learning_rate": 3.341022634187585e-06, |
| "loss": 0.2041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23327091336250305, |
| "step": 3880, |
| "valid_targets_mean": 3447.8, |
| "valid_targets_min": 485 |
| }, |
| { |
| "epoch": 5.833333333333333, |
| "grad_norm": 0.5514296552758701, |
| "learning_rate": 3.2996997041576795e-06, |
| "loss": 0.2105, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20250976085662842, |
| "step": 3885, |
| "valid_targets_mean": 4440.7, |
| "valid_targets_min": 434 |
| }, |
| { |
| "epoch": 5.8408408408408405, |
| "grad_norm": 0.651802460092001, |
| "learning_rate": 3.2586109270578836e-06, |
| "loss": 0.193, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2257906049489975, |
| "step": 3890, |
| "valid_targets_mean": 4516.6, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 5.848348348348348, |
| "grad_norm": 0.5643346645467794, |
| "learning_rate": 3.217756878989069e-06, |
| "loss": 0.2237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22649335861206055, |
| "step": 3895, |
| "valid_targets_mean": 4361.2, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 5.8558558558558556, |
| "grad_norm": 0.6943626771374626, |
| "learning_rate": 3.1771381327609997e-06, |
| "loss": 0.2263, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23687607049942017, |
| "step": 3900, |
| "valid_targets_mean": 3878.1, |
| "valid_targets_min": 391 |
| }, |
| { |
| "epoch": 5.863363363363363, |
| "grad_norm": 0.5703396214687839, |
| "learning_rate": 3.1367552578842986e-06, |
| "loss": 0.1972, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22399486601352692, |
| "step": 3905, |
| "valid_targets_mean": 4644.7, |
| "valid_targets_min": 439 |
| }, |
| { |
| "epoch": 5.870870870870871, |
| "grad_norm": 3.5482019538966396, |
| "learning_rate": 3.096608820562468e-06, |
| "loss": 0.1959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14243656396865845, |
| "step": 3910, |
| "valid_targets_mean": 3601.3, |
| "valid_targets_min": 723 |
| }, |
| { |
| "epoch": 5.878378378378378, |
| "grad_norm": 0.6997352643905546, |
| "learning_rate": 3.0566993836839387e-06, |
| "loss": 0.2354, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22578692436218262, |
| "step": 3915, |
| "valid_targets_mean": 2871.8, |
| "valid_targets_min": 481 |
| }, |
| { |
| "epoch": 5.885885885885886, |
| "grad_norm": 0.61982038677274, |
| "learning_rate": 3.017027506814203e-06, |
| "loss": 0.2138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.212412029504776, |
| "step": 3920, |
| "valid_targets_mean": 3693.6, |
| "valid_targets_min": 641 |
| }, |
| { |
| "epoch": 5.893393393393393, |
| "grad_norm": 0.502898749801898, |
| "learning_rate": 2.9775937461879368e-06, |
| "loss": 0.2034, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18976537883281708, |
| "step": 3925, |
| "valid_targets_mean": 5294.2, |
| "valid_targets_min": 649 |
| }, |
| { |
| "epoch": 5.900900900900901, |
| "grad_norm": 0.705380106461315, |
| "learning_rate": 2.9383986547012222e-06, |
| "loss": 0.2052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21276956796646118, |
| "step": 3930, |
| "valid_targets_mean": 2696.2, |
| "valid_targets_min": 569 |
| }, |
| { |
| "epoch": 5.908408408408408, |
| "grad_norm": 0.6824495687596949, |
| "learning_rate": 2.8994427819037873e-06, |
| "loss": 0.2071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27314475178718567, |
| "step": 3935, |
| "valid_targets_mean": 5253.1, |
| "valid_targets_min": 879 |
| }, |
| { |
| "epoch": 5.915915915915916, |
| "grad_norm": 0.6133652704497186, |
| "learning_rate": 2.8607266739913077e-06, |
| "loss": 0.2078, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24844960868358612, |
| "step": 3940, |
| "valid_targets_mean": 4655.8, |
| "valid_targets_min": 819 |
| }, |
| { |
| "epoch": 5.923423423423423, |
| "grad_norm": 0.5714988842182993, |
| "learning_rate": 2.822250873797743e-06, |
| "loss": 0.226, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19975441694259644, |
| "step": 3945, |
| "valid_targets_mean": 4395.9, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 5.930930930930931, |
| "grad_norm": 0.8230004411475231, |
| "learning_rate": 2.784015920787719e-06, |
| "loss": 0.2254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3142227828502655, |
| "step": 3950, |
| "valid_targets_mean": 4321.6, |
| "valid_targets_min": 853 |
| }, |
| { |
| "epoch": 5.938438438438438, |
| "grad_norm": 0.572231017896013, |
| "learning_rate": 2.746022351048978e-06, |
| "loss": 0.2267, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2292689085006714, |
| "step": 3955, |
| "valid_targets_mean": 4084.4, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 5.945945945945946, |
| "grad_norm": 0.8188722407870543, |
| "learning_rate": 2.708270697284865e-06, |
| "loss": 0.2123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24927443265914917, |
| "step": 3960, |
| "valid_targets_mean": 3767.1, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 5.953453453453453, |
| "grad_norm": 0.5185251151107919, |
| "learning_rate": 2.6707614888068365e-06, |
| "loss": 0.209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19668208062648773, |
| "step": 3965, |
| "valid_targets_mean": 4310.9, |
| "valid_targets_min": 423 |
| }, |
| { |
| "epoch": 5.960960960960961, |
| "grad_norm": 0.5542673950873109, |
| "learning_rate": 2.633495251527054e-06, |
| "loss": 0.1931, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24870452284812927, |
| "step": 3970, |
| "valid_targets_mean": 5467.7, |
| "valid_targets_min": 973 |
| }, |
| { |
| "epoch": 5.968468468468468, |
| "grad_norm": 0.6048295638583769, |
| "learning_rate": 2.5964725079510134e-06, |
| "loss": 0.2045, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17934688925743103, |
| "step": 3975, |
| "valid_targets_mean": 3691.8, |
| "valid_targets_min": 715 |
| }, |
| { |
| "epoch": 5.975975975975976, |
| "grad_norm": 0.5714679755869654, |
| "learning_rate": 2.5596937771702113e-06, |
| "loss": 0.1995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18001726269721985, |
| "step": 3980, |
| "valid_targets_mean": 3830.1, |
| "valid_targets_min": 698 |
| }, |
| { |
| "epoch": 5.983483483483483, |
| "grad_norm": 0.5678385470019257, |
| "learning_rate": 2.523159574854872e-06, |
| "loss": 0.2096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19507171213626862, |
| "step": 3985, |
| "valid_targets_mean": 3516.0, |
| "valid_targets_min": 311 |
| }, |
| { |
| "epoch": 5.990990990990991, |
| "grad_norm": 0.685934053595724, |
| "learning_rate": 2.4868704132467115e-06, |
| "loss": 0.2047, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2302461564540863, |
| "step": 3990, |
| "valid_targets_mean": 2869.4, |
| "valid_targets_min": 584 |
| }, |
| { |
| "epoch": 5.998498498498498, |
| "grad_norm": 0.6065925509118129, |
| "learning_rate": 2.45082680115176e-06, |
| "loss": 0.2199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19993174076080322, |
| "step": 3995, |
| "valid_targets_mean": 3674.2, |
| "valid_targets_min": 414 |
| }, |
| { |
| "epoch": 6.006006006006006, |
| "grad_norm": 0.4490328583511514, |
| "learning_rate": 2.4150292439332355e-06, |
| "loss": 0.1979, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19256381690502167, |
| "step": 4000, |
| "valid_targets_mean": 5463.9, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 6.013513513513513, |
| "grad_norm": 0.5503944239111109, |
| "learning_rate": 2.3794782435044384e-06, |
| "loss": 0.1788, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17218606173992157, |
| "step": 4005, |
| "valid_targets_mean": 3465.8, |
| "valid_targets_min": 930 |
| }, |
| { |
| "epoch": 6.021021021021021, |
| "grad_norm": 0.5533090724442471, |
| "learning_rate": 2.344174298321733e-06, |
| "loss": 0.2125, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.213973268866539, |
| "step": 4010, |
| "valid_targets_mean": 4543.8, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 6.028528528528528, |
| "grad_norm": 0.6792685607327363, |
| "learning_rate": 2.3091179033775445e-06, |
| "loss": 0.2038, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2688198983669281, |
| "step": 4015, |
| "valid_targets_mean": 3235.7, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 6.036036036036036, |
| "grad_norm": 0.46026148213907403, |
| "learning_rate": 2.27430955019343e-06, |
| "loss": 0.2157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1564239263534546, |
| "step": 4020, |
| "valid_targets_mean": 5029.9, |
| "valid_targets_min": 1069 |
| }, |
| { |
| "epoch": 6.043543543543543, |
| "grad_norm": 0.5322076051668858, |
| "learning_rate": 2.239749726813183e-06, |
| "loss": 0.2239, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19674474000930786, |
| "step": 4025, |
| "valid_targets_mean": 4798.2, |
| "valid_targets_min": 478 |
| }, |
| { |
| "epoch": 6.051051051051051, |
| "grad_norm": 0.5891185848467975, |
| "learning_rate": 2.20543891779599e-06, |
| "loss": 0.199, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18149876594543457, |
| "step": 4030, |
| "valid_targets_mean": 4520.9, |
| "valid_targets_min": 648 |
| }, |
| { |
| "epoch": 6.058558558558558, |
| "grad_norm": 0.6755239064217278, |
| "learning_rate": 2.1713776042096302e-06, |
| "loss": 0.2046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2210536003112793, |
| "step": 4035, |
| "valid_targets_mean": 3545.1, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 6.066066066066066, |
| "grad_norm": 0.6088360110015828, |
| "learning_rate": 2.1375662636237493e-06, |
| "loss": 0.1992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22115203738212585, |
| "step": 4040, |
| "valid_targets_mean": 5270.9, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 6.073573573573573, |
| "grad_norm": 0.5822383908375098, |
| "learning_rate": 2.1040053701031414e-06, |
| "loss": 0.2067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21398739516735077, |
| "step": 4045, |
| "valid_targets_mean": 4107.5, |
| "valid_targets_min": 483 |
| }, |
| { |
| "epoch": 6.081081081081081, |
| "grad_norm": 0.6863357601545187, |
| "learning_rate": 2.0706953942011165e-06, |
| "loss": 0.2227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21303421258926392, |
| "step": 4050, |
| "valid_targets_mean": 3397.6, |
| "valid_targets_min": 691 |
| }, |
| { |
| "epoch": 6.088588588588588, |
| "grad_norm": 0.6835718993938039, |
| "learning_rate": 2.0376368029528935e-06, |
| "loss": 0.2104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2734207510948181, |
| "step": 4055, |
| "valid_targets_mean": 3650.6, |
| "valid_targets_min": 652 |
| }, |
| { |
| "epoch": 6.096096096096096, |
| "grad_norm": 0.45120552286100196, |
| "learning_rate": 2.0048300598690627e-06, |
| "loss": 0.2164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25283950567245483, |
| "step": 4060, |
| "valid_targets_mean": 7365.3, |
| "valid_targets_min": 993 |
| }, |
| { |
| "epoch": 6.103603603603603, |
| "grad_norm": 0.63959559159808, |
| "learning_rate": 1.9722756249290785e-06, |
| "loss": 0.2116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2537308633327484, |
| "step": 4065, |
| "valid_targets_mean": 4346.6, |
| "valid_targets_min": 668 |
| }, |
| { |
| "epoch": 6.111111111111111, |
| "grad_norm": 0.6496824147481889, |
| "learning_rate": 1.939973954574812e-06, |
| "loss": 0.175, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15889085829257965, |
| "step": 4070, |
| "valid_targets_mean": 3991.0, |
| "valid_targets_min": 738 |
| }, |
| { |
| "epoch": 6.118618618618618, |
| "grad_norm": 0.5705409403401243, |
| "learning_rate": 1.9079255017041487e-06, |
| "loss": 0.2026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17797492444515228, |
| "step": 4075, |
| "valid_targets_mean": 4241.4, |
| "valid_targets_min": 618 |
| }, |
| { |
| "epoch": 6.126126126126126, |
| "grad_norm": 0.4815875979801429, |
| "learning_rate": 1.8761307156646547e-06, |
| "loss": 0.2204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15079014003276825, |
| "step": 4080, |
| "valid_targets_mean": 4996.1, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 6.133633633633633, |
| "grad_norm": 0.5146233292308801, |
| "learning_rate": 1.8445900422472495e-06, |
| "loss": 0.2046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18511003255844116, |
| "step": 4085, |
| "valid_targets_mean": 4634.7, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 6.141141141141141, |
| "grad_norm": 0.5624700118014101, |
| "learning_rate": 1.8133039236799788e-06, |
| "loss": 0.2067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2083277553319931, |
| "step": 4090, |
| "valid_targets_mean": 4171.3, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 6.148648648648648, |
| "grad_norm": 0.7177782923244695, |
| "learning_rate": 1.7822727986217957e-06, |
| "loss": 0.2237, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18404030799865723, |
| "step": 4095, |
| "valid_targets_mean": 2409.4, |
| "valid_targets_min": 593 |
| }, |
| { |
| "epoch": 6.156156156156156, |
| "grad_norm": 0.5228873362141804, |
| "learning_rate": 1.7514971021564275e-06, |
| "loss": 0.2147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1940818727016449, |
| "step": 4100, |
| "valid_targets_mean": 4779.9, |
| "valid_targets_min": 511 |
| }, |
| { |
| "epoch": 6.163663663663663, |
| "grad_norm": 0.4487406897661156, |
| "learning_rate": 1.7209772657862657e-06, |
| "loss": 0.1958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1845383495092392, |
| "step": 4105, |
| "valid_targets_mean": 6135.4, |
| "valid_targets_min": 515 |
| }, |
| { |
| "epoch": 6.171171171171171, |
| "grad_norm": 0.5106337969240039, |
| "learning_rate": 1.6907137174263156e-06, |
| "loss": 0.2004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17622476816177368, |
| "step": 4110, |
| "valid_targets_mean": 4512.0, |
| "valid_targets_min": 463 |
| }, |
| { |
| "epoch": 6.178678678678678, |
| "grad_norm": 0.6441468445611757, |
| "learning_rate": 1.6607068813981952e-06, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2345384955406189, |
| "step": 4115, |
| "valid_targets_mean": 3844.5, |
| "valid_targets_min": 471 |
| }, |
| { |
| "epoch": 6.186186186186186, |
| "grad_norm": 0.5581311436354888, |
| "learning_rate": 1.6309571784242062e-06, |
| "loss": 0.2017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17409540712833405, |
| "step": 4120, |
| "valid_targets_mean": 4888.1, |
| "valid_targets_min": 645 |
| }, |
| { |
| "epoch": 6.193693693693693, |
| "grad_norm": 0.5762764403446647, |
| "learning_rate": 1.601465025621398e-06, |
| "loss": 0.2212, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22839732468128204, |
| "step": 4125, |
| "valid_targets_mean": 4442.8, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 6.201201201201201, |
| "grad_norm": 0.488635665892412, |
| "learning_rate": 1.5722308364957517e-06, |
| "loss": 0.1868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19067010283470154, |
| "step": 4130, |
| "valid_targets_mean": 5109.4, |
| "valid_targets_min": 606 |
| }, |
| { |
| "epoch": 6.208708708708708, |
| "grad_norm": 0.5702695176534012, |
| "learning_rate": 1.5432550209363606e-06, |
| "loss": 0.2119, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19797605276107788, |
| "step": 4135, |
| "valid_targets_mean": 4942.1, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 6.216216216216216, |
| "grad_norm": 0.5547765610808129, |
| "learning_rate": 1.5145379852097054e-06, |
| "loss": 0.1995, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21563218533992767, |
| "step": 4140, |
| "valid_targets_mean": 4537.9, |
| "valid_targets_min": 498 |
| }, |
| { |
| "epoch": 6.223723723723724, |
| "grad_norm": 0.6133297188420032, |
| "learning_rate": 1.4860801319539354e-06, |
| "loss": 0.2217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2022094428539276, |
| "step": 4145, |
| "valid_targets_mean": 3766.9, |
| "valid_targets_min": 602 |
| }, |
| { |
| "epoch": 6.231231231231231, |
| "grad_norm": 0.5500242111051548, |
| "learning_rate": 1.457881860173236e-06, |
| "loss": 0.1928, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14841407537460327, |
| "step": 4150, |
| "valid_targets_mean": 3554.3, |
| "valid_targets_min": 628 |
| }, |
| { |
| "epoch": 6.238738738738739, |
| "grad_norm": 0.6493235742255749, |
| "learning_rate": 1.429943565232228e-06, |
| "loss": 0.2165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29499688744544983, |
| "step": 4155, |
| "valid_targets_mean": 4105.4, |
| "valid_targets_min": 391 |
| }, |
| { |
| "epoch": 6.246246246246246, |
| "grad_norm": 0.46401350568259536, |
| "learning_rate": 1.4022656388504418e-06, |
| "loss": 0.2026, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1871238350868225, |
| "step": 4160, |
| "valid_targets_mean": 5385.7, |
| "valid_targets_min": 467 |
| }, |
| { |
| "epoch": 6.253753753753754, |
| "grad_norm": 0.5751734802750025, |
| "learning_rate": 1.3748484690967967e-06, |
| "loss": 0.1754, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17546819150447845, |
| "step": 4165, |
| "valid_targets_mean": 4171.8, |
| "valid_targets_min": 564 |
| }, |
| { |
| "epoch": 6.261261261261261, |
| "grad_norm": 0.824863745151526, |
| "learning_rate": 1.3476924403841762e-06, |
| "loss": 0.2352, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21639591455459595, |
| "step": 4170, |
| "valid_targets_mean": 2713.2, |
| "valid_targets_min": 473 |
| }, |
| { |
| "epoch": 6.268768768768769, |
| "grad_norm": 0.570544358689332, |
| "learning_rate": 1.3207979334640419e-06, |
| "loss": 0.2095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20927639305591583, |
| "step": 4175, |
| "valid_targets_mean": 4503.6, |
| "valid_targets_min": 774 |
| }, |
| { |
| "epoch": 6.276276276276276, |
| "grad_norm": 0.5313264329238784, |
| "learning_rate": 1.294165325421084e-06, |
| "loss": 0.2398, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29111388325691223, |
| "step": 4180, |
| "valid_targets_mean": 5414.2, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 6.283783783783784, |
| "grad_norm": 0.5675843811457961, |
| "learning_rate": 1.2677949896679408e-06, |
| "loss": 0.2117, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20922914147377014, |
| "step": 4185, |
| "valid_targets_mean": 4288.4, |
| "valid_targets_min": 434 |
| }, |
| { |
| "epoch": 6.291291291291291, |
| "grad_norm": 0.5380343131647501, |
| "learning_rate": 1.241687295939966e-06, |
| "loss": 0.1725, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14380943775177002, |
| "step": 4190, |
| "valid_targets_mean": 4689.5, |
| "valid_targets_min": 367 |
| }, |
| { |
| "epoch": 6.298798798798799, |
| "grad_norm": 0.5899919262888533, |
| "learning_rate": 1.2158426102900345e-06, |
| "loss": 0.189, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19863969087600708, |
| "step": 4195, |
| "valid_targets_mean": 4058.4, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 6.306306306306306, |
| "grad_norm": 0.5264653142973713, |
| "learning_rate": 1.1902612950834213e-06, |
| "loss": 0.2007, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.197919100522995, |
| "step": 4200, |
| "valid_targets_mean": 4504.0, |
| "valid_targets_min": 727 |
| }, |
| { |
| "epoch": 6.313813813813814, |
| "grad_norm": 0.5816807471532681, |
| "learning_rate": 1.164943708992714e-06, |
| "loss": 0.1954, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19351375102996826, |
| "step": 4205, |
| "valid_targets_mean": 3772.9, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 6.321321321321321, |
| "grad_norm": 0.6196400182011077, |
| "learning_rate": 1.1398902069927842e-06, |
| "loss": 0.232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3165440261363983, |
| "step": 4210, |
| "valid_targets_mean": 4516.8, |
| "valid_targets_min": 374 |
| }, |
| { |
| "epoch": 6.328828828828829, |
| "grad_norm": 0.5403053431375547, |
| "learning_rate": 1.115101140355812e-06, |
| "loss": 0.2077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20008732378482819, |
| "step": 4215, |
| "valid_targets_mean": 4993.6, |
| "valid_targets_min": 667 |
| }, |
| { |
| "epoch": 6.336336336336337, |
| "grad_norm": 0.5311224743152807, |
| "learning_rate": 1.0905768566463593e-06, |
| "loss": 0.2158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2345670610666275, |
| "step": 4220, |
| "valid_targets_mean": 5031.6, |
| "valid_targets_min": 559 |
| }, |
| { |
| "epoch": 6.343843843843844, |
| "grad_norm": 0.7193489501948159, |
| "learning_rate": 1.0663176997165037e-06, |
| "loss": 0.2083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18373778462409973, |
| "step": 4225, |
| "valid_targets_mean": 2563.9, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 6.351351351351352, |
| "grad_norm": 0.6194973179199644, |
| "learning_rate": 1.0423240097010056e-06, |
| "loss": 0.1904, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17724689841270447, |
| "step": 4230, |
| "valid_targets_mean": 2932.5, |
| "valid_targets_min": 550 |
| }, |
| { |
| "epoch": 6.358858858858859, |
| "grad_norm": 0.5938101431895507, |
| "learning_rate": 1.018596123012545e-06, |
| "loss": 0.2014, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15485897660255432, |
| "step": 4235, |
| "valid_targets_mean": 3859.1, |
| "valid_targets_min": 565 |
| }, |
| { |
| "epoch": 6.366366366366367, |
| "grad_norm": 0.5832105338347596, |
| "learning_rate": 9.951343723370145e-07, |
| "loss": 0.2217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27296674251556396, |
| "step": 4240, |
| "valid_targets_mean": 4697.3, |
| "valid_targets_min": 651 |
| }, |
| { |
| "epoch": 6.373873873873874, |
| "grad_norm": 0.6257938479877299, |
| "learning_rate": 9.719390866288325e-07, |
| "loss": 0.2018, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21452078223228455, |
| "step": 4245, |
| "valid_targets_mean": 3980.8, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 6.381381381381382, |
| "grad_norm": 0.4748467821348681, |
| "learning_rate": 9.490105911063519e-07, |
| "loss": 0.1984, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19311422109603882, |
| "step": 4250, |
| "valid_targets_mean": 4970.2, |
| "valid_targets_min": 958 |
| }, |
| { |
| "epoch": 6.388888888888889, |
| "grad_norm": 0.49848343014176094, |
| "learning_rate": 9.263492072472879e-07, |
| "loss": 0.2041, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20664718747138977, |
| "step": 4255, |
| "valid_targets_mean": 5091.6, |
| "valid_targets_min": 530 |
| }, |
| { |
| "epoch": 6.396396396396397, |
| "grad_norm": 0.4839998287321489, |
| "learning_rate": 9.039552527842188e-07, |
| "loss": 0.1931, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15590183436870575, |
| "step": 4260, |
| "valid_targets_mean": 4334.7, |
| "valid_targets_min": 755 |
| }, |
| { |
| "epoch": 6.403903903903904, |
| "grad_norm": 0.47675581127591066, |
| "learning_rate": 8.818290417001218e-07, |
| "loss": 0.1877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18418073654174805, |
| "step": 4265, |
| "valid_targets_mean": 5461.1, |
| "valid_targets_min": 875 |
| }, |
| { |
| "epoch": 6.411411411411412, |
| "grad_norm": 0.5148421630943572, |
| "learning_rate": 8.599708842239795e-07, |
| "loss": 0.2056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1673521250486374, |
| "step": 4270, |
| "valid_targets_mean": 5613.2, |
| "valid_targets_min": 791 |
| }, |
| { |
| "epoch": 6.418918918918919, |
| "grad_norm": 0.6034041442260967, |
| "learning_rate": 8.383810868264253e-07, |
| "loss": 0.2101, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2042214274406433, |
| "step": 4275, |
| "valid_targets_mean": 4745.4, |
| "valid_targets_min": 521 |
| }, |
| { |
| "epoch": 6.426426426426427, |
| "grad_norm": 0.44620270158602615, |
| "learning_rate": 8.17059952215451e-07, |
| "loss": 0.1892, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14886009693145752, |
| "step": 4280, |
| "valid_targets_mean": 5529.8, |
| "valid_targets_min": 1189 |
| }, |
| { |
| "epoch": 6.433933933933934, |
| "grad_norm": 0.5070235125913082, |
| "learning_rate": 7.960077793321552e-07, |
| "loss": 0.1769, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19193494319915771, |
| "step": 4285, |
| "valid_targets_mean": 5251.6, |
| "valid_targets_min": 425 |
| }, |
| { |
| "epoch": 6.441441441441442, |
| "grad_norm": 0.5615395471791965, |
| "learning_rate": 7.752248633465576e-07, |
| "loss": 0.215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22860676050186157, |
| "step": 4290, |
| "valid_targets_mean": 3936.7, |
| "valid_targets_min": 583 |
| }, |
| { |
| "epoch": 6.448948948948949, |
| "grad_norm": 0.5442260146056317, |
| "learning_rate": 7.547114956534574e-07, |
| "loss": 0.1909, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1491059809923172, |
| "step": 4295, |
| "valid_targets_mean": 3889.1, |
| "valid_targets_min": 485 |
| }, |
| { |
| "epoch": 6.456456456456457, |
| "grad_norm": 0.5835357955664173, |
| "learning_rate": 7.344679638683527e-07, |
| "loss": 0.2332, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2454603910446167, |
| "step": 4300, |
| "valid_targets_mean": 5267.1, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 6.463963963963964, |
| "grad_norm": 0.6370221393360167, |
| "learning_rate": 7.144945518234014e-07, |
| "loss": 0.2188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20245075225830078, |
| "step": 4305, |
| "valid_targets_mean": 3993.6, |
| "valid_targets_min": 292 |
| }, |
| { |
| "epoch": 6.471471471471472, |
| "grad_norm": 0.487081794320264, |
| "learning_rate": 6.947915395634463e-07, |
| "loss": 0.2125, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22089102864265442, |
| "step": 4310, |
| "valid_targets_mean": 4927.1, |
| "valid_targets_min": 801 |
| }, |
| { |
| "epoch": 6.478978978978979, |
| "grad_norm": 0.6970402670081776, |
| "learning_rate": 6.753592033420809e-07, |
| "loss": 0.1902, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19842252135276794, |
| "step": 4315, |
| "valid_targets_mean": 2896.4, |
| "valid_targets_min": 475 |
| }, |
| { |
| "epoch": 6.486486486486487, |
| "grad_norm": 0.5079593962075888, |
| "learning_rate": 6.561978156177939e-07, |
| "loss": 0.1899, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1689176708459854, |
| "step": 4320, |
| "valid_targets_mean": 4254.1, |
| "valid_targets_min": 861 |
| }, |
| { |
| "epoch": 6.493993993993994, |
| "grad_norm": 0.6574113141398381, |
| "learning_rate": 6.37307645050127e-07, |
| "loss": 0.2036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2085978239774704, |
| "step": 4325, |
| "valid_targets_mean": 3372.8, |
| "valid_targets_min": 478 |
| }, |
| { |
| "epoch": 6.501501501501502, |
| "grad_norm": 0.508520487800978, |
| "learning_rate": 6.186889564959209e-07, |
| "loss": 0.2103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23924149572849274, |
| "step": 4330, |
| "valid_targets_mean": 5251.2, |
| "valid_targets_min": 565 |
| }, |
| { |
| "epoch": 6.509009009009009, |
| "grad_norm": 0.6324952400411343, |
| "learning_rate": 6.003420110056035e-07, |
| "loss": 0.204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2557426691055298, |
| "step": 4335, |
| "valid_targets_mean": 4012.0, |
| "valid_targets_min": 503 |
| }, |
| { |
| "epoch": 6.516516516516517, |
| "grad_norm": 0.553904609232918, |
| "learning_rate": 5.822670658195173e-07, |
| "loss": 0.1907, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21928340196609497, |
| "step": 4340, |
| "valid_targets_mean": 4482.4, |
| "valid_targets_min": 462 |
| }, |
| { |
| "epoch": 6.524024024024024, |
| "grad_norm": 0.616465266517478, |
| "learning_rate": 5.644643743643308e-07, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21219468116760254, |
| "step": 4345, |
| "valid_targets_mean": 3722.6, |
| "valid_targets_min": 504 |
| }, |
| { |
| "epoch": 6.531531531531532, |
| "grad_norm": 0.7300734830816725, |
| "learning_rate": 5.469341862494637e-07, |
| "loss": 0.2046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2306327223777771, |
| "step": 4350, |
| "valid_targets_mean": 2665.6, |
| "valid_targets_min": 527 |
| }, |
| { |
| "epoch": 6.539039039039039, |
| "grad_norm": 0.5642202986656522, |
| "learning_rate": 5.296767472636077e-07, |
| "loss": 0.1916, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1920192539691925, |
| "step": 4355, |
| "valid_targets_mean": 3940.9, |
| "valid_targets_min": 461 |
| }, |
| { |
| "epoch": 6.546546546546547, |
| "grad_norm": 0.5150972885704285, |
| "learning_rate": 5.12692299371269e-07, |
| "loss": 0.1942, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14734071493148804, |
| "step": 4360, |
| "valid_targets_mean": 4389.3, |
| "valid_targets_min": 590 |
| }, |
| { |
| "epoch": 6.554054054054054, |
| "grad_norm": 0.6913329068038451, |
| "learning_rate": 4.959810807093779e-07, |
| "loss": 0.2347, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2543680667877197, |
| "step": 4365, |
| "valid_targets_mean": 4525.6, |
| "valid_targets_min": 554 |
| }, |
| { |
| "epoch": 6.561561561561562, |
| "grad_norm": 0.5451201542998624, |
| "learning_rate": 4.795433255839488e-07, |
| "loss": 0.2049, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21131403744220734, |
| "step": 4370, |
| "valid_targets_mean": 4360.6, |
| "valid_targets_min": 654 |
| }, |
| { |
| "epoch": 6.569069069069069, |
| "grad_norm": 0.47040078136948726, |
| "learning_rate": 4.633792644667967e-07, |
| "loss": 0.1887, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19125640392303467, |
| "step": 4375, |
| "valid_targets_mean": 5975.6, |
| "valid_targets_min": 1693 |
| }, |
| { |
| "epoch": 6.576576576576577, |
| "grad_norm": 0.5920967555082476, |
| "learning_rate": 4.474891239923063e-07, |
| "loss": 0.209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21285581588745117, |
| "step": 4380, |
| "valid_targets_mean": 4406.5, |
| "valid_targets_min": 643 |
| }, |
| { |
| "epoch": 6.584084084084084, |
| "grad_norm": 0.7205742446023933, |
| "learning_rate": 4.318731269542542e-07, |
| "loss": 0.1867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21254310011863708, |
| "step": 4385, |
| "valid_targets_mean": 3167.4, |
| "valid_targets_min": 489 |
| }, |
| { |
| "epoch": 6.591591591591592, |
| "grad_norm": 0.5312844013389322, |
| "learning_rate": 4.1653149230268087e-07, |
| "loss": 0.2147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18900719285011292, |
| "step": 4390, |
| "valid_targets_mean": 4654.4, |
| "valid_targets_min": 479 |
| }, |
| { |
| "epoch": 6.599099099099099, |
| "grad_norm": 0.5723780339209558, |
| "learning_rate": 4.014644351408259e-07, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22007179260253906, |
| "step": 4395, |
| "valid_targets_mean": 4301.8, |
| "valid_targets_min": 879 |
| }, |
| { |
| "epoch": 6.606606606606607, |
| "grad_norm": 0.5052598547107464, |
| "learning_rate": 3.8667216672211515e-07, |
| "loss": 0.2064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17064377665519714, |
| "step": 4400, |
| "valid_targets_mean": 4867.7, |
| "valid_targets_min": 651 |
| }, |
| { |
| "epoch": 6.614114114114114, |
| "grad_norm": 0.7316891946951816, |
| "learning_rate": 3.7215489444718313e-07, |
| "loss": 0.2098, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22059103846549988, |
| "step": 4405, |
| "valid_targets_mean": 2672.8, |
| "valid_targets_min": 724 |
| }, |
| { |
| "epoch": 6.621621621621622, |
| "grad_norm": 0.6761848493284879, |
| "learning_rate": 3.5791282186099064e-07, |
| "loss": 0.2279, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23260068893432617, |
| "step": 4410, |
| "valid_targets_mean": 3445.1, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 6.629129129129129, |
| "grad_norm": 0.6708523109273121, |
| "learning_rate": 3.439461486499451e-07, |
| "loss": 0.2085, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23754608631134033, |
| "step": 4415, |
| "valid_targets_mean": 3454.1, |
| "valid_targets_min": 495 |
| }, |
| { |
| "epoch": 6.636636636636637, |
| "grad_norm": 0.5130944622824821, |
| "learning_rate": 3.302550706391161e-07, |
| "loss": 0.2022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1540905237197876, |
| "step": 4420, |
| "valid_targets_mean": 4449.4, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 6.6441441441441444, |
| "grad_norm": 0.5253445851442728, |
| "learning_rate": 3.168397797894818e-07, |
| "loss": 0.2039, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19345726072788239, |
| "step": 4425, |
| "valid_targets_mean": 5712.4, |
| "valid_targets_min": 814 |
| }, |
| { |
| "epoch": 6.651651651651652, |
| "grad_norm": 0.4999642956754218, |
| "learning_rate": 3.03700464195249e-07, |
| "loss": 0.1771, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1533123254776001, |
| "step": 4430, |
| "valid_targets_mean": 4014.4, |
| "valid_targets_min": 448 |
| }, |
| { |
| "epoch": 6.6591591591591595, |
| "grad_norm": 0.6600694282993609, |
| "learning_rate": 2.9083730808120214e-07, |
| "loss": 0.252, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26119160652160645, |
| "step": 4435, |
| "valid_targets_mean": 3377.4, |
| "valid_targets_min": 445 |
| }, |
| { |
| "epoch": 6.666666666666667, |
| "grad_norm": 0.6967687532254948, |
| "learning_rate": 2.78250491800125e-07, |
| "loss": 0.2081, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1988351047039032, |
| "step": 4440, |
| "valid_targets_mean": 2430.9, |
| "valid_targets_min": 396 |
| }, |
| { |
| "epoch": 6.6741741741741745, |
| "grad_norm": 0.6534875940602458, |
| "learning_rate": 2.6594019183027844e-07, |
| "loss": 0.2099, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2011052370071411, |
| "step": 4445, |
| "valid_targets_mean": 3745.1, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 6.681681681681682, |
| "grad_norm": 0.6527183652558144, |
| "learning_rate": 2.5390658077292017e-07, |
| "loss": 0.2069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19569085538387299, |
| "step": 4450, |
| "valid_targets_mean": 3687.9, |
| "valid_targets_min": 539 |
| }, |
| { |
| "epoch": 6.6891891891891895, |
| "grad_norm": 0.8645812862940178, |
| "learning_rate": 2.4214982734988013e-07, |
| "loss": 0.2033, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22479039430618286, |
| "step": 4455, |
| "valid_targets_mean": 2105.8, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 6.696696696696697, |
| "grad_norm": 0.5255004317144049, |
| "learning_rate": 2.3067009640120652e-07, |
| "loss": 0.2365, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26815474033355713, |
| "step": 4460, |
| "valid_targets_mean": 5218.8, |
| "valid_targets_min": 565 |
| }, |
| { |
| "epoch": 6.7042042042042045, |
| "grad_norm": 0.5916763601809271, |
| "learning_rate": 2.194675488828457e-07, |
| "loss": 0.1791, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1834341287612915, |
| "step": 4465, |
| "valid_targets_mean": 3968.9, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 6.711711711711712, |
| "grad_norm": 0.614175690495789, |
| "learning_rate": 2.0854234186438837e-07, |
| "loss": 0.1942, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24795103073120117, |
| "step": 4470, |
| "valid_targets_mean": 3751.3, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 6.7192192192192195, |
| "grad_norm": 0.5171279571165366, |
| "learning_rate": 1.9789462852686237e-07, |
| "loss": 0.2013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19156940281391144, |
| "step": 4475, |
| "valid_targets_mean": 4793.4, |
| "valid_targets_min": 679 |
| }, |
| { |
| "epoch": 6.726726726726727, |
| "grad_norm": 0.5178172693023037, |
| "learning_rate": 1.875245581605989e-07, |
| "loss": 0.187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16094420850276947, |
| "step": 4480, |
| "valid_targets_mean": 4665.6, |
| "valid_targets_min": 471 |
| }, |
| { |
| "epoch": 6.7342342342342345, |
| "grad_norm": 0.48834241533960204, |
| "learning_rate": 1.7743227616312308e-07, |
| "loss": 0.213, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16197466850280762, |
| "step": 4485, |
| "valid_targets_mean": 4962.2, |
| "valid_targets_min": 1052 |
| }, |
| { |
| "epoch": 6.741741741741742, |
| "grad_norm": 0.5234925189927083, |
| "learning_rate": 1.676179240371245e-07, |
| "loss": 0.1807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16373220086097717, |
| "step": 4490, |
| "valid_targets_mean": 3922.8, |
| "valid_targets_min": 464 |
| }, |
| { |
| "epoch": 6.7492492492492495, |
| "grad_norm": 0.6352684311920057, |
| "learning_rate": 1.5808163938846986e-07, |
| "loss": 0.1976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19435149431228638, |
| "step": 4495, |
| "valid_targets_mean": 3218.4, |
| "valid_targets_min": 478 |
| }, |
| { |
| "epoch": 6.756756756756757, |
| "grad_norm": 0.6229594370415693, |
| "learning_rate": 1.4882355592427344e-07, |
| "loss": 0.191, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16698959469795227, |
| "step": 4500, |
| "valid_targets_mean": 3428.0, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 6.7642642642642645, |
| "grad_norm": 0.6138075392270004, |
| "learning_rate": 1.3984380345102966e-07, |
| "loss": 0.2124, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21965721249580383, |
| "step": 4505, |
| "valid_targets_mean": 3452.5, |
| "valid_targets_min": 408 |
| }, |
| { |
| "epoch": 6.771771771771772, |
| "grad_norm": 0.5674625446735158, |
| "learning_rate": 1.3114250787278128e-07, |
| "loss": 0.2276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17410314083099365, |
| "step": 4510, |
| "valid_targets_mean": 5005.2, |
| "valid_targets_min": 560 |
| }, |
| { |
| "epoch": 6.7792792792792795, |
| "grad_norm": 0.5558176857114882, |
| "learning_rate": 1.2271979118936074e-07, |
| "loss": 0.2114, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17912578582763672, |
| "step": 4515, |
| "valid_targets_mean": 3863.8, |
| "valid_targets_min": 853 |
| }, |
| { |
| "epoch": 6.786786786786787, |
| "grad_norm": 0.635474987483276, |
| "learning_rate": 1.1457577149468268e-07, |
| "loss": 0.1884, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17979639768600464, |
| "step": 4520, |
| "valid_targets_mean": 3391.7, |
| "valid_targets_min": 429 |
| }, |
| { |
| "epoch": 6.7942942942942945, |
| "grad_norm": 0.794907141047451, |
| "learning_rate": 1.0671056297507642e-07, |
| "loss": 0.2055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19865292310714722, |
| "step": 4525, |
| "valid_targets_mean": 2033.5, |
| "valid_targets_min": 584 |
| }, |
| { |
| "epoch": 6.801801801801802, |
| "grad_norm": 0.49215782912003203, |
| "learning_rate": 9.91242759077049e-08, |
| "loss": 0.2204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15488871932029724, |
| "step": 4530, |
| "valid_targets_mean": 4630.8, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 6.8093093093093096, |
| "grad_norm": 0.6173142764754961, |
| "learning_rate": 9.181701665899268e-08, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18007370829582214, |
| "step": 4535, |
| "valid_targets_mean": 4323.4, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 6.816816816816817, |
| "grad_norm": 0.7575394360176801, |
| "learning_rate": 8.47888876831604e-08, |
| "loss": 0.2296, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24876675009727478, |
| "step": 4540, |
| "valid_targets_mean": 3193.3, |
| "valid_targets_min": 277 |
| }, |
| { |
| "epoch": 6.824324324324325, |
| "grad_norm": 0.5819569698944355, |
| "learning_rate": 7.803998752076824e-08, |
| "loss": 0.1881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17346233129501343, |
| "step": 4545, |
| "valid_targets_mean": 5187.9, |
| "valid_targets_min": 643 |
| }, |
| { |
| "epoch": 6.831831831831832, |
| "grad_norm": 0.4396136217756035, |
| "learning_rate": 7.157041079734584e-08, |
| "loss": 0.2325, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18130743503570557, |
| "step": 4550, |
| "valid_targets_mean": 5762.4, |
| "valid_targets_min": 1228 |
| }, |
| { |
| "epoch": 6.83933933933934, |
| "grad_norm": 0.4687226820184863, |
| "learning_rate": 6.538024822206224e-08, |
| "loss": 0.2008, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1852032095193863, |
| "step": 4555, |
| "valid_targets_mean": 5690.4, |
| "valid_targets_min": 702 |
| }, |
| { |
| "epoch": 6.846846846846847, |
| "grad_norm": 0.6527972240202853, |
| "learning_rate": 5.946958658645141e-08, |
| "loss": 0.2255, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21088294684886932, |
| "step": 4560, |
| "valid_targets_mean": 3305.9, |
| "valid_targets_min": 371 |
| }, |
| { |
| "epoch": 6.854354354354355, |
| "grad_norm": 0.5747007613275369, |
| "learning_rate": 5.383850876319763e-08, |
| "loss": 0.1834, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16404512524604797, |
| "step": 4565, |
| "valid_targets_mean": 3822.6, |
| "valid_targets_min": 609 |
| }, |
| { |
| "epoch": 6.861861861861862, |
| "grad_norm": 0.5712891848122477, |
| "learning_rate": 4.848709370498084e-08, |
| "loss": 0.2022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24901172518730164, |
| "step": 4570, |
| "valid_targets_mean": 5079.1, |
| "valid_targets_min": 574 |
| }, |
| { |
| "epoch": 6.86936936936937, |
| "grad_norm": 0.4949929365077814, |
| "learning_rate": 4.34154164433509e-08, |
| "loss": 0.1955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17748858034610748, |
| "step": 4575, |
| "valid_targets_mean": 4491.8, |
| "valid_targets_min": 634 |
| }, |
| { |
| "epoch": 6.876876876876877, |
| "grad_norm": 0.5203752172969807, |
| "learning_rate": 3.86235480876973e-08, |
| "loss": 0.2374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2086370289325714, |
| "step": 4580, |
| "valid_targets_mean": 5460.8, |
| "valid_targets_min": 622 |
| }, |
| { |
| "epoch": 6.884384384384385, |
| "grad_norm": 0.5124535100635832, |
| "learning_rate": 3.411155582423664e-08, |
| "loss": 0.1985, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16645345091819763, |
| "step": 4585, |
| "valid_targets_mean": 4649.4, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 6.891891891891892, |
| "grad_norm": 0.6965621530697311, |
| "learning_rate": 2.9879502915075574e-08, |
| "loss": 0.2214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21695250272750854, |
| "step": 4590, |
| "valid_targets_mean": 3357.6, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 6.8993993993994, |
| "grad_norm": 0.5009549067493665, |
| "learning_rate": 2.592744869732933e-08, |
| "loss": 0.1793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2433704286813736, |
| "step": 4595, |
| "valid_targets_mean": 5021.1, |
| "valid_targets_min": 535 |
| }, |
| { |
| "epoch": 6.906906906906907, |
| "grad_norm": 0.6325006211055703, |
| "learning_rate": 2.2255448582280127e-08, |
| "loss": 0.1923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1930675059556961, |
| "step": 4600, |
| "valid_targets_mean": 3954.0, |
| "valid_targets_min": 562 |
| }, |
| { |
| "epoch": 6.914414414414415, |
| "grad_norm": 0.5272145532637147, |
| "learning_rate": 1.8863554054606715e-08, |
| "loss": 0.1888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1625824272632599, |
| "step": 4605, |
| "valid_targets_mean": 4323.2, |
| "valid_targets_min": 1190 |
| }, |
| { |
| "epoch": 6.921921921921922, |
| "grad_norm": 0.5329661463696542, |
| "learning_rate": 1.5751812671658264e-08, |
| "loss": 0.2071, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19332969188690186, |
| "step": 4610, |
| "valid_targets_mean": 4747.9, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 6.92942942942943, |
| "grad_norm": 0.5417369482444132, |
| "learning_rate": 1.2920268062794894e-08, |
| "loss": 0.2086, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19969046115875244, |
| "step": 4615, |
| "valid_targets_mean": 4192.8, |
| "valid_targets_min": 728 |
| }, |
| { |
| "epoch": 6.936936936936937, |
| "grad_norm": 0.6878033594654033, |
| "learning_rate": 1.0368959928763744e-08, |
| "loss": 0.2053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21517297625541687, |
| "step": 4620, |
| "valid_targets_mean": 3462.9, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 6.944444444444445, |
| "grad_norm": 0.5692311923901623, |
| "learning_rate": 8.097924041157168e-09, |
| "loss": 0.1876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17874173820018768, |
| "step": 4625, |
| "valid_targets_mean": 3834.8, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 6.951951951951952, |
| "grad_norm": 0.8120108501447949, |
| "learning_rate": 6.107192241897597e-09, |
| "loss": 0.1783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19116508960723877, |
| "step": 4630, |
| "valid_targets_mean": 3737.9, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 6.95945945945946, |
| "grad_norm": 0.6343758559646698, |
| "learning_rate": 4.396792442800113e-09, |
| "loss": 0.2174, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2372244894504547, |
| "step": 4635, |
| "valid_targets_mean": 5020.9, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 6.966966966966967, |
| "grad_norm": 0.4747536212588191, |
| "learning_rate": 2.9667486251794274e-09, |
| "loss": 0.1961, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15623793005943298, |
| "step": 4640, |
| "valid_targets_mean": 5340.8, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 6.974474474474475, |
| "grad_norm": 0.4663889436387785, |
| "learning_rate": 1.8170808395079342e-09, |
| "loss": 0.2291, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.204878568649292, |
| "step": 4645, |
| "valid_targets_mean": 5754.1, |
| "valid_targets_min": 2157 |
| }, |
| { |
| "epoch": 6.981981981981982, |
| "grad_norm": 0.5618969419816342, |
| "learning_rate": 9.47805205140373e-10, |
| "loss": 0.196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2027861475944519, |
| "step": 4650, |
| "valid_targets_mean": 4324.8, |
| "valid_targets_min": 736 |
| }, |
| { |
| "epoch": 6.98948948948949, |
| "grad_norm": 0.440752938378733, |
| "learning_rate": 3.589339100917855e-10, |
| "loss": 0.1985, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21129390597343445, |
| "step": 4655, |
| "valid_targets_mean": 6267.5, |
| "valid_targets_min": 686 |
| }, |
| { |
| "epoch": 6.996996996996997, |
| "grad_norm": 0.5759092607170879, |
| "learning_rate": 5.0475210853218045e-11, |
| "loss": 0.2195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21579566597938538, |
| "step": 4660, |
| "valid_targets_mean": 4775.2, |
| "valid_targets_min": 824 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1870056539773941, |
| "step": 4662, |
| "total_flos": 1420700030337024.0, |
| "train_loss": 0.25631797409579254, |
| "train_runtime": 31285.8836, |
| "train_samples_per_second": 2.384, |
| "train_steps_per_second": 0.149, |
| "valid_targets_mean": 4345.4, |
| "valid_targets_min": 624 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 4662, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 1500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 1420700030337024.0, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|