| { |
| "best_global_step": null, |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 7.0, |
| "eval_steps": 500, |
| "global_step": 4515, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.007751937984496124, |
| "grad_norm": 10.737414411251518, |
| "learning_rate": 3.5398230088495575e-07, |
| "loss": 0.6122, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5790383219718933, |
| "step": 5, |
| "valid_targets_mean": 5473.9, |
| "valid_targets_min": 2003 |
| }, |
| { |
| "epoch": 0.015503875968992248, |
| "grad_norm": 12.969006644336845, |
| "learning_rate": 7.964601769911505e-07, |
| "loss": 0.6056, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6179184317588806, |
| "step": 10, |
| "valid_targets_mean": 4275.1, |
| "valid_targets_min": 2399 |
| }, |
| { |
| "epoch": 0.023255813953488372, |
| "grad_norm": 10.73852678993892, |
| "learning_rate": 1.2389380530973452e-06, |
| "loss": 0.6059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6460979580879211, |
| "step": 15, |
| "valid_targets_mean": 5231.6, |
| "valid_targets_min": 343 |
| }, |
| { |
| "epoch": 0.031007751937984496, |
| "grad_norm": 10.022340877272923, |
| "learning_rate": 1.68141592920354e-06, |
| "loss": 0.5736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5392199158668518, |
| "step": 20, |
| "valid_targets_mean": 5241.8, |
| "valid_targets_min": 310 |
| }, |
| { |
| "epoch": 0.03875968992248062, |
| "grad_norm": 5.037849526968358, |
| "learning_rate": 2.1238938053097345e-06, |
| "loss": 0.4978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3818526268005371, |
| "step": 25, |
| "valid_targets_mean": 5527.9, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 0.046511627906976744, |
| "grad_norm": 4.262678982312242, |
| "learning_rate": 2.5663716814159294e-06, |
| "loss": 0.5324, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.6495624780654907, |
| "step": 30, |
| "valid_targets_mean": 3715.2, |
| "valid_targets_min": 408 |
| }, |
| { |
| "epoch": 0.05426356589147287, |
| "grad_norm": 2.3482137938148466, |
| "learning_rate": 3.0088495575221242e-06, |
| "loss": 0.4639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.5476200580596924, |
| "step": 35, |
| "valid_targets_mean": 5361.5, |
| "valid_targets_min": 2437 |
| }, |
| { |
| "epoch": 0.06201550387596899, |
| "grad_norm": 1.46476205992856, |
| "learning_rate": 3.4513274336283186e-06, |
| "loss": 0.4293, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.46131038665771484, |
| "step": 40, |
| "valid_targets_mean": 5086.5, |
| "valid_targets_min": 272 |
| }, |
| { |
| "epoch": 0.06976744186046512, |
| "grad_norm": 1.3283216378548661, |
| "learning_rate": 3.8938053097345135e-06, |
| "loss": 0.4646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.44244861602783203, |
| "step": 45, |
| "valid_targets_mean": 3978.5, |
| "valid_targets_min": 1865 |
| }, |
| { |
| "epoch": 0.07751937984496124, |
| "grad_norm": 1.0028919580355764, |
| "learning_rate": 4.336283185840709e-06, |
| "loss": 0.4339, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.4484736919403076, |
| "step": 50, |
| "valid_targets_mean": 5080.6, |
| "valid_targets_min": 2468 |
| }, |
| { |
| "epoch": 0.08527131782945736, |
| "grad_norm": 0.8265483597929661, |
| "learning_rate": 4.778761061946903e-06, |
| "loss": 0.3985, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.43008673191070557, |
| "step": 55, |
| "valid_targets_mean": 4308.8, |
| "valid_targets_min": 598 |
| }, |
| { |
| "epoch": 0.09302325581395349, |
| "grad_norm": 0.7109955989422742, |
| "learning_rate": 5.2212389380530985e-06, |
| "loss": 0.3726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34888190031051636, |
| "step": 60, |
| "valid_targets_mean": 4633.4, |
| "valid_targets_min": 2442 |
| }, |
| { |
| "epoch": 0.10077519379844961, |
| "grad_norm": 0.655988135659704, |
| "learning_rate": 5.663716814159292e-06, |
| "loss": 0.3799, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.34532463550567627, |
| "step": 65, |
| "valid_targets_mean": 3801.8, |
| "valid_targets_min": 299 |
| }, |
| { |
| "epoch": 0.10852713178294573, |
| "grad_norm": 0.5932763195572598, |
| "learning_rate": 6.1061946902654865e-06, |
| "loss": 0.3585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.32048162817955017, |
| "step": 70, |
| "valid_targets_mean": 4474.1, |
| "valid_targets_min": 1430 |
| }, |
| { |
| "epoch": 0.11627906976744186, |
| "grad_norm": 0.5372600166593284, |
| "learning_rate": 6.548672566371682e-06, |
| "loss": 0.3061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3458303213119507, |
| "step": 75, |
| "valid_targets_mean": 5349.9, |
| "valid_targets_min": 2632 |
| }, |
| { |
| "epoch": 0.12403100775193798, |
| "grad_norm": 0.5539936993292226, |
| "learning_rate": 6.991150442477876e-06, |
| "loss": 0.357, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3393269181251526, |
| "step": 80, |
| "valid_targets_mean": 4613.9, |
| "valid_targets_min": 642 |
| }, |
| { |
| "epoch": 0.13178294573643412, |
| "grad_norm": 0.5623006682180124, |
| "learning_rate": 7.4336283185840714e-06, |
| "loss": 0.348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.37088829278945923, |
| "step": 85, |
| "valid_targets_mean": 5265.9, |
| "valid_targets_min": 2035 |
| }, |
| { |
| "epoch": 0.13953488372093023, |
| "grad_norm": 0.5992837863592103, |
| "learning_rate": 7.876106194690266e-06, |
| "loss": 0.3268, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.35172638297080994, |
| "step": 90, |
| "valid_targets_mean": 4771.9, |
| "valid_targets_min": 1048 |
| }, |
| { |
| "epoch": 0.14728682170542637, |
| "grad_norm": 0.45192427418479936, |
| "learning_rate": 8.31858407079646e-06, |
| "loss": 0.3372, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3198494017124176, |
| "step": 95, |
| "valid_targets_mean": 5918.0, |
| "valid_targets_min": 368 |
| }, |
| { |
| "epoch": 0.15503875968992248, |
| "grad_norm": 0.625926887246749, |
| "learning_rate": 8.761061946902656e-06, |
| "loss": 0.3209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.40857595205307007, |
| "step": 100, |
| "valid_targets_mean": 5248.5, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 0.16279069767441862, |
| "grad_norm": 0.6811575704902189, |
| "learning_rate": 9.203539823008851e-06, |
| "loss": 0.3315, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.38290804624557495, |
| "step": 105, |
| "valid_targets_mean": 4731.9, |
| "valid_targets_min": 422 |
| }, |
| { |
| "epoch": 0.17054263565891473, |
| "grad_norm": 0.5566478870304039, |
| "learning_rate": 9.646017699115045e-06, |
| "loss": 0.3422, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.313689649105072, |
| "step": 110, |
| "valid_targets_mean": 4493.0, |
| "valid_targets_min": 485 |
| }, |
| { |
| "epoch": 0.17829457364341086, |
| "grad_norm": 0.41287589462882723, |
| "learning_rate": 1.008849557522124e-05, |
| "loss": 0.2705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23904478549957275, |
| "step": 115, |
| "valid_targets_mean": 4980.3, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 0.18604651162790697, |
| "grad_norm": 0.522088179939139, |
| "learning_rate": 1.0530973451327436e-05, |
| "loss": 0.3139, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.31741863489151, |
| "step": 120, |
| "valid_targets_mean": 3859.9, |
| "valid_targets_min": 361 |
| }, |
| { |
| "epoch": 0.1937984496124031, |
| "grad_norm": 0.5022551201886791, |
| "learning_rate": 1.0973451327433629e-05, |
| "loss": 0.2936, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29989367723464966, |
| "step": 125, |
| "valid_targets_mean": 4806.8, |
| "valid_targets_min": 2268 |
| }, |
| { |
| "epoch": 0.20155038759689922, |
| "grad_norm": 0.43337385085835556, |
| "learning_rate": 1.1415929203539825e-05, |
| "loss": 0.316, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26593732833862305, |
| "step": 130, |
| "valid_targets_mean": 5703.4, |
| "valid_targets_min": 861 |
| }, |
| { |
| "epoch": 0.20930232558139536, |
| "grad_norm": 0.5362034077276845, |
| "learning_rate": 1.1858407079646019e-05, |
| "loss": 0.2958, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26804763078689575, |
| "step": 135, |
| "valid_targets_mean": 5329.9, |
| "valid_targets_min": 436 |
| }, |
| { |
| "epoch": 0.21705426356589147, |
| "grad_norm": 0.7869829849569835, |
| "learning_rate": 1.2300884955752212e-05, |
| "loss": 0.295, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2954621911048889, |
| "step": 140, |
| "valid_targets_mean": 4087.9, |
| "valid_targets_min": 367 |
| }, |
| { |
| "epoch": 0.2248062015503876, |
| "grad_norm": 0.4284133599416018, |
| "learning_rate": 1.2743362831858408e-05, |
| "loss": 0.2592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22574186325073242, |
| "step": 145, |
| "valid_targets_mean": 4778.1, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 0.23255813953488372, |
| "grad_norm": 0.43346642775630995, |
| "learning_rate": 1.3185840707964604e-05, |
| "loss": 0.265, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2442144900560379, |
| "step": 150, |
| "valid_targets_mean": 4813.1, |
| "valid_targets_min": 370 |
| }, |
| { |
| "epoch": 0.24031007751937986, |
| "grad_norm": 0.4612125175821135, |
| "learning_rate": 1.3628318584070797e-05, |
| "loss": 0.2645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25243520736694336, |
| "step": 155, |
| "valid_targets_mean": 4157.1, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 0.24806201550387597, |
| "grad_norm": 0.4456387275424371, |
| "learning_rate": 1.4070796460176991e-05, |
| "loss": 0.3351, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28738337755203247, |
| "step": 160, |
| "valid_targets_mean": 5481.4, |
| "valid_targets_min": 1940 |
| }, |
| { |
| "epoch": 0.2558139534883721, |
| "grad_norm": 0.5654786805272515, |
| "learning_rate": 1.4513274336283187e-05, |
| "loss": 0.2997, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3355092406272888, |
| "step": 165, |
| "valid_targets_mean": 5211.9, |
| "valid_targets_min": 1841 |
| }, |
| { |
| "epoch": 0.26356589147286824, |
| "grad_norm": 0.4528552978301014, |
| "learning_rate": 1.4955752212389383e-05, |
| "loss": 0.2687, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24449273943901062, |
| "step": 170, |
| "valid_targets_mean": 4395.9, |
| "valid_targets_min": 716 |
| }, |
| { |
| "epoch": 0.2713178294573643, |
| "grad_norm": 0.5070510356795248, |
| "learning_rate": 1.5398230088495576e-05, |
| "loss": 0.2736, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2762889266014099, |
| "step": 175, |
| "valid_targets_mean": 5060.6, |
| "valid_targets_min": 332 |
| }, |
| { |
| "epoch": 0.27906976744186046, |
| "grad_norm": 0.4109586147637433, |
| "learning_rate": 1.5840707964601772e-05, |
| "loss": 0.2469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27871203422546387, |
| "step": 180, |
| "valid_targets_mean": 5762.0, |
| "valid_targets_min": 317 |
| }, |
| { |
| "epoch": 0.2868217054263566, |
| "grad_norm": 0.5312588834611185, |
| "learning_rate": 1.628318584070797e-05, |
| "loss": 0.2602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21110810339450836, |
| "step": 185, |
| "valid_targets_mean": 4100.6, |
| "valid_targets_min": 312 |
| }, |
| { |
| "epoch": 0.29457364341085274, |
| "grad_norm": 0.5125684260379816, |
| "learning_rate": 1.672566371681416e-05, |
| "loss": 0.2584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2507615089416504, |
| "step": 190, |
| "valid_targets_mean": 4268.3, |
| "valid_targets_min": 2439 |
| }, |
| { |
| "epoch": 0.3023255813953488, |
| "grad_norm": 0.6649775832883916, |
| "learning_rate": 1.7168141592920354e-05, |
| "loss": 0.2877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.41589394211769104, |
| "step": 195, |
| "valid_targets_mean": 3739.2, |
| "valid_targets_min": 536 |
| }, |
| { |
| "epoch": 0.31007751937984496, |
| "grad_norm": 0.5366482871518907, |
| "learning_rate": 1.761061946902655e-05, |
| "loss": 0.2587, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27435043454170227, |
| "step": 200, |
| "valid_targets_mean": 5772.8, |
| "valid_targets_min": 2700 |
| }, |
| { |
| "epoch": 0.3178294573643411, |
| "grad_norm": 0.5074784266785846, |
| "learning_rate": 1.8053097345132743e-05, |
| "loss": 0.281, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2721036970615387, |
| "step": 205, |
| "valid_targets_mean": 4397.0, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 0.32558139534883723, |
| "grad_norm": 0.614506165275271, |
| "learning_rate": 1.849557522123894e-05, |
| "loss": 0.2917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30919021368026733, |
| "step": 210, |
| "valid_targets_mean": 4218.9, |
| "valid_targets_min": 472 |
| }, |
| { |
| "epoch": 0.3333333333333333, |
| "grad_norm": 0.5419591558618669, |
| "learning_rate": 1.8938053097345135e-05, |
| "loss": 0.2622, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23832359910011292, |
| "step": 215, |
| "valid_targets_mean": 5124.2, |
| "valid_targets_min": 2981 |
| }, |
| { |
| "epoch": 0.34108527131782945, |
| "grad_norm": 0.5664964725729073, |
| "learning_rate": 1.9380530973451328e-05, |
| "loss": 0.2701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2373562753200531, |
| "step": 220, |
| "valid_targets_mean": 3882.1, |
| "valid_targets_min": 282 |
| }, |
| { |
| "epoch": 0.3488372093023256, |
| "grad_norm": 0.4209274671883887, |
| "learning_rate": 1.9823008849557524e-05, |
| "loss": 0.2434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1936969757080078, |
| "step": 225, |
| "valid_targets_mean": 5481.6, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 0.35658914728682173, |
| "grad_norm": 0.5074693857643466, |
| "learning_rate": 2.0265486725663717e-05, |
| "loss": 0.253, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25986820459365845, |
| "step": 230, |
| "valid_targets_mean": 5012.3, |
| "valid_targets_min": 1855 |
| }, |
| { |
| "epoch": 0.3643410852713178, |
| "grad_norm": 0.5512784168137245, |
| "learning_rate": 2.0707964601769913e-05, |
| "loss": 0.2588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27459990978240967, |
| "step": 235, |
| "valid_targets_mean": 4073.4, |
| "valid_targets_min": 477 |
| }, |
| { |
| "epoch": 0.37209302325581395, |
| "grad_norm": 0.4347839613276555, |
| "learning_rate": 2.115044247787611e-05, |
| "loss": 0.2616, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24624979496002197, |
| "step": 240, |
| "valid_targets_mean": 5311.7, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 0.3798449612403101, |
| "grad_norm": 0.5190963993227697, |
| "learning_rate": 2.15929203539823e-05, |
| "loss": 0.2566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.252674400806427, |
| "step": 245, |
| "valid_targets_mean": 4257.4, |
| "valid_targets_min": 2687 |
| }, |
| { |
| "epoch": 0.3875968992248062, |
| "grad_norm": 0.5887863557318684, |
| "learning_rate": 2.2035398230088498e-05, |
| "loss": 0.2831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.33351632952690125, |
| "step": 250, |
| "valid_targets_mean": 5280.2, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 0.3953488372093023, |
| "grad_norm": 0.5068755318361087, |
| "learning_rate": 2.247787610619469e-05, |
| "loss": 0.2454, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20935970544815063, |
| "step": 255, |
| "valid_targets_mean": 4357.3, |
| "valid_targets_min": 365 |
| }, |
| { |
| "epoch": 0.40310077519379844, |
| "grad_norm": 0.4660973149935113, |
| "learning_rate": 2.2920353982300883e-05, |
| "loss": 0.2583, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2345641404390335, |
| "step": 260, |
| "valid_targets_mean": 4675.7, |
| "valid_targets_min": 472 |
| }, |
| { |
| "epoch": 0.4108527131782946, |
| "grad_norm": 0.4943641747428354, |
| "learning_rate": 2.3362831858407083e-05, |
| "loss": 0.2525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25245875120162964, |
| "step": 265, |
| "valid_targets_mean": 4586.7, |
| "valid_targets_min": 336 |
| }, |
| { |
| "epoch": 0.4186046511627907, |
| "grad_norm": 0.5733463209321147, |
| "learning_rate": 2.3805309734513275e-05, |
| "loss": 0.256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2648470103740692, |
| "step": 270, |
| "valid_targets_mean": 4878.5, |
| "valid_targets_min": 1433 |
| }, |
| { |
| "epoch": 0.4263565891472868, |
| "grad_norm": 0.5797109099250628, |
| "learning_rate": 2.424778761061947e-05, |
| "loss": 0.2686, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23868052661418915, |
| "step": 275, |
| "valid_targets_mean": 4204.3, |
| "valid_targets_min": 1999 |
| }, |
| { |
| "epoch": 0.43410852713178294, |
| "grad_norm": 0.5102454710373611, |
| "learning_rate": 2.4690265486725668e-05, |
| "loss": 0.2299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19877958297729492, |
| "step": 280, |
| "valid_targets_mean": 4676.9, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 0.4418604651162791, |
| "grad_norm": 0.5432212420309249, |
| "learning_rate": 2.513274336283186e-05, |
| "loss": 0.2822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30621248483657837, |
| "step": 285, |
| "valid_targets_mean": 4931.0, |
| "valid_targets_min": 1914 |
| }, |
| { |
| "epoch": 0.4496124031007752, |
| "grad_norm": 0.5173046537936798, |
| "learning_rate": 2.5575221238938056e-05, |
| "loss": 0.236, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2177397459745407, |
| "step": 290, |
| "valid_targets_mean": 3951.5, |
| "valid_targets_min": 1846 |
| }, |
| { |
| "epoch": 0.4573643410852713, |
| "grad_norm": 0.47098388353840676, |
| "learning_rate": 2.601769911504425e-05, |
| "loss": 0.2311, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23170709609985352, |
| "step": 295, |
| "valid_targets_mean": 5152.0, |
| "valid_targets_min": 285 |
| }, |
| { |
| "epoch": 0.46511627906976744, |
| "grad_norm": 0.5012563709590744, |
| "learning_rate": 2.6460176991150442e-05, |
| "loss": 0.2354, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2445349246263504, |
| "step": 300, |
| "valid_targets_mean": 4086.8, |
| "valid_targets_min": 568 |
| }, |
| { |
| "epoch": 0.4728682170542636, |
| "grad_norm": 0.7598417766003686, |
| "learning_rate": 2.690265486725664e-05, |
| "loss": 0.2685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2794634699821472, |
| "step": 305, |
| "valid_targets_mean": 6700.9, |
| "valid_targets_min": 2494 |
| }, |
| { |
| "epoch": 0.4806201550387597, |
| "grad_norm": 0.48809284746866477, |
| "learning_rate": 2.7345132743362834e-05, |
| "loss": 0.251, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23253998160362244, |
| "step": 310, |
| "valid_targets_mean": 4574.2, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 0.4883720930232558, |
| "grad_norm": 0.5629581496018895, |
| "learning_rate": 2.7787610619469027e-05, |
| "loss": 0.2549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.275101900100708, |
| "step": 315, |
| "valid_targets_mean": 4482.4, |
| "valid_targets_min": 380 |
| }, |
| { |
| "epoch": 0.49612403100775193, |
| "grad_norm": 0.5149842618437763, |
| "learning_rate": 2.8230088495575226e-05, |
| "loss": 0.241, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26416015625, |
| "step": 320, |
| "valid_targets_mean": 4816.7, |
| "valid_targets_min": 2959 |
| }, |
| { |
| "epoch": 0.5038759689922481, |
| "grad_norm": 0.5415600825598276, |
| "learning_rate": 2.867256637168142e-05, |
| "loss": 0.2523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2811618149280548, |
| "step": 325, |
| "valid_targets_mean": 5667.7, |
| "valid_targets_min": 559 |
| }, |
| { |
| "epoch": 0.5116279069767442, |
| "grad_norm": 0.5507831167513966, |
| "learning_rate": 2.9115044247787612e-05, |
| "loss": 0.2434, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2697560787200928, |
| "step": 330, |
| "valid_targets_mean": 4328.9, |
| "valid_targets_min": 314 |
| }, |
| { |
| "epoch": 0.5193798449612403, |
| "grad_norm": 0.444364635402833, |
| "learning_rate": 2.9557522123893808e-05, |
| "loss": 0.2478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26696139574050903, |
| "step": 335, |
| "valid_targets_mean": 5249.1, |
| "valid_targets_min": 216 |
| }, |
| { |
| "epoch": 0.5271317829457365, |
| "grad_norm": 0.5882361391451728, |
| "learning_rate": 3.0000000000000004e-05, |
| "loss": 0.2576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2548302412033081, |
| "step": 340, |
| "valid_targets_mean": 3739.8, |
| "valid_targets_min": 2192 |
| }, |
| { |
| "epoch": 0.5348837209302325, |
| "grad_norm": 0.5152875122005142, |
| "learning_rate": 3.0442477876106197e-05, |
| "loss": 0.2569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23482279479503632, |
| "step": 345, |
| "valid_targets_mean": 3619.9, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 0.5426356589147286, |
| "grad_norm": 0.4815633298934971, |
| "learning_rate": 3.0884955752212396e-05, |
| "loss": 0.2373, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2350481003522873, |
| "step": 350, |
| "valid_targets_mean": 4721.2, |
| "valid_targets_min": 1866 |
| }, |
| { |
| "epoch": 0.5503875968992248, |
| "grad_norm": 0.4648544079642719, |
| "learning_rate": 3.132743362831859e-05, |
| "loss": 0.2243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.181733176112175, |
| "step": 355, |
| "valid_targets_mean": 5043.9, |
| "valid_targets_min": 1925 |
| }, |
| { |
| "epoch": 0.5581395348837209, |
| "grad_norm": 0.5037726577202668, |
| "learning_rate": 3.176991150442478e-05, |
| "loss": 0.2506, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29893919825553894, |
| "step": 360, |
| "valid_targets_mean": 4146.6, |
| "valid_targets_min": 419 |
| }, |
| { |
| "epoch": 0.5658914728682171, |
| "grad_norm": 0.4516342191965917, |
| "learning_rate": 3.2212389380530975e-05, |
| "loss": 0.269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.251533180475235, |
| "step": 365, |
| "valid_targets_mean": 5648.9, |
| "valid_targets_min": 1948 |
| }, |
| { |
| "epoch": 0.5736434108527132, |
| "grad_norm": 0.510314234160131, |
| "learning_rate": 3.265486725663717e-05, |
| "loss": 0.2389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2301664650440216, |
| "step": 370, |
| "valid_targets_mean": 4642.9, |
| "valid_targets_min": 357 |
| }, |
| { |
| "epoch": 0.5813953488372093, |
| "grad_norm": 0.5221420257676286, |
| "learning_rate": 3.309734513274337e-05, |
| "loss": 0.254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25842761993408203, |
| "step": 375, |
| "valid_targets_mean": 5166.7, |
| "valid_targets_min": 330 |
| }, |
| { |
| "epoch": 0.5891472868217055, |
| "grad_norm": 0.47841880099325107, |
| "learning_rate": 3.353982300884956e-05, |
| "loss": 0.2427, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23205696046352386, |
| "step": 380, |
| "valid_targets_mean": 4452.9, |
| "valid_targets_min": 2554 |
| }, |
| { |
| "epoch": 0.5968992248062015, |
| "grad_norm": 0.607600902063009, |
| "learning_rate": 3.398230088495575e-05, |
| "loss": 0.2396, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23086626827716827, |
| "step": 385, |
| "valid_targets_mean": 4332.0, |
| "valid_targets_min": 2478 |
| }, |
| { |
| "epoch": 0.6046511627906976, |
| "grad_norm": 0.5649861293006265, |
| "learning_rate": 3.4424778761061945e-05, |
| "loss": 0.2331, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2606998682022095, |
| "step": 390, |
| "valid_targets_mean": 3863.3, |
| "valid_targets_min": 355 |
| }, |
| { |
| "epoch": 0.6124031007751938, |
| "grad_norm": 0.5467855289956822, |
| "learning_rate": 3.4867256637168145e-05, |
| "loss": 0.2519, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24656961858272552, |
| "step": 395, |
| "valid_targets_mean": 4666.2, |
| "valid_targets_min": 1840 |
| }, |
| { |
| "epoch": 0.6201550387596899, |
| "grad_norm": 0.4033482565091616, |
| "learning_rate": 3.530973451327434e-05, |
| "loss": 0.2317, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19554291665554047, |
| "step": 400, |
| "valid_targets_mean": 5451.3, |
| "valid_targets_min": 285 |
| }, |
| { |
| "epoch": 0.627906976744186, |
| "grad_norm": 0.408434222869372, |
| "learning_rate": 3.575221238938053e-05, |
| "loss": 0.2523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20927652716636658, |
| "step": 405, |
| "valid_targets_mean": 5175.1, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 0.6356589147286822, |
| "grad_norm": 0.5142450144995636, |
| "learning_rate": 3.619469026548673e-05, |
| "loss": 0.2522, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.28972408175468445, |
| "step": 410, |
| "valid_targets_mean": 4840.2, |
| "valid_targets_min": 330 |
| }, |
| { |
| "epoch": 0.6434108527131783, |
| "grad_norm": 0.5130835281170955, |
| "learning_rate": 3.663716814159292e-05, |
| "loss": 0.271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27192896604537964, |
| "step": 415, |
| "valid_targets_mean": 4130.9, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 0.6511627906976745, |
| "grad_norm": 0.5264620060585927, |
| "learning_rate": 3.707964601769912e-05, |
| "loss": 0.2475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.30271440744400024, |
| "step": 420, |
| "valid_targets_mean": 4858.8, |
| "valid_targets_min": 566 |
| }, |
| { |
| "epoch": 0.6589147286821705, |
| "grad_norm": 0.48973643965756275, |
| "learning_rate": 3.7522123893805314e-05, |
| "loss": 0.2348, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19385236501693726, |
| "step": 425, |
| "valid_targets_mean": 4338.8, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 0.6666666666666666, |
| "grad_norm": 0.47842223367968456, |
| "learning_rate": 3.796460176991151e-05, |
| "loss": 0.2404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24353685975074768, |
| "step": 430, |
| "valid_targets_mean": 4000.3, |
| "valid_targets_min": 2352 |
| }, |
| { |
| "epoch": 0.6744186046511628, |
| "grad_norm": 0.45816881401918463, |
| "learning_rate": 3.840707964601771e-05, |
| "loss": 0.2455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2597430646419525, |
| "step": 435, |
| "valid_targets_mean": 5271.6, |
| "valid_targets_min": 2162 |
| }, |
| { |
| "epoch": 0.6821705426356589, |
| "grad_norm": 0.6017326535707582, |
| "learning_rate": 3.88495575221239e-05, |
| "loss": 0.2444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24369432032108307, |
| "step": 440, |
| "valid_targets_mean": 3065.4, |
| "valid_targets_min": 304 |
| }, |
| { |
| "epoch": 0.689922480620155, |
| "grad_norm": 0.5404602142547137, |
| "learning_rate": 3.929203539823009e-05, |
| "loss": 0.2078, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.256170392036438, |
| "step": 445, |
| "valid_targets_mean": 3592.6, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 0.6976744186046512, |
| "grad_norm": 0.4154279511759285, |
| "learning_rate": 3.9734513274336285e-05, |
| "loss": 0.2272, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21489651501178741, |
| "step": 450, |
| "valid_targets_mean": 4713.6, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 0.7054263565891473, |
| "grad_norm": 0.3730389962722997, |
| "learning_rate": 3.999997608524118e-05, |
| "loss": 0.2123, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1950041949748993, |
| "step": 455, |
| "valid_targets_mean": 6850.4, |
| "valid_targets_min": 2445 |
| }, |
| { |
| "epoch": 0.7131782945736435, |
| "grad_norm": 0.5017736757425001, |
| "learning_rate": 3.999970704486118e-05, |
| "loss": 0.2408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2439410388469696, |
| "step": 460, |
| "valid_targets_mean": 4726.7, |
| "valid_targets_min": 1933 |
| }, |
| { |
| "epoch": 0.7209302325581395, |
| "grad_norm": 0.5145474700945507, |
| "learning_rate": 3.999913907468731e-05, |
| "loss": 0.2448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2903444170951843, |
| "step": 465, |
| "valid_targets_mean": 3954.4, |
| "valid_targets_min": 606 |
| }, |
| { |
| "epoch": 0.7286821705426356, |
| "grad_norm": 0.39985614862149943, |
| "learning_rate": 3.9998272183208866e-05, |
| "loss": 0.242, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23064105212688446, |
| "step": 470, |
| "valid_targets_mean": 5725.1, |
| "valid_targets_min": 1885 |
| }, |
| { |
| "epoch": 0.7364341085271318, |
| "grad_norm": 0.47106899849704376, |
| "learning_rate": 3.999710638338303e-05, |
| "loss": 0.2096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2777732014656067, |
| "step": 475, |
| "valid_targets_mean": 4932.4, |
| "valid_targets_min": 2437 |
| }, |
| { |
| "epoch": 0.7441860465116279, |
| "grad_norm": 0.5041908945885922, |
| "learning_rate": 3.999564169263465e-05, |
| "loss": 0.2204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22737307846546173, |
| "step": 480, |
| "valid_targets_mean": 4427.4, |
| "valid_targets_min": 1030 |
| }, |
| { |
| "epoch": 0.751937984496124, |
| "grad_norm": 0.49803283079798477, |
| "learning_rate": 3.9993878132856044e-05, |
| "loss": 0.2328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2756238579750061, |
| "step": 485, |
| "valid_targets_mean": 4327.5, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 0.7596899224806202, |
| "grad_norm": 0.4206493823677622, |
| "learning_rate": 3.999181573040663e-05, |
| "loss": 0.2214, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2046414017677307, |
| "step": 490, |
| "valid_targets_mean": 5396.8, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 0.7674418604651163, |
| "grad_norm": 0.4197719415269444, |
| "learning_rate": 3.9989454516112524e-05, |
| "loss": 0.25, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2041558027267456, |
| "step": 495, |
| "valid_targets_mean": 4688.8, |
| "valid_targets_min": 527 |
| }, |
| { |
| "epoch": 0.7751937984496124, |
| "grad_norm": 0.49956665072862294, |
| "learning_rate": 3.9986794525266115e-05, |
| "loss": 0.2538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2720697820186615, |
| "step": 500, |
| "valid_targets_mean": 4991.1, |
| "valid_targets_min": 2320 |
| }, |
| { |
| "epoch": 0.7829457364341085, |
| "grad_norm": 0.5668838261772827, |
| "learning_rate": 3.998383579762552e-05, |
| "loss": 0.2275, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22524034976959229, |
| "step": 505, |
| "valid_targets_mean": 4758.6, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 0.7906976744186046, |
| "grad_norm": 0.4067566904060681, |
| "learning_rate": 3.998057837741396e-05, |
| "loss": 0.2368, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20347392559051514, |
| "step": 510, |
| "valid_targets_mean": 5299.1, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 0.7984496124031008, |
| "grad_norm": 0.4983262141277965, |
| "learning_rate": 3.997702231331917e-05, |
| "loss": 0.2254, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22835250198841095, |
| "step": 515, |
| "valid_targets_mean": 4676.3, |
| "valid_targets_min": 1825 |
| }, |
| { |
| "epoch": 0.8062015503875969, |
| "grad_norm": 0.4874737761112375, |
| "learning_rate": 3.9973167658492577e-05, |
| "loss": 0.2326, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1982721984386444, |
| "step": 520, |
| "valid_targets_mean": 3951.7, |
| "valid_targets_min": 308 |
| }, |
| { |
| "epoch": 0.813953488372093, |
| "grad_norm": 0.4874095166955721, |
| "learning_rate": 3.99690144705486e-05, |
| "loss": 0.2588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27957573533058167, |
| "step": 525, |
| "valid_targets_mean": 4523.2, |
| "valid_targets_min": 630 |
| }, |
| { |
| "epoch": 0.8217054263565892, |
| "grad_norm": 0.46829582316727847, |
| "learning_rate": 3.996456281156372e-05, |
| "loss": 0.2304, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2339038848876953, |
| "step": 530, |
| "valid_targets_mean": 4400.8, |
| "valid_targets_min": 996 |
| }, |
| { |
| "epoch": 0.8294573643410853, |
| "grad_norm": 0.4173667508062997, |
| "learning_rate": 3.995981274807561e-05, |
| "loss": 0.2288, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19771169126033783, |
| "step": 535, |
| "valid_targets_mean": 4821.5, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 0.8372093023255814, |
| "grad_norm": 0.4998240530264507, |
| "learning_rate": 3.995476435108205e-05, |
| "loss": 0.2204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23739448189735413, |
| "step": 540, |
| "valid_targets_mean": 3693.3, |
| "valid_targets_min": 527 |
| }, |
| { |
| "epoch": 0.8449612403100775, |
| "grad_norm": 0.40077148780586164, |
| "learning_rate": 3.994941769603999e-05, |
| "loss": 0.2402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25493863224983215, |
| "step": 545, |
| "valid_targets_mean": 6980.4, |
| "valid_targets_min": 3136 |
| }, |
| { |
| "epoch": 0.8527131782945736, |
| "grad_norm": 0.5106995708311232, |
| "learning_rate": 3.9943772862864303e-05, |
| "loss": 0.248, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.295318067073822, |
| "step": 550, |
| "valid_targets_mean": 4588.8, |
| "valid_targets_min": 2486 |
| }, |
| { |
| "epoch": 0.8604651162790697, |
| "grad_norm": 0.4775850652610667, |
| "learning_rate": 3.993782993592668e-05, |
| "loss": 0.2244, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2367231398820877, |
| "step": 555, |
| "valid_targets_mean": 4133.6, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 0.8682170542635659, |
| "grad_norm": 0.4680021737678082, |
| "learning_rate": 3.9931589004054305e-05, |
| "loss": 0.2394, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23238858580589294, |
| "step": 560, |
| "valid_targets_mean": 4216.1, |
| "valid_targets_min": 516 |
| }, |
| { |
| "epoch": 0.875968992248062, |
| "grad_norm": 0.5582382675085276, |
| "learning_rate": 3.992505016052858e-05, |
| "loss": 0.2275, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24689146876335144, |
| "step": 565, |
| "valid_targets_mean": 4033.6, |
| "valid_targets_min": 1922 |
| }, |
| { |
| "epoch": 0.8837209302325582, |
| "grad_norm": 0.48825810766144667, |
| "learning_rate": 3.991821350308369e-05, |
| "loss": 0.2269, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23387084901332855, |
| "step": 570, |
| "valid_targets_mean": 4010.4, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 0.8914728682170543, |
| "grad_norm": 0.3468810555031447, |
| "learning_rate": 3.991107913390516e-05, |
| "loss": 0.2017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16606643795967102, |
| "step": 575, |
| "valid_targets_mean": 6431.9, |
| "valid_targets_min": 2510 |
| }, |
| { |
| "epoch": 0.8992248062015504, |
| "grad_norm": 0.4163415879240496, |
| "learning_rate": 3.990364715962833e-05, |
| "loss": 0.2258, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1997481882572174, |
| "step": 580, |
| "valid_targets_mean": 5320.4, |
| "valid_targets_min": 2104 |
| }, |
| { |
| "epoch": 0.9069767441860465, |
| "grad_norm": 0.5473724440573992, |
| "learning_rate": 3.989591769133675e-05, |
| "loss": 0.2154, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24773220717906952, |
| "step": 585, |
| "valid_targets_mean": 4261.8, |
| "valid_targets_min": 434 |
| }, |
| { |
| "epoch": 0.9147286821705426, |
| "grad_norm": 0.5436217489799219, |
| "learning_rate": 3.988789084456054e-05, |
| "loss": 0.232, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.26351064443588257, |
| "step": 590, |
| "valid_targets_mean": 3915.2, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 0.9224806201550387, |
| "grad_norm": 0.41536583827338946, |
| "learning_rate": 3.9879566739274626e-05, |
| "loss": 0.2094, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2559744715690613, |
| "step": 595, |
| "valid_targets_mean": 5054.2, |
| "valid_targets_min": 2545 |
| }, |
| { |
| "epoch": 0.9302325581395349, |
| "grad_norm": 0.35411011586501473, |
| "learning_rate": 3.987094549989699e-05, |
| "loss": 0.2118, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18530899286270142, |
| "step": 600, |
| "valid_targets_mean": 5971.2, |
| "valid_targets_min": 1835 |
| }, |
| { |
| "epoch": 0.937984496124031, |
| "grad_norm": 0.4392551065067926, |
| "learning_rate": 3.98620272552868e-05, |
| "loss": 0.2495, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21953071653842926, |
| "step": 605, |
| "valid_targets_mean": 4565.2, |
| "valid_targets_min": 1942 |
| }, |
| { |
| "epoch": 0.9457364341085271, |
| "grad_norm": 0.47803844935864886, |
| "learning_rate": 3.985281213874244e-05, |
| "loss": 0.2298, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29870736598968506, |
| "step": 610, |
| "valid_targets_mean": 4237.6, |
| "valid_targets_min": 326 |
| }, |
| { |
| "epoch": 0.9534883720930233, |
| "grad_norm": 0.44870011943315186, |
| "learning_rate": 3.984330028799957e-05, |
| "loss": 0.2274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2335856556892395, |
| "step": 615, |
| "valid_targets_mean": 4557.3, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 0.9612403100775194, |
| "grad_norm": 0.5014485102007264, |
| "learning_rate": 3.9833491845229065e-05, |
| "loss": 0.2085, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.253334641456604, |
| "step": 620, |
| "valid_targets_mean": 3717.8, |
| "valid_targets_min": 926 |
| }, |
| { |
| "epoch": 0.9689922480620154, |
| "grad_norm": 0.4539009088514093, |
| "learning_rate": 3.982338695703486e-05, |
| "loss": 0.2471, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2949668765068054, |
| "step": 625, |
| "valid_targets_mean": 4934.7, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 0.9767441860465116, |
| "grad_norm": 0.42836269237630537, |
| "learning_rate": 3.9812985774451763e-05, |
| "loss": 0.227, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23034946620464325, |
| "step": 630, |
| "valid_targets_mean": 4939.8, |
| "valid_targets_min": 2461 |
| }, |
| { |
| "epoch": 0.9844961240310077, |
| "grad_norm": 0.6158981927965868, |
| "learning_rate": 3.980228845294323e-05, |
| "loss": 0.2103, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23234328627586365, |
| "step": 635, |
| "valid_targets_mean": 4101.9, |
| "valid_targets_min": 386 |
| }, |
| { |
| "epoch": 0.9922480620155039, |
| "grad_norm": 0.4762142114139161, |
| "learning_rate": 3.9791295152399014e-05, |
| "loss": 0.2229, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20974400639533997, |
| "step": 640, |
| "valid_targets_mean": 3889.9, |
| "valid_targets_min": 266 |
| }, |
| { |
| "epoch": 1.0, |
| "grad_norm": 0.5061517747796611, |
| "learning_rate": 3.978000603713276e-05, |
| "loss": 0.2162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21345987915992737, |
| "step": 645, |
| "valid_targets_mean": 3841.9, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 1.0077519379844961, |
| "grad_norm": 0.7869218457307112, |
| "learning_rate": 3.976842127587959e-05, |
| "loss": 0.2392, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23174425959587097, |
| "step": 650, |
| "valid_targets_mean": 5303.6, |
| "valid_targets_min": 1966 |
| }, |
| { |
| "epoch": 1.0155038759689923, |
| "grad_norm": 0.5003906965370145, |
| "learning_rate": 3.975654104179356e-05, |
| "loss": 0.2077, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22817862033843994, |
| "step": 655, |
| "valid_targets_mean": 3844.0, |
| "valid_targets_min": 568 |
| }, |
| { |
| "epoch": 1.0232558139534884, |
| "grad_norm": 0.4114203739700514, |
| "learning_rate": 3.9744365512445056e-05, |
| "loss": 0.2283, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25271815061569214, |
| "step": 660, |
| "valid_targets_mean": 5901.1, |
| "valid_targets_min": 2452 |
| }, |
| { |
| "epoch": 1.0310077519379846, |
| "grad_norm": 0.4575096509840006, |
| "learning_rate": 3.973189486981818e-05, |
| "loss": 0.2171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2162925899028778, |
| "step": 665, |
| "valid_targets_mean": 4902.4, |
| "valid_targets_min": 497 |
| }, |
| { |
| "epoch": 1.0387596899224807, |
| "grad_norm": 0.4021600509804852, |
| "learning_rate": 3.971912930030799e-05, |
| "loss": 0.2048, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19043004512786865, |
| "step": 670, |
| "valid_targets_mean": 4917.0, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 1.0465116279069768, |
| "grad_norm": 0.4989156170962161, |
| "learning_rate": 3.970606899471774e-05, |
| "loss": 0.2215, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17856532335281372, |
| "step": 675, |
| "valid_targets_mean": 4752.6, |
| "valid_targets_min": 502 |
| }, |
| { |
| "epoch": 1.054263565891473, |
| "grad_norm": 0.3847796119558988, |
| "learning_rate": 3.969271414825599e-05, |
| "loss": 0.1926, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20729967951774597, |
| "step": 680, |
| "valid_targets_mean": 5683.9, |
| "valid_targets_min": 1844 |
| }, |
| { |
| "epoch": 1.062015503875969, |
| "grad_norm": 0.47657171710131, |
| "learning_rate": 3.967906496053377e-05, |
| "loss": 0.2187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21222332119941711, |
| "step": 685, |
| "valid_targets_mean": 4150.8, |
| "valid_targets_min": 962 |
| }, |
| { |
| "epoch": 1.069767441860465, |
| "grad_norm": 0.3858090579432838, |
| "learning_rate": 3.966512163556149e-05, |
| "loss": 0.2201, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2170460969209671, |
| "step": 690, |
| "valid_targets_mean": 5164.2, |
| "valid_targets_min": 1885 |
| }, |
| { |
| "epoch": 1.0775193798449612, |
| "grad_norm": 0.4290059612627937, |
| "learning_rate": 3.965088438174597e-05, |
| "loss": 0.1915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1908944547176361, |
| "step": 695, |
| "valid_targets_mean": 4788.8, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 1.0852713178294573, |
| "grad_norm": 0.4409936183324337, |
| "learning_rate": 3.963635341188729e-05, |
| "loss": 0.2102, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23212580382823944, |
| "step": 700, |
| "valid_targets_mean": 4988.8, |
| "valid_targets_min": 558 |
| }, |
| { |
| "epoch": 1.0930232558139534, |
| "grad_norm": 0.45813599715819825, |
| "learning_rate": 3.962152894317564e-05, |
| "loss": 0.2243, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23683017492294312, |
| "step": 705, |
| "valid_targets_mean": 4570.3, |
| "valid_targets_min": 2488 |
| }, |
| { |
| "epoch": 1.1007751937984496, |
| "grad_norm": 0.40951900195560925, |
| "learning_rate": 3.960641119718802e-05, |
| "loss": 0.2143, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2278529703617096, |
| "step": 710, |
| "valid_targets_mean": 5026.8, |
| "valid_targets_min": 393 |
| }, |
| { |
| "epoch": 1.1085271317829457, |
| "grad_norm": 0.36962646479291916, |
| "learning_rate": 3.9591000399884974e-05, |
| "loss": 0.1855, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19535881280899048, |
| "step": 715, |
| "valid_targets_mean": 5893.4, |
| "valid_targets_min": 1714 |
| }, |
| { |
| "epoch": 1.1162790697674418, |
| "grad_norm": 0.4169785909813559, |
| "learning_rate": 3.957529678160721e-05, |
| "loss": 0.2211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22500549256801605, |
| "step": 720, |
| "valid_targets_mean": 5345.6, |
| "valid_targets_min": 512 |
| }, |
| { |
| "epoch": 1.124031007751938, |
| "grad_norm": 0.49607819631085537, |
| "learning_rate": 3.9559300577072115e-05, |
| "loss": 0.2299, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25468283891677856, |
| "step": 725, |
| "valid_targets_mean": 5040.8, |
| "valid_targets_min": 2775 |
| }, |
| { |
| "epoch": 1.1317829457364341, |
| "grad_norm": 0.5069100805388594, |
| "learning_rate": 3.954301202537032e-05, |
| "loss": 0.1978, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1782360076904297, |
| "step": 730, |
| "valid_targets_mean": 5846.9, |
| "valid_targets_min": 2328 |
| }, |
| { |
| "epoch": 1.1395348837209303, |
| "grad_norm": 0.5044747278952141, |
| "learning_rate": 3.952643136996205e-05, |
| "loss": 0.2022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22031991183757782, |
| "step": 735, |
| "valid_targets_mean": 3806.4, |
| "valid_targets_min": 250 |
| }, |
| { |
| "epoch": 1.1472868217054264, |
| "grad_norm": 0.713115718875641, |
| "learning_rate": 3.950955885867353e-05, |
| "loss": 0.1987, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17436224222183228, |
| "step": 740, |
| "valid_targets_mean": 4936.1, |
| "valid_targets_min": 2127 |
| }, |
| { |
| "epoch": 1.1550387596899225, |
| "grad_norm": 0.5036250359903303, |
| "learning_rate": 3.9492394743693266e-05, |
| "loss": 0.2187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2408798635005951, |
| "step": 745, |
| "valid_targets_mean": 3656.3, |
| "valid_targets_min": 555 |
| }, |
| { |
| "epoch": 1.1627906976744187, |
| "grad_norm": 0.46006096792307244, |
| "learning_rate": 3.94749392815683e-05, |
| "loss": 0.1973, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19669455289840698, |
| "step": 750, |
| "valid_targets_mean": 4952.6, |
| "valid_targets_min": 1766 |
| }, |
| { |
| "epoch": 1.1705426356589148, |
| "grad_norm": 0.4672041249500244, |
| "learning_rate": 3.9457192733200315e-05, |
| "loss": 0.2053, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1791488230228424, |
| "step": 755, |
| "valid_targets_mean": 4441.9, |
| "valid_targets_min": 650 |
| }, |
| { |
| "epoch": 1.178294573643411, |
| "grad_norm": 0.42348721602696954, |
| "learning_rate": 3.9439155363841814e-05, |
| "loss": 0.2092, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17398425936698914, |
| "step": 760, |
| "valid_targets_mean": 4538.8, |
| "valid_targets_min": 277 |
| }, |
| { |
| "epoch": 1.1860465116279069, |
| "grad_norm": 0.5878356373078284, |
| "learning_rate": 3.9420827443092104e-05, |
| "loss": 0.2076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2349127233028412, |
| "step": 765, |
| "valid_targets_mean": 4086.5, |
| "valid_targets_min": 644 |
| }, |
| { |
| "epoch": 1.193798449612403, |
| "grad_norm": 0.476452037868028, |
| "learning_rate": 3.940220924489327e-05, |
| "loss": 0.2181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2374195158481598, |
| "step": 770, |
| "valid_targets_mean": 3906.2, |
| "valid_targets_min": 487 |
| }, |
| { |
| "epoch": 1.2015503875968991, |
| "grad_norm": 0.4353925367240353, |
| "learning_rate": 3.938330104752609e-05, |
| "loss": 0.2182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20411117374897003, |
| "step": 775, |
| "valid_targets_mean": 4184.5, |
| "valid_targets_min": 317 |
| }, |
| { |
| "epoch": 1.2093023255813953, |
| "grad_norm": 0.44738786787353246, |
| "learning_rate": 3.936410313360589e-05, |
| "loss": 0.2074, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.29115378856658936, |
| "step": 780, |
| "valid_targets_mean": 5176.8, |
| "valid_targets_min": 2427 |
| }, |
| { |
| "epoch": 1.2170542635658914, |
| "grad_norm": 0.5025078305803677, |
| "learning_rate": 3.934461579007829e-05, |
| "loss": 0.1905, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.194045752286911, |
| "step": 785, |
| "valid_targets_mean": 4190.2, |
| "valid_targets_min": 2274 |
| }, |
| { |
| "epoch": 1.2248062015503876, |
| "grad_norm": 0.399168491370644, |
| "learning_rate": 3.932483930821495e-05, |
| "loss": 0.2027, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19120316207408905, |
| "step": 790, |
| "valid_targets_mean": 5678.2, |
| "valid_targets_min": 2268 |
| }, |
| { |
| "epoch": 1.2325581395348837, |
| "grad_norm": 0.40122275394036194, |
| "learning_rate": 3.930477398360915e-05, |
| "loss": 0.2109, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20044457912445068, |
| "step": 795, |
| "valid_targets_mean": 5078.8, |
| "valid_targets_min": 1999 |
| }, |
| { |
| "epoch": 1.2403100775193798, |
| "grad_norm": 0.42534010971764247, |
| "learning_rate": 3.928442011617148e-05, |
| "loss": 0.2093, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21228013932704926, |
| "step": 800, |
| "valid_targets_mean": 3933.1, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 1.248062015503876, |
| "grad_norm": 0.7069266989704566, |
| "learning_rate": 3.926377801012526e-05, |
| "loss": 0.2367, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22949740290641785, |
| "step": 805, |
| "valid_targets_mean": 4512.6, |
| "valid_targets_min": 299 |
| }, |
| { |
| "epoch": 1.255813953488372, |
| "grad_norm": 0.42027583645711425, |
| "learning_rate": 3.9242847974002026e-05, |
| "loss": 0.2204, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2134920060634613, |
| "step": 810, |
| "valid_targets_mean": 4943.6, |
| "valid_targets_min": 1805 |
| }, |
| { |
| "epoch": 1.2635658914728682, |
| "grad_norm": 0.39016064981111986, |
| "learning_rate": 3.9221630320636935e-05, |
| "loss": 0.2095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19790124893188477, |
| "step": 815, |
| "valid_targets_mean": 4984.6, |
| "valid_targets_min": 2085 |
| }, |
| { |
| "epoch": 1.2713178294573644, |
| "grad_norm": 0.48120226759216767, |
| "learning_rate": 3.9200125367164076e-05, |
| "loss": 0.2083, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19904130697250366, |
| "step": 820, |
| "valid_targets_mean": 3452.6, |
| "valid_targets_min": 477 |
| }, |
| { |
| "epoch": 1.2790697674418605, |
| "grad_norm": 0.4551570397834542, |
| "learning_rate": 3.917833343501171e-05, |
| "loss": 0.1955, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19769467413425446, |
| "step": 825, |
| "valid_targets_mean": 5811.2, |
| "valid_targets_min": 923 |
| }, |
| { |
| "epoch": 1.2868217054263567, |
| "grad_norm": 0.43735207764564604, |
| "learning_rate": 3.91562548498975e-05, |
| "loss": 0.1992, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20643508434295654, |
| "step": 830, |
| "valid_targets_mean": 4570.1, |
| "valid_targets_min": 2493 |
| }, |
| { |
| "epoch": 1.2945736434108528, |
| "grad_norm": 0.4299580048955895, |
| "learning_rate": 3.913388994182364e-05, |
| "loss": 0.2196, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18837128579616547, |
| "step": 835, |
| "valid_targets_mean": 4744.1, |
| "valid_targets_min": 881 |
| }, |
| { |
| "epoch": 1.302325581395349, |
| "grad_norm": 0.3538726377495065, |
| "learning_rate": 3.9111239045071876e-05, |
| "loss": 0.1755, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13884110748767853, |
| "step": 840, |
| "valid_targets_mean": 5657.9, |
| "valid_targets_min": 453 |
| }, |
| { |
| "epoch": 1.310077519379845, |
| "grad_norm": 0.48494658304811955, |
| "learning_rate": 3.9088302498198564e-05, |
| "loss": 0.2032, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21122536063194275, |
| "step": 845, |
| "valid_targets_mean": 4122.8, |
| "valid_targets_min": 264 |
| }, |
| { |
| "epoch": 1.3178294573643412, |
| "grad_norm": 0.40106643807384035, |
| "learning_rate": 3.90650806440296e-05, |
| "loss": 0.1862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19900798797607422, |
| "step": 850, |
| "valid_targets_mean": 5050.8, |
| "valid_targets_min": 2416 |
| }, |
| { |
| "epoch": 1.3255813953488373, |
| "grad_norm": 0.3960604184673925, |
| "learning_rate": 3.904157382965526e-05, |
| "loss": 0.2157, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22484715282917023, |
| "step": 855, |
| "valid_targets_mean": 5748.9, |
| "valid_targets_min": 1856 |
| }, |
| { |
| "epoch": 1.3333333333333333, |
| "grad_norm": 0.3257220820239636, |
| "learning_rate": 3.9017782406425045e-05, |
| "loss": 0.2088, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16785819828510284, |
| "step": 860, |
| "valid_targets_mean": 5923.4, |
| "valid_targets_min": 2779 |
| }, |
| { |
| "epoch": 1.3410852713178294, |
| "grad_norm": 0.4239797338208263, |
| "learning_rate": 3.899370672994244e-05, |
| "loss": 0.2188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1850738823413849, |
| "step": 865, |
| "valid_targets_mean": 4976.4, |
| "valid_targets_min": 695 |
| }, |
| { |
| "epoch": 1.3488372093023255, |
| "grad_norm": 0.4680128138024682, |
| "learning_rate": 3.896934716005956e-05, |
| "loss": 0.219, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23862537741661072, |
| "step": 870, |
| "valid_targets_mean": 4609.4, |
| "valid_targets_min": 321 |
| }, |
| { |
| "epoch": 1.3565891472868217, |
| "grad_norm": 0.34295981747721627, |
| "learning_rate": 3.8944704060871803e-05, |
| "loss": 0.2328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19128797948360443, |
| "step": 875, |
| "valid_targets_mean": 6440.4, |
| "valid_targets_min": 2928 |
| }, |
| { |
| "epoch": 1.3643410852713178, |
| "grad_norm": 0.39579678053682266, |
| "learning_rate": 3.891977780071238e-05, |
| "loss": 0.2386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22662851214408875, |
| "step": 880, |
| "valid_targets_mean": 5590.4, |
| "valid_targets_min": 418 |
| }, |
| { |
| "epoch": 1.372093023255814, |
| "grad_norm": 0.3650270597088362, |
| "learning_rate": 3.889456875214685e-05, |
| "loss": 0.2028, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18867811560630798, |
| "step": 885, |
| "valid_targets_mean": 5108.4, |
| "valid_targets_min": 2550 |
| }, |
| { |
| "epoch": 1.37984496124031, |
| "grad_norm": 0.43546961058361106, |
| "learning_rate": 3.8869077291967514e-05, |
| "loss": 0.2091, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18624623119831085, |
| "step": 890, |
| "valid_targets_mean": 3812.8, |
| "valid_targets_min": 310 |
| }, |
| { |
| "epoch": 1.3875968992248062, |
| "grad_norm": 0.35003941903300767, |
| "learning_rate": 3.88433038011878e-05, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17150872945785522, |
| "step": 895, |
| "valid_targets_mean": 5599.2, |
| "valid_targets_min": 2853 |
| }, |
| { |
| "epoch": 1.3953488372093024, |
| "grad_norm": 0.40616386423722534, |
| "learning_rate": 3.881724866503656e-05, |
| "loss": 0.207, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.221075639128685, |
| "step": 900, |
| "valid_targets_mean": 4683.5, |
| "valid_targets_min": 1955 |
| }, |
| { |
| "epoch": 1.4031007751937985, |
| "grad_norm": 0.45770780156293883, |
| "learning_rate": 3.879091227295233e-05, |
| "loss": 0.2342, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3284824788570404, |
| "step": 905, |
| "valid_targets_mean": 5965.8, |
| "valid_targets_min": 2467 |
| }, |
| { |
| "epoch": 1.4108527131782946, |
| "grad_norm": 0.43076323744174305, |
| "learning_rate": 3.876429501857748e-05, |
| "loss": 0.2165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2374260425567627, |
| "step": 910, |
| "valid_targets_mean": 5230.9, |
| "valid_targets_min": 2401 |
| }, |
| { |
| "epoch": 1.4186046511627908, |
| "grad_norm": 0.4744851861080025, |
| "learning_rate": 3.873739729975237e-05, |
| "loss": 0.2156, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22709140181541443, |
| "step": 915, |
| "valid_targets_mean": 3975.9, |
| "valid_targets_min": 281 |
| }, |
| { |
| "epoch": 1.4263565891472867, |
| "grad_norm": 0.4914323912239341, |
| "learning_rate": 3.871021951850935e-05, |
| "loss": 0.2059, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2681000232696533, |
| "step": 920, |
| "valid_targets_mean": 4153.2, |
| "valid_targets_min": 579 |
| }, |
| { |
| "epoch": 1.4341085271317828, |
| "grad_norm": 0.5702552607786674, |
| "learning_rate": 3.868276208106681e-05, |
| "loss": 0.2307, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23841242492198944, |
| "step": 925, |
| "valid_targets_mean": 4588.2, |
| "valid_targets_min": 330 |
| }, |
| { |
| "epoch": 1.441860465116279, |
| "grad_norm": 0.4960800862921102, |
| "learning_rate": 3.8655025397823054e-05, |
| "loss": 0.1843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19032783806324005, |
| "step": 930, |
| "valid_targets_mean": 4889.1, |
| "valid_targets_min": 792 |
| }, |
| { |
| "epoch": 1.449612403100775, |
| "grad_norm": 0.3982547722090709, |
| "learning_rate": 3.862700988335022e-05, |
| "loss": 0.2096, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19539685547351837, |
| "step": 935, |
| "valid_targets_mean": 5027.4, |
| "valid_targets_min": 2790 |
| }, |
| { |
| "epoch": 1.4573643410852712, |
| "grad_norm": 0.4822298209707658, |
| "learning_rate": 3.8598715956388026e-05, |
| "loss": 0.218, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19648897647857666, |
| "step": 940, |
| "valid_targets_mean": 3873.2, |
| "valid_targets_min": 346 |
| }, |
| { |
| "epoch": 1.4651162790697674, |
| "grad_norm": 0.372486771897578, |
| "learning_rate": 3.8570144039837564e-05, |
| "loss": 0.2036, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15964803099632263, |
| "step": 945, |
| "valid_targets_mean": 4909.3, |
| "valid_targets_min": 2298 |
| }, |
| { |
| "epoch": 1.4728682170542635, |
| "grad_norm": 0.39582842776828425, |
| "learning_rate": 3.854129456075495e-05, |
| "loss": 0.2138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1935088038444519, |
| "step": 950, |
| "valid_targets_mean": 5237.1, |
| "valid_targets_min": 2445 |
| }, |
| { |
| "epoch": 1.4806201550387597, |
| "grad_norm": 0.4768595855727291, |
| "learning_rate": 3.8512167950344916e-05, |
| "loss": 0.2198, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24240124225616455, |
| "step": 955, |
| "valid_targets_mean": 4105.6, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 1.4883720930232558, |
| "grad_norm": 0.4935988281203597, |
| "learning_rate": 3.848276464395445e-05, |
| "loss": 0.2062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24553832411766052, |
| "step": 960, |
| "valid_targets_mean": 4142.4, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 1.496124031007752, |
| "grad_norm": 0.3508044933691806, |
| "learning_rate": 3.8453085081066195e-05, |
| "loss": 0.1977, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1662253439426422, |
| "step": 965, |
| "valid_targets_mean": 5088.2, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 1.503875968992248, |
| "grad_norm": 0.40679599062954963, |
| "learning_rate": 3.842312970529193e-05, |
| "loss": 0.2284, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2687034010887146, |
| "step": 970, |
| "valid_targets_mean": 5584.9, |
| "valid_targets_min": 265 |
| }, |
| { |
| "epoch": 1.5116279069767442, |
| "grad_norm": 0.5352927860483538, |
| "learning_rate": 3.839289896436592e-05, |
| "loss": 0.2209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24231748282909393, |
| "step": 975, |
| "valid_targets_mean": 3208.9, |
| "valid_targets_min": 401 |
| }, |
| { |
| "epoch": 1.5193798449612403, |
| "grad_norm": 0.4748472407205153, |
| "learning_rate": 3.836239331013825e-05, |
| "loss": 0.2151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18979281187057495, |
| "step": 980, |
| "valid_targets_mean": 3701.5, |
| "valid_targets_min": 455 |
| }, |
| { |
| "epoch": 1.5271317829457365, |
| "grad_norm": 0.345182798324371, |
| "learning_rate": 3.8331613198568056e-05, |
| "loss": 0.1933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.164521723985672, |
| "step": 985, |
| "valid_targets_mean": 5305.6, |
| "valid_targets_min": 2154 |
| }, |
| { |
| "epoch": 1.5348837209302326, |
| "grad_norm": 0.34148764388998604, |
| "learning_rate": 3.830055908971668e-05, |
| "loss": 0.1917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1817236989736557, |
| "step": 990, |
| "valid_targets_mean": 5507.2, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 1.5426356589147288, |
| "grad_norm": 0.3914530838647767, |
| "learning_rate": 3.8269231447740844e-05, |
| "loss": 0.2134, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18969038128852844, |
| "step": 995, |
| "valid_targets_mean": 5196.0, |
| "valid_targets_min": 827 |
| }, |
| { |
| "epoch": 1.550387596899225, |
| "grad_norm": 0.39571077331421817, |
| "learning_rate": 3.823763074088568e-05, |
| "loss": 0.2054, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.209140807390213, |
| "step": 1000, |
| "valid_targets_mean": 5359.5, |
| "valid_targets_min": 1861 |
| }, |
| { |
| "epoch": 1.558139534883721, |
| "grad_norm": 0.3713493032556294, |
| "learning_rate": 3.8205757441477755e-05, |
| "loss": 0.2178, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1935080587863922, |
| "step": 1005, |
| "valid_targets_mean": 5409.0, |
| "valid_targets_min": 2022 |
| }, |
| { |
| "epoch": 1.5658914728682172, |
| "grad_norm": 0.40758343223754234, |
| "learning_rate": 3.8173612025917984e-05, |
| "loss": 0.216, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19840386509895325, |
| "step": 1010, |
| "valid_targets_mean": 5117.1, |
| "valid_targets_min": 590 |
| }, |
| { |
| "epoch": 1.5736434108527133, |
| "grad_norm": 0.3957074242428162, |
| "learning_rate": 3.8141194974674534e-05, |
| "loss": 0.2104, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20921745896339417, |
| "step": 1015, |
| "valid_targets_mean": 4456.0, |
| "valid_targets_min": 391 |
| }, |
| { |
| "epoch": 1.5813953488372094, |
| "grad_norm": 0.3733502693439458, |
| "learning_rate": 3.810850677227561e-05, |
| "loss": 0.2013, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16597923636436462, |
| "step": 1020, |
| "valid_targets_mean": 4493.0, |
| "valid_targets_min": 529 |
| }, |
| { |
| "epoch": 1.5891472868217056, |
| "grad_norm": 0.3628573096363499, |
| "learning_rate": 3.8075547907302255e-05, |
| "loss": 0.2158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20087650418281555, |
| "step": 1025, |
| "valid_targets_mean": 5676.1, |
| "valid_targets_min": 1946 |
| }, |
| { |
| "epoch": 1.5968992248062015, |
| "grad_norm": 0.4127367151722258, |
| "learning_rate": 3.804231887238103e-05, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2233181893825531, |
| "step": 1030, |
| "valid_targets_mean": 4449.3, |
| "valid_targets_min": 977 |
| }, |
| { |
| "epoch": 1.6046511627906976, |
| "grad_norm": 0.3649731232133132, |
| "learning_rate": 3.800882016417662e-05, |
| "loss": 0.2217, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16599664092063904, |
| "step": 1035, |
| "valid_targets_mean": 4848.2, |
| "valid_targets_min": 1859 |
| }, |
| { |
| "epoch": 1.6124031007751938, |
| "grad_norm": 0.46927973730672984, |
| "learning_rate": 3.797505228338447e-05, |
| "loss": 0.2065, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2043415606021881, |
| "step": 1040, |
| "valid_targets_mean": 3859.1, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 1.62015503875969, |
| "grad_norm": 0.452023920939608, |
| "learning_rate": 3.794101573472325e-05, |
| "loss": 0.1983, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24635906517505646, |
| "step": 1045, |
| "valid_targets_mean": 4854.6, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 1.627906976744186, |
| "grad_norm": 0.41920457500146513, |
| "learning_rate": 3.7906711026927344e-05, |
| "loss": 0.1927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21003258228302002, |
| "step": 1050, |
| "valid_targets_mean": 4362.9, |
| "valid_targets_min": 2643 |
| }, |
| { |
| "epoch": 1.6356589147286822, |
| "grad_norm": 0.46857169083181116, |
| "learning_rate": 3.787213867273921e-05, |
| "loss": 0.2055, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2265489399433136, |
| "step": 1055, |
| "valid_targets_mean": 4190.8, |
| "valid_targets_min": 1976 |
| }, |
| { |
| "epoch": 1.6434108527131783, |
| "grad_norm": 0.4767624399813519, |
| "learning_rate": 3.783729918890176e-05, |
| "loss": 0.2186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17004413902759552, |
| "step": 1060, |
| "valid_targets_mean": 5151.8, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 1.6511627906976745, |
| "grad_norm": 0.3947749262809709, |
| "learning_rate": 3.780219309615061e-05, |
| "loss": 0.2164, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20741719007492065, |
| "step": 1065, |
| "valid_targets_mean": 4775.2, |
| "valid_targets_min": 2041 |
| }, |
| { |
| "epoch": 1.6589147286821704, |
| "grad_norm": 0.3652762324269706, |
| "learning_rate": 3.7766820919206294e-05, |
| "loss": 0.2074, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1898358166217804, |
| "step": 1070, |
| "valid_targets_mean": 5115.6, |
| "valid_targets_min": 395 |
| }, |
| { |
| "epoch": 1.6666666666666665, |
| "grad_norm": 0.4172044880561881, |
| "learning_rate": 3.7731183186766444e-05, |
| "loss": 0.2037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19984492659568787, |
| "step": 1075, |
| "valid_targets_mean": 4925.4, |
| "valid_targets_min": 2372 |
| }, |
| { |
| "epoch": 1.6744186046511627, |
| "grad_norm": 0.37343486351450866, |
| "learning_rate": 3.7695280431497845e-05, |
| "loss": 0.2067, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21672552824020386, |
| "step": 1080, |
| "valid_targets_mean": 5672.4, |
| "valid_targets_min": 3114 |
| }, |
| { |
| "epoch": 1.6821705426356588, |
| "grad_norm": 0.4094562646804994, |
| "learning_rate": 3.765911319002854e-05, |
| "loss": 0.2256, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2076679766178131, |
| "step": 1085, |
| "valid_targets_mean": 4861.9, |
| "valid_targets_min": 351 |
| }, |
| { |
| "epoch": 1.689922480620155, |
| "grad_norm": 0.31444076763215517, |
| "learning_rate": 3.762268200293973e-05, |
| "loss": 0.1921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13465389609336853, |
| "step": 1090, |
| "valid_targets_mean": 4960.0, |
| "valid_targets_min": 566 |
| }, |
| { |
| "epoch": 1.697674418604651, |
| "grad_norm": 0.4339023669513262, |
| "learning_rate": 3.7585987414757774e-05, |
| "loss": 0.2153, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1692432165145874, |
| "step": 1095, |
| "valid_targets_mean": 3976.5, |
| "valid_targets_min": 1131 |
| }, |
| { |
| "epoch": 1.7054263565891472, |
| "grad_norm": 0.493759660874177, |
| "learning_rate": 3.754902997394597e-05, |
| "loss": 0.2076, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20814771950244904, |
| "step": 1100, |
| "valid_targets_mean": 4421.8, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 1.7131782945736433, |
| "grad_norm": 0.39667125615949944, |
| "learning_rate": 3.7511810232896435e-05, |
| "loss": 0.2221, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24969351291656494, |
| "step": 1105, |
| "valid_targets_mean": 6635.4, |
| "valid_targets_min": 767 |
| }, |
| { |
| "epoch": 1.7209302325581395, |
| "grad_norm": 0.40845510116998796, |
| "learning_rate": 3.7474328747921776e-05, |
| "loss": 0.192, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2053869366645813, |
| "step": 1110, |
| "valid_targets_mean": 4257.3, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 1.7286821705426356, |
| "grad_norm": 0.3654829840675916, |
| "learning_rate": 3.743658607924683e-05, |
| "loss": 0.2047, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20669598877429962, |
| "step": 1115, |
| "valid_targets_mean": 5434.2, |
| "valid_targets_min": 599 |
| }, |
| { |
| "epoch": 1.7364341085271318, |
| "grad_norm": 0.437762903353236, |
| "learning_rate": 3.739858279100028e-05, |
| "loss": 0.1922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2025665044784546, |
| "step": 1120, |
| "valid_targets_mean": 5428.5, |
| "valid_targets_min": 3371 |
| }, |
| { |
| "epoch": 1.744186046511628, |
| "grad_norm": 0.5392878995782371, |
| "learning_rate": 3.736031945120621e-05, |
| "loss": 0.2211, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22214415669441223, |
| "step": 1125, |
| "valid_targets_mean": 4204.6, |
| "valid_targets_min": 1972 |
| }, |
| { |
| "epoch": 1.751937984496124, |
| "grad_norm": 0.550987196574115, |
| "learning_rate": 3.732179663177559e-05, |
| "loss": 0.1964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17631106078624725, |
| "step": 1130, |
| "valid_targets_mean": 5127.2, |
| "valid_targets_min": 2529 |
| }, |
| { |
| "epoch": 1.7596899224806202, |
| "grad_norm": 0.3704297654863633, |
| "learning_rate": 3.728301490849778e-05, |
| "loss": 0.2116, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18758273124694824, |
| "step": 1135, |
| "valid_targets_mean": 5341.6, |
| "valid_targets_min": 2320 |
| }, |
| { |
| "epoch": 1.7674418604651163, |
| "grad_norm": 0.466284801284017, |
| "learning_rate": 3.7243974861031915e-05, |
| "loss": 0.2052, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27421271800994873, |
| "step": 1140, |
| "valid_targets_mean": 4469.6, |
| "valid_targets_min": 2055 |
| }, |
| { |
| "epoch": 1.7751937984496124, |
| "grad_norm": 0.4548187236481328, |
| "learning_rate": 3.720467707289819e-05, |
| "loss": 0.1848, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19912035763263702, |
| "step": 1145, |
| "valid_targets_mean": 5421.1, |
| "valid_targets_min": 297 |
| }, |
| { |
| "epoch": 1.7829457364341086, |
| "grad_norm": 0.4234654458795664, |
| "learning_rate": 3.7165122131469205e-05, |
| "loss": 0.1967, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20600225031375885, |
| "step": 1150, |
| "valid_targets_mean": 4677.9, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 1.7906976744186047, |
| "grad_norm": 0.4892297020617883, |
| "learning_rate": 3.712531062796114e-05, |
| "loss": 0.2302, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2325432002544403, |
| "step": 1155, |
| "valid_targets_mean": 3676.9, |
| "valid_targets_min": 378 |
| }, |
| { |
| "epoch": 1.7984496124031009, |
| "grad_norm": 0.4615952861064993, |
| "learning_rate": 3.708524315742494e-05, |
| "loss": 0.2095, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20138488709926605, |
| "step": 1160, |
| "valid_targets_mean": 3587.5, |
| "valid_targets_min": 649 |
| }, |
| { |
| "epoch": 1.806201550387597, |
| "grad_norm": 0.4107586531975636, |
| "learning_rate": 3.704492031873742e-05, |
| "loss": 0.2085, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18871745467185974, |
| "step": 1165, |
| "valid_targets_mean": 4104.7, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 1.8139534883720931, |
| "grad_norm": 0.4364150036844027, |
| "learning_rate": 3.700434271459229e-05, |
| "loss": 0.1851, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18455129861831665, |
| "step": 1170, |
| "valid_targets_mean": 4351.6, |
| "valid_targets_min": 528 |
| }, |
| { |
| "epoch": 1.8217054263565893, |
| "grad_norm": 0.40802425859518093, |
| "learning_rate": 3.696351095149117e-05, |
| "loss": 0.2017, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20364965498447418, |
| "step": 1175, |
| "valid_targets_mean": 4112.6, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 1.8294573643410854, |
| "grad_norm": 0.4032478517472396, |
| "learning_rate": 3.692242563973454e-05, |
| "loss": 0.2209, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.25360697507858276, |
| "step": 1180, |
| "valid_targets_mean": 5295.9, |
| "valid_targets_min": 556 |
| }, |
| { |
| "epoch": 1.8372093023255816, |
| "grad_norm": 0.4614085026878937, |
| "learning_rate": 3.688108739341258e-05, |
| "loss": 0.1926, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20508089661598206, |
| "step": 1185, |
| "valid_targets_mean": 3781.7, |
| "valid_targets_min": 270 |
| }, |
| { |
| "epoch": 1.8449612403100775, |
| "grad_norm": 0.3802819813887152, |
| "learning_rate": 3.683949683039602e-05, |
| "loss": 0.2274, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20417264103889465, |
| "step": 1190, |
| "valid_targets_mean": 4810.9, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 1.8527131782945736, |
| "grad_norm": 0.43348296046621254, |
| "learning_rate": 3.679765457232687e-05, |
| "loss": 0.2113, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19152264297008514, |
| "step": 1195, |
| "valid_targets_mean": 5837.1, |
| "valid_targets_min": 272 |
| }, |
| { |
| "epoch": 1.8604651162790697, |
| "grad_norm": 0.40270266495111867, |
| "learning_rate": 3.675556124460918e-05, |
| "loss": 0.2061, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18859389424324036, |
| "step": 1200, |
| "valid_targets_mean": 4652.8, |
| "valid_targets_min": 2805 |
| }, |
| { |
| "epoch": 1.8682170542635659, |
| "grad_norm": 0.3784724852972052, |
| "learning_rate": 3.6713217476399654e-05, |
| "loss": 0.2069, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22137880325317383, |
| "step": 1205, |
| "valid_targets_mean": 5666.8, |
| "valid_targets_min": 1380 |
| }, |
| { |
| "epoch": 1.875968992248062, |
| "grad_norm": 0.3563867466614007, |
| "learning_rate": 3.6670623900598264e-05, |
| "loss": 0.1915, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17663565278053284, |
| "step": 1210, |
| "valid_targets_mean": 4829.3, |
| "valid_targets_min": 2526 |
| }, |
| { |
| "epoch": 1.8837209302325582, |
| "grad_norm": 0.32541904092615365, |
| "learning_rate": 3.662778115383876e-05, |
| "loss": 0.2149, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1512431651353836, |
| "step": 1215, |
| "valid_targets_mean": 5500.1, |
| "valid_targets_min": 300 |
| }, |
| { |
| "epoch": 1.8914728682170543, |
| "grad_norm": 0.3562253665751596, |
| "learning_rate": 3.6584689876479206e-05, |
| "loss": 0.195, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16320425271987915, |
| "step": 1220, |
| "valid_targets_mean": 4741.8, |
| "valid_targets_min": 335 |
| }, |
| { |
| "epoch": 1.8992248062015504, |
| "grad_norm": 0.4242425218762759, |
| "learning_rate": 3.654135071259237e-05, |
| "loss": 0.2005, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18462225794792175, |
| "step": 1225, |
| "valid_targets_mean": 3879.1, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 1.9069767441860463, |
| "grad_norm": 0.44990621216299576, |
| "learning_rate": 3.6497764309956104e-05, |
| "loss": 0.2089, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2571909725666046, |
| "step": 1230, |
| "valid_targets_mean": 5112.8, |
| "valid_targets_min": 2435 |
| }, |
| { |
| "epoch": 1.9147286821705425, |
| "grad_norm": 0.3514156745181372, |
| "learning_rate": 3.645393132004367e-05, |
| "loss": 0.2113, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2239769548177719, |
| "step": 1235, |
| "valid_targets_mean": 5990.8, |
| "valid_targets_min": 2526 |
| }, |
| { |
| "epoch": 1.9224806201550386, |
| "grad_norm": 0.4438288563404829, |
| "learning_rate": 3.640985239801399e-05, |
| "loss": 0.2021, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23280391097068787, |
| "step": 1240, |
| "valid_targets_mean": 3919.9, |
| "valid_targets_min": 339 |
| }, |
| { |
| "epoch": 1.9302325581395348, |
| "grad_norm": 0.42245513107437865, |
| "learning_rate": 3.636552820270189e-05, |
| "loss": 0.1932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20294125378131866, |
| "step": 1245, |
| "valid_targets_mean": 4123.6, |
| "valid_targets_min": 608 |
| }, |
| { |
| "epoch": 1.937984496124031, |
| "grad_norm": 0.36173604376638907, |
| "learning_rate": 3.632095939660817e-05, |
| "loss": 0.1921, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19740913808345795, |
| "step": 1250, |
| "valid_targets_mean": 4450.7, |
| "valid_targets_min": 243 |
| }, |
| { |
| "epoch": 1.945736434108527, |
| "grad_norm": 0.4185963445294981, |
| "learning_rate": 3.627614664588981e-05, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20765337347984314, |
| "step": 1255, |
| "valid_targets_mean": 4475.6, |
| "valid_targets_min": 614 |
| }, |
| { |
| "epoch": 1.9534883720930232, |
| "grad_norm": 0.38392441124931787, |
| "learning_rate": 3.623109062034994e-05, |
| "loss": 0.2078, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19816569983959198, |
| "step": 1260, |
| "valid_targets_mean": 4867.6, |
| "valid_targets_min": 655 |
| }, |
| { |
| "epoch": 1.9612403100775193, |
| "grad_norm": 0.43839350861224635, |
| "learning_rate": 3.618579199342783e-05, |
| "loss": 0.1831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20989343523979187, |
| "step": 1265, |
| "valid_targets_mean": 4077.1, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 1.9689922480620154, |
| "grad_norm": 0.4040165567082679, |
| "learning_rate": 3.614025144218887e-05, |
| "loss": 0.2062, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21057480573654175, |
| "step": 1270, |
| "valid_targets_mean": 4318.6, |
| "valid_targets_min": 573 |
| }, |
| { |
| "epoch": 1.9767441860465116, |
| "grad_norm": 0.43337547842383023, |
| "learning_rate": 3.60944696473144e-05, |
| "loss": 0.2247, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1987258493900299, |
| "step": 1275, |
| "valid_targets_mean": 4023.1, |
| "valid_targets_min": 526 |
| }, |
| { |
| "epoch": 1.9844961240310077, |
| "grad_norm": 0.3271715231556842, |
| "learning_rate": 3.604844729309158e-05, |
| "loss": 0.17, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17882460355758667, |
| "step": 1280, |
| "valid_targets_mean": 6442.8, |
| "valid_targets_min": 2484 |
| }, |
| { |
| "epoch": 1.9922480620155039, |
| "grad_norm": 0.40322376508720353, |
| "learning_rate": 3.6002185067403126e-05, |
| "loss": 0.2075, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21025332808494568, |
| "step": 1285, |
| "valid_targets_mean": 4968.1, |
| "valid_targets_min": 1984 |
| }, |
| { |
| "epoch": 2.0, |
| "grad_norm": 0.43384474464309075, |
| "learning_rate": 3.5955683661717045e-05, |
| "loss": 0.1963, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22120501101016998, |
| "step": 1290, |
| "valid_targets_mean": 3698.2, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 2.007751937984496, |
| "grad_norm": 0.3930458616713528, |
| "learning_rate": 3.590894377107629e-05, |
| "loss": 0.186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2099405825138092, |
| "step": 1295, |
| "valid_targets_mean": 5265.2, |
| "valid_targets_min": 528 |
| }, |
| { |
| "epoch": 2.0155038759689923, |
| "grad_norm": 0.3382222565954035, |
| "learning_rate": 3.586196609408841e-05, |
| "loss": 0.1884, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16293954849243164, |
| "step": 1300, |
| "valid_targets_mean": 5672.2, |
| "valid_targets_min": 2311 |
| }, |
| { |
| "epoch": 2.0232558139534884, |
| "grad_norm": 0.4908644970549336, |
| "learning_rate": 3.5814751332915025e-05, |
| "loss": 0.2064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22366786003112793, |
| "step": 1305, |
| "valid_targets_mean": 3243.5, |
| "valid_targets_min": 628 |
| }, |
| { |
| "epoch": 2.0310077519379846, |
| "grad_norm": 0.3498811091866486, |
| "learning_rate": 3.576730019326144e-05, |
| "loss": 0.1841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15233008563518524, |
| "step": 1310, |
| "valid_targets_mean": 4671.6, |
| "valid_targets_min": 529 |
| }, |
| { |
| "epoch": 2.0387596899224807, |
| "grad_norm": 0.413386188431943, |
| "learning_rate": 3.571961338436599e-05, |
| "loss": 0.1917, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18065381050109863, |
| "step": 1315, |
| "valid_targets_mean": 5047.1, |
| "valid_targets_min": 845 |
| }, |
| { |
| "epoch": 2.046511627906977, |
| "grad_norm": 0.37597109516074934, |
| "learning_rate": 3.567169161898954e-05, |
| "loss": 0.1994, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1616477519273758, |
| "step": 1320, |
| "valid_targets_mean": 4590.8, |
| "valid_targets_min": 941 |
| }, |
| { |
| "epoch": 2.054263565891473, |
| "grad_norm": 0.41487589705713607, |
| "learning_rate": 3.562353561340473e-05, |
| "loss": 0.2004, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1990424543619156, |
| "step": 1325, |
| "valid_targets_mean": 5129.2, |
| "valid_targets_min": 2305 |
| }, |
| { |
| "epoch": 2.062015503875969, |
| "grad_norm": 0.3711795564505497, |
| "learning_rate": 3.557514608738536e-05, |
| "loss": 0.18, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15171518921852112, |
| "step": 1330, |
| "valid_targets_mean": 4377.2, |
| "valid_targets_min": 575 |
| }, |
| { |
| "epoch": 2.0697674418604652, |
| "grad_norm": 0.4175667094746574, |
| "learning_rate": 3.552652376419557e-05, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16562065482139587, |
| "step": 1335, |
| "valid_targets_mean": 4697.5, |
| "valid_targets_min": 286 |
| }, |
| { |
| "epoch": 2.0775193798449614, |
| "grad_norm": 0.4306958245785991, |
| "learning_rate": 3.5477669370579045e-05, |
| "loss": 0.2022, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1900160312652588, |
| "step": 1340, |
| "valid_targets_mean": 4857.3, |
| "valid_targets_min": 1846 |
| }, |
| { |
| "epoch": 2.0852713178294575, |
| "grad_norm": 0.4476150200629465, |
| "learning_rate": 3.542858363674819e-05, |
| "loss": 0.1807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18552112579345703, |
| "step": 1345, |
| "valid_targets_mean": 6009.1, |
| "valid_targets_min": 314 |
| }, |
| { |
| "epoch": 2.0930232558139537, |
| "grad_norm": 1.2948036152332547, |
| "learning_rate": 3.537926729637316e-05, |
| "loss": 0.1985, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19947974383831024, |
| "step": 1350, |
| "valid_targets_mean": 5068.8, |
| "valid_targets_min": 2881 |
| }, |
| { |
| "epoch": 2.10077519379845, |
| "grad_norm": 0.41477365418280177, |
| "learning_rate": 3.532972108657093e-05, |
| "loss": 0.1777, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19240254163742065, |
| "step": 1355, |
| "valid_targets_mean": 4253.2, |
| "valid_targets_min": 434 |
| }, |
| { |
| "epoch": 2.108527131782946, |
| "grad_norm": 0.42076615883749335, |
| "learning_rate": 3.527994574789425e-05, |
| "loss": 0.1741, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1795780062675476, |
| "step": 1360, |
| "valid_targets_mean": 4628.8, |
| "valid_targets_min": 677 |
| }, |
| { |
| "epoch": 2.116279069767442, |
| "grad_norm": 0.3617903288384957, |
| "learning_rate": 3.5229942024320614e-05, |
| "loss": 0.1858, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1568509340286255, |
| "step": 1365, |
| "valid_targets_mean": 4954.9, |
| "valid_targets_min": 712 |
| }, |
| { |
| "epoch": 2.124031007751938, |
| "grad_norm": 0.5456999997368401, |
| "learning_rate": 3.517971066324111e-05, |
| "loss": 0.1914, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17306216061115265, |
| "step": 1370, |
| "valid_targets_mean": 3624.9, |
| "valid_targets_min": 335 |
| }, |
| { |
| "epoch": 2.1317829457364343, |
| "grad_norm": 0.38334555353165817, |
| "learning_rate": 3.512925241544925e-05, |
| "loss": 0.1877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19654911756515503, |
| "step": 1375, |
| "valid_targets_mean": 5664.1, |
| "valid_targets_min": 1799 |
| }, |
| { |
| "epoch": 2.13953488372093, |
| "grad_norm": 0.43336348909756756, |
| "learning_rate": 3.5078568035129755e-05, |
| "loss": 0.1835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2114173173904419, |
| "step": 1380, |
| "valid_targets_mean": 4490.0, |
| "valid_targets_min": 535 |
| }, |
| { |
| "epoch": 2.147286821705426, |
| "grad_norm": 0.43851230664405455, |
| "learning_rate": 3.502765827984731e-05, |
| "loss": 0.1816, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2103298455476761, |
| "step": 1385, |
| "valid_targets_mean": 4057.0, |
| "valid_targets_min": 2866 |
| }, |
| { |
| "epoch": 2.1550387596899223, |
| "grad_norm": 0.48397504627229887, |
| "learning_rate": 3.497652391053517e-05, |
| "loss": 0.186, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2291339933872223, |
| "step": 1390, |
| "valid_targets_mean": 4031.1, |
| "valid_targets_min": 630 |
| }, |
| { |
| "epoch": 2.1627906976744184, |
| "grad_norm": 0.4549549638224178, |
| "learning_rate": 3.492516569148388e-05, |
| "loss": 0.2142, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21782903373241425, |
| "step": 1395, |
| "valid_targets_mean": 4231.4, |
| "valid_targets_min": 2014 |
| }, |
| { |
| "epoch": 2.1705426356589146, |
| "grad_norm": 0.36020932761428015, |
| "learning_rate": 3.487358439032975e-05, |
| "loss": 0.1616, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18451038002967834, |
| "step": 1400, |
| "valid_targets_mean": 6068.2, |
| "valid_targets_min": 2874 |
| }, |
| { |
| "epoch": 2.1782945736434107, |
| "grad_norm": 0.3920924834443207, |
| "learning_rate": 3.4821780778043474e-05, |
| "loss": 0.1889, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1814422309398651, |
| "step": 1405, |
| "valid_targets_mean": 4700.9, |
| "valid_targets_min": 656 |
| }, |
| { |
| "epoch": 2.186046511627907, |
| "grad_norm": 0.3750763170625423, |
| "learning_rate": 3.4769755628918545e-05, |
| "loss": 0.1779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1634986400604248, |
| "step": 1410, |
| "valid_targets_mean": 4980.3, |
| "valid_targets_min": 2167 |
| }, |
| { |
| "epoch": 2.193798449612403, |
| "grad_norm": 0.42291953615168815, |
| "learning_rate": 3.471750972055972e-05, |
| "loss": 0.1733, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16338089108467102, |
| "step": 1415, |
| "valid_targets_mean": 4139.0, |
| "valid_targets_min": 391 |
| }, |
| { |
| "epoch": 2.201550387596899, |
| "grad_norm": 0.4171884044672125, |
| "learning_rate": 3.466504383387135e-05, |
| "loss": 0.172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1964506208896637, |
| "step": 1420, |
| "valid_targets_mean": 4754.2, |
| "valid_targets_min": 2815 |
| }, |
| { |
| "epoch": 2.2093023255813953, |
| "grad_norm": 0.3903545245483966, |
| "learning_rate": 3.461235875304577e-05, |
| "loss": 0.1848, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20105893909931183, |
| "step": 1425, |
| "valid_targets_mean": 4361.9, |
| "valid_targets_min": 250 |
| }, |
| { |
| "epoch": 2.2170542635658914, |
| "grad_norm": 0.3750810698508955, |
| "learning_rate": 3.455945526555153e-05, |
| "loss": 0.1867, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17983251810073853, |
| "step": 1430, |
| "valid_targets_mean": 5131.6, |
| "valid_targets_min": 2493 |
| }, |
| { |
| "epoch": 2.2248062015503876, |
| "grad_norm": 0.37223290231346184, |
| "learning_rate": 3.450633416212162e-05, |
| "loss": 0.1922, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16431176662445068, |
| "step": 1435, |
| "valid_targets_mean": 4377.4, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 2.2325581395348837, |
| "grad_norm": 0.3352051342701091, |
| "learning_rate": 3.4452996236741744e-05, |
| "loss": 0.1976, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1869511604309082, |
| "step": 1440, |
| "valid_targets_mean": 5356.9, |
| "valid_targets_min": 2703 |
| }, |
| { |
| "epoch": 2.24031007751938, |
| "grad_norm": 0.432086006561443, |
| "learning_rate": 3.439944228663829e-05, |
| "loss": 0.2079, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21285605430603027, |
| "step": 1445, |
| "valid_targets_mean": 4237.8, |
| "valid_targets_min": 1886 |
| }, |
| { |
| "epoch": 2.248062015503876, |
| "grad_norm": 0.3275443973114785, |
| "learning_rate": 3.434567311226656e-05, |
| "loss": 0.1757, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15418857336044312, |
| "step": 1450, |
| "valid_targets_mean": 5285.2, |
| "valid_targets_min": 566 |
| }, |
| { |
| "epoch": 2.255813953488372, |
| "grad_norm": 0.3576878996712879, |
| "learning_rate": 3.4291689517298734e-05, |
| "loss": 0.1946, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.186420738697052, |
| "step": 1455, |
| "valid_targets_mean": 5496.6, |
| "valid_targets_min": 321 |
| }, |
| { |
| "epoch": 2.2635658914728682, |
| "grad_norm": 0.4962339025365947, |
| "learning_rate": 3.423749230861188e-05, |
| "loss": 0.1694, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17092068493366241, |
| "step": 1460, |
| "valid_targets_mean": 3222.7, |
| "valid_targets_min": 402 |
| }, |
| { |
| "epoch": 2.2713178294573644, |
| "grad_norm": 0.4812137783785399, |
| "learning_rate": 3.418308229627588e-05, |
| "loss": 0.2163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.27093812823295593, |
| "step": 1465, |
| "valid_targets_mean": 4862.1, |
| "valid_targets_min": 556 |
| }, |
| { |
| "epoch": 2.2790697674418605, |
| "grad_norm": 0.4153567019223971, |
| "learning_rate": 3.412846029354134e-05, |
| "loss": 0.1927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.237184539437294, |
| "step": 1470, |
| "valid_targets_mean": 4620.6, |
| "valid_targets_min": 455 |
| }, |
| { |
| "epoch": 2.2868217054263567, |
| "grad_norm": 0.3426626225579909, |
| "learning_rate": 3.4073627116827425e-05, |
| "loss": 0.1781, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18062137067317963, |
| "step": 1475, |
| "valid_targets_mean": 5811.9, |
| "valid_targets_min": 2245 |
| }, |
| { |
| "epoch": 2.294573643410853, |
| "grad_norm": 0.38476093721663684, |
| "learning_rate": 3.4018583585709636e-05, |
| "loss": 0.1816, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18126948177814484, |
| "step": 1480, |
| "valid_targets_mean": 4559.2, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 2.302325581395349, |
| "grad_norm": 0.4096766811442832, |
| "learning_rate": 3.39633305229076e-05, |
| "loss": 0.1877, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20921531319618225, |
| "step": 1485, |
| "valid_targets_mean": 5167.4, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 2.310077519379845, |
| "grad_norm": 0.38639646068488026, |
| "learning_rate": 3.390786875427275e-05, |
| "loss": 0.1811, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15107879042625427, |
| "step": 1490, |
| "valid_targets_mean": 4523.8, |
| "valid_targets_min": 1865 |
| }, |
| { |
| "epoch": 2.317829457364341, |
| "grad_norm": 0.4502008909642411, |
| "learning_rate": 3.385219910877599e-05, |
| "loss": 0.2037, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1977536380290985, |
| "step": 1495, |
| "valid_targets_mean": 4173.2, |
| "valid_targets_min": 1948 |
| }, |
| { |
| "epoch": 2.3255813953488373, |
| "grad_norm": 0.3796879053543267, |
| "learning_rate": 3.3796322418495276e-05, |
| "loss": 0.1879, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1648637056350708, |
| "step": 1500, |
| "valid_targets_mean": 4416.7, |
| "valid_targets_min": 304 |
| }, |
| { |
| "epoch": 2.3333333333333335, |
| "grad_norm": 0.3789163353016251, |
| "learning_rate": 3.374023951860322e-05, |
| "loss": 0.1794, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1563669592142105, |
| "step": 1505, |
| "valid_targets_mean": 5124.2, |
| "valid_targets_min": 2981 |
| }, |
| { |
| "epoch": 2.3410852713178296, |
| "grad_norm": 0.41364685765156334, |
| "learning_rate": 3.368395124735459e-05, |
| "loss": 0.1893, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16633863747119904, |
| "step": 1510, |
| "valid_targets_mean": 3882.1, |
| "valid_targets_min": 282 |
| }, |
| { |
| "epoch": 2.3488372093023258, |
| "grad_norm": 0.35667587906507076, |
| "learning_rate": 3.3627458446073775e-05, |
| "loss": 0.1673, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13330259919166565, |
| "step": 1515, |
| "valid_targets_mean": 5481.6, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 2.356589147286822, |
| "grad_norm": 0.3881816160616292, |
| "learning_rate": 3.357076195914221e-05, |
| "loss": 0.1789, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18566307425498962, |
| "step": 1520, |
| "valid_targets_mean": 5012.3, |
| "valid_targets_min": 1855 |
| }, |
| { |
| "epoch": 2.3643410852713176, |
| "grad_norm": 0.4712604845214267, |
| "learning_rate": 3.351386263398578e-05, |
| "loss": 0.1833, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19617591798305511, |
| "step": 1525, |
| "valid_targets_mean": 4073.4, |
| "valid_targets_min": 477 |
| }, |
| { |
| "epoch": 2.3720930232558137, |
| "grad_norm": 0.35048104567381255, |
| "learning_rate": 3.34567613210621e-05, |
| "loss": 0.1856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17707285284996033, |
| "step": 1530, |
| "valid_targets_mean": 5311.7, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 2.37984496124031, |
| "grad_norm": 0.41501213355240485, |
| "learning_rate": 3.3399458873847865e-05, |
| "loss": 0.1839, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18096289038658142, |
| "step": 1535, |
| "valid_targets_mean": 4257.4, |
| "valid_targets_min": 2687 |
| }, |
| { |
| "epoch": 2.387596899224806, |
| "grad_norm": 0.3935199588486319, |
| "learning_rate": 3.334195614882606e-05, |
| "loss": 0.2009, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23064912855625153, |
| "step": 1540, |
| "valid_targets_mean": 5280.2, |
| "valid_targets_min": 726 |
| }, |
| { |
| "epoch": 2.395348837209302, |
| "grad_norm": 0.39245757715509993, |
| "learning_rate": 3.3284254005473164e-05, |
| "loss": 0.1729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14799197018146515, |
| "step": 1545, |
| "valid_targets_mean": 4357.3, |
| "valid_targets_min": 365 |
| }, |
| { |
| "epoch": 2.4031007751937983, |
| "grad_norm": 0.3960910530726775, |
| "learning_rate": 3.3226353306246296e-05, |
| "loss": 0.1802, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16391268372535706, |
| "step": 1550, |
| "valid_targets_mean": 4675.7, |
| "valid_targets_min": 472 |
| }, |
| { |
| "epoch": 2.4108527131782944, |
| "grad_norm": 0.399983594538759, |
| "learning_rate": 3.316825491657033e-05, |
| "loss": 0.1814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18162378668785095, |
| "step": 1555, |
| "valid_targets_mean": 4586.7, |
| "valid_targets_min": 336 |
| }, |
| { |
| "epoch": 2.4186046511627906, |
| "grad_norm": 0.4339613073850326, |
| "learning_rate": 3.310995970482498e-05, |
| "loss": 0.1812, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18091610074043274, |
| "step": 1560, |
| "valid_targets_mean": 4878.5, |
| "valid_targets_min": 1433 |
| }, |
| { |
| "epoch": 2.4263565891472867, |
| "grad_norm": 0.40487359759812325, |
| "learning_rate": 3.3051468542331784e-05, |
| "loss": 0.1959, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17559471726417542, |
| "step": 1565, |
| "valid_targets_mean": 4204.3, |
| "valid_targets_min": 1999 |
| }, |
| { |
| "epoch": 2.434108527131783, |
| "grad_norm": 0.37204854898669026, |
| "learning_rate": 3.2992782303341104e-05, |
| "loss": 0.1642, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1342979371547699, |
| "step": 1570, |
| "valid_targets_mean": 4676.9, |
| "valid_targets_min": 720 |
| }, |
| { |
| "epoch": 2.441860465116279, |
| "grad_norm": 0.43162119589856907, |
| "learning_rate": 3.2933901865019064e-05, |
| "loss": 0.203, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2307354062795639, |
| "step": 1575, |
| "valid_targets_mean": 4931.0, |
| "valid_targets_min": 1914 |
| }, |
| { |
| "epoch": 2.449612403100775, |
| "grad_norm": 0.4576769904055123, |
| "learning_rate": 3.28748281074344e-05, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15882378816604614, |
| "step": 1580, |
| "valid_targets_mean": 3951.5, |
| "valid_targets_min": 1846 |
| }, |
| { |
| "epoch": 2.4573643410852712, |
| "grad_norm": 0.4015392257462172, |
| "learning_rate": 3.281556191354538e-05, |
| "loss": 0.1666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15286649763584137, |
| "step": 1585, |
| "valid_targets_mean": 5152.0, |
| "valid_targets_min": 285 |
| }, |
| { |
| "epoch": 2.4651162790697674, |
| "grad_norm": 0.42917005882818327, |
| "learning_rate": 3.2756104169186524e-05, |
| "loss": 0.1729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17661848664283752, |
| "step": 1590, |
| "valid_targets_mean": 4086.8, |
| "valid_targets_min": 568 |
| }, |
| { |
| "epoch": 2.4728682170542635, |
| "grad_norm": 0.4411320746574963, |
| "learning_rate": 3.269645576305541e-05, |
| "loss": 0.1927, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.184126615524292, |
| "step": 1595, |
| "valid_targets_mean": 6700.9, |
| "valid_targets_min": 2494 |
| }, |
| { |
| "epoch": 2.4806201550387597, |
| "grad_norm": 0.4047963399547679, |
| "learning_rate": 3.2636617586699375e-05, |
| "loss": 0.1773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16849125921726227, |
| "step": 1600, |
| "valid_targets_mean": 4574.2, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 2.488372093023256, |
| "grad_norm": 0.44245747159170795, |
| "learning_rate": 3.257659053450223e-05, |
| "loss": 0.188, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20396322011947632, |
| "step": 1605, |
| "valid_targets_mean": 4482.4, |
| "valid_targets_min": 380 |
| }, |
| { |
| "epoch": 2.496124031007752, |
| "grad_norm": 0.43654194588770506, |
| "learning_rate": 3.251637550367082e-05, |
| "loss": 0.1768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19797450304031372, |
| "step": 1610, |
| "valid_targets_mean": 4816.7, |
| "valid_targets_min": 2959 |
| }, |
| { |
| "epoch": 2.503875968992248, |
| "grad_norm": 0.43464122667550903, |
| "learning_rate": 3.245597339422165e-05, |
| "loss": 0.1815, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1967172473669052, |
| "step": 1615, |
| "valid_targets_mean": 5667.7, |
| "valid_targets_min": 559 |
| }, |
| { |
| "epoch": 2.511627906976744, |
| "grad_norm": 0.4652650203493568, |
| "learning_rate": 3.2395385108967486e-05, |
| "loss": 0.1801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19761139154434204, |
| "step": 1620, |
| "valid_targets_mean": 4328.9, |
| "valid_targets_min": 314 |
| }, |
| { |
| "epoch": 2.5193798449612403, |
| "grad_norm": 0.40709753507837126, |
| "learning_rate": 3.233461155350375e-05, |
| "loss": 0.1843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20508559048175812, |
| "step": 1625, |
| "valid_targets_mean": 5249.1, |
| "valid_targets_min": 216 |
| }, |
| { |
| "epoch": 2.5271317829457365, |
| "grad_norm": 0.4491598648675841, |
| "learning_rate": 3.227365363619507e-05, |
| "loss": 0.1918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1938488781452179, |
| "step": 1630, |
| "valid_targets_mean": 3739.8, |
| "valid_targets_min": 2192 |
| }, |
| { |
| "epoch": 2.5348837209302326, |
| "grad_norm": 0.4742827982147315, |
| "learning_rate": 3.221251226816168e-05, |
| "loss": 0.1906, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17324459552764893, |
| "step": 1635, |
| "valid_targets_mean": 3619.9, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 2.5426356589147288, |
| "grad_norm": 0.40634153675562273, |
| "learning_rate": 3.21511883632658e-05, |
| "loss": 0.1762, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17292270064353943, |
| "step": 1640, |
| "valid_targets_mean": 4721.2, |
| "valid_targets_min": 1866 |
| }, |
| { |
| "epoch": 2.550387596899225, |
| "grad_norm": 0.3502337789022322, |
| "learning_rate": 3.208968283809795e-05, |
| "loss": 0.1679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13709160685539246, |
| "step": 1645, |
| "valid_targets_mean": 5043.9, |
| "valid_targets_min": 1925 |
| }, |
| { |
| "epoch": 2.558139534883721, |
| "grad_norm": 0.46216095941040614, |
| "learning_rate": 3.202799661196331e-05, |
| "loss": 0.1881, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22641834616661072, |
| "step": 1650, |
| "valid_targets_mean": 4146.6, |
| "valid_targets_min": 419 |
| }, |
| { |
| "epoch": 2.565891472868217, |
| "grad_norm": 0.3770036373887086, |
| "learning_rate": 3.196613060686791e-05, |
| "loss": 0.2024, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19278298318386078, |
| "step": 1655, |
| "valid_targets_mean": 5648.9, |
| "valid_targets_min": 1948 |
| }, |
| { |
| "epoch": 2.5736434108527133, |
| "grad_norm": 0.3885989041243395, |
| "learning_rate": 3.1904085747504927e-05, |
| "loss": 0.179, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17080789804458618, |
| "step": 1660, |
| "valid_targets_mean": 4642.9, |
| "valid_targets_min": 357 |
| }, |
| { |
| "epoch": 2.5813953488372094, |
| "grad_norm": 0.4011197982513075, |
| "learning_rate": 3.184186296124077e-05, |
| "loss": 0.1885, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1865064799785614, |
| "step": 1665, |
| "valid_targets_mean": 5166.7, |
| "valid_targets_min": 330 |
| }, |
| { |
| "epoch": 2.5891472868217056, |
| "grad_norm": 0.3745953386421688, |
| "learning_rate": 3.1779463178101317e-05, |
| "loss": 0.1844, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17259354889392853, |
| "step": 1670, |
| "valid_targets_mean": 4452.9, |
| "valid_targets_min": 2554 |
| }, |
| { |
| "epoch": 2.5968992248062017, |
| "grad_norm": 0.4235759003308612, |
| "learning_rate": 3.1716887330757935e-05, |
| "loss": 0.1797, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17030495405197144, |
| "step": 1675, |
| "valid_targets_mean": 4332.0, |
| "valid_targets_min": 2478 |
| }, |
| { |
| "epoch": 2.604651162790698, |
| "grad_norm": 0.4854637458573741, |
| "learning_rate": 3.165413635451358e-05, |
| "loss": 0.1711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19602999091148376, |
| "step": 1680, |
| "valid_targets_mean": 3863.3, |
| "valid_targets_min": 355 |
| }, |
| { |
| "epoch": 2.612403100775194, |
| "grad_norm": 0.40699113598693853, |
| "learning_rate": 3.159121118728882e-05, |
| "loss": 0.1901, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18548724055290222, |
| "step": 1685, |
| "valid_targets_mean": 4666.2, |
| "valid_targets_min": 1840 |
| }, |
| { |
| "epoch": 2.62015503875969, |
| "grad_norm": 0.34544920663620954, |
| "learning_rate": 3.152811276960778e-05, |
| "loss": 0.1751, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14782579243183136, |
| "step": 1690, |
| "valid_targets_mean": 5451.3, |
| "valid_targets_min": 285 |
| }, |
| { |
| "epoch": 2.6279069767441863, |
| "grad_norm": 0.3927708940246696, |
| "learning_rate": 3.1464842044584134e-05, |
| "loss": 0.1937, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15799960494041443, |
| "step": 1695, |
| "valid_targets_mean": 5175.1, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 2.6356589147286824, |
| "grad_norm": 0.40704479344798744, |
| "learning_rate": 3.140139995790697e-05, |
| "loss": 0.1888, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21562063694000244, |
| "step": 1700, |
| "valid_targets_mean": 4840.2, |
| "valid_targets_min": 330 |
| }, |
| { |
| "epoch": 2.6434108527131785, |
| "grad_norm": 0.4492192562060312, |
| "learning_rate": 3.1337787457826676e-05, |
| "loss": 0.2064, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20294302701950073, |
| "step": 1705, |
| "valid_targets_mean": 4130.9, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 2.6511627906976747, |
| "grad_norm": 0.439737875037387, |
| "learning_rate": 3.127400549514075e-05, |
| "loss": 0.1844, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22795331478118896, |
| "step": 1710, |
| "valid_targets_mean": 4858.8, |
| "valid_targets_min": 566 |
| }, |
| { |
| "epoch": 2.6589147286821704, |
| "grad_norm": 0.3937483563358435, |
| "learning_rate": 3.121005502317961e-05, |
| "loss": 0.1773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14470066130161285, |
| "step": 1715, |
| "valid_targets_mean": 4338.8, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 2.6666666666666665, |
| "grad_norm": 0.43258662767772366, |
| "learning_rate": 3.114593699779233e-05, |
| "loss": 0.1793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18938937783241272, |
| "step": 1720, |
| "valid_targets_mean": 4000.3, |
| "valid_targets_min": 2352 |
| }, |
| { |
| "epoch": 2.6744186046511627, |
| "grad_norm": 0.38825080259416433, |
| "learning_rate": 3.108165237733235e-05, |
| "loss": 0.1896, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20304493606090546, |
| "step": 1725, |
| "valid_targets_mean": 5271.6, |
| "valid_targets_min": 2162 |
| }, |
| { |
| "epoch": 2.682170542635659, |
| "grad_norm": 0.5030719627542097, |
| "learning_rate": 3.101720212264315e-05, |
| "loss": 0.1836, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1815469115972519, |
| "step": 1730, |
| "valid_targets_mean": 3065.4, |
| "valid_targets_min": 304 |
| }, |
| { |
| "epoch": 2.689922480620155, |
| "grad_norm": 0.48074649750101905, |
| "learning_rate": 3.0952587197043916e-05, |
| "loss": 0.1565, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1928318440914154, |
| "step": 1735, |
| "valid_targets_mean": 3592.6, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 2.697674418604651, |
| "grad_norm": 0.38224384351415913, |
| "learning_rate": 3.0887808566315123e-05, |
| "loss": 0.1699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16647925972938538, |
| "step": 1740, |
| "valid_targets_mean": 4713.6, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 2.705426356589147, |
| "grad_norm": 0.33777469296551843, |
| "learning_rate": 3.0822867198684076e-05, |
| "loss": 0.1617, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15009137988090515, |
| "step": 1745, |
| "valid_targets_mean": 6850.4, |
| "valid_targets_min": 2445 |
| }, |
| { |
| "epoch": 2.7131782945736433, |
| "grad_norm": 0.44540770518271033, |
| "learning_rate": 3.075776406481048e-05, |
| "loss": 0.185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18640130758285522, |
| "step": 1750, |
| "valid_targets_mean": 4726.7, |
| "valid_targets_min": 1933 |
| }, |
| { |
| "epoch": 2.7209302325581395, |
| "grad_norm": 0.44372094538107276, |
| "learning_rate": 3.0692500137771926e-05, |
| "loss": 0.183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22654184699058533, |
| "step": 1755, |
| "valid_targets_mean": 3954.4, |
| "valid_targets_min": 606 |
| }, |
| { |
| "epoch": 2.7286821705426356, |
| "grad_norm": 0.369529532189345, |
| "learning_rate": 3.062707639304928e-05, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17843511700630188, |
| "step": 1760, |
| "valid_targets_mean": 5725.1, |
| "valid_targets_min": 1885 |
| }, |
| { |
| "epoch": 2.7364341085271318, |
| "grad_norm": 0.40621309446299825, |
| "learning_rate": 3.0561493808512216e-05, |
| "loss": 0.1589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21624553203582764, |
| "step": 1765, |
| "valid_targets_mean": 4932.4, |
| "valid_targets_min": 2437 |
| }, |
| { |
| "epoch": 2.744186046511628, |
| "grad_norm": 0.4324605534368406, |
| "learning_rate": 3.0495753364404513e-05, |
| "loss": 0.1693, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1789764165878296, |
| "step": 1770, |
| "valid_targets_mean": 4427.4, |
| "valid_targets_min": 1030 |
| }, |
| { |
| "epoch": 2.751937984496124, |
| "grad_norm": 0.44772637547939986, |
| "learning_rate": 3.042985604332943e-05, |
| "loss": 0.1807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21675977110862732, |
| "step": 1775, |
| "valid_targets_mean": 4327.5, |
| "valid_targets_min": 783 |
| }, |
| { |
| "epoch": 2.75968992248062, |
| "grad_norm": 0.3320961105254609, |
| "learning_rate": 3.036380283023502e-05, |
| "loss": 0.1697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15626108646392822, |
| "step": 1780, |
| "valid_targets_mean": 5396.8, |
| "valid_targets_min": 646 |
| }, |
| { |
| "epoch": 2.7674418604651163, |
| "grad_norm": 0.37789640533310415, |
| "learning_rate": 3.0297594712399428e-05, |
| "loss": 0.1933, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15670335292816162, |
| "step": 1785, |
| "valid_targets_mean": 4688.8, |
| "valid_targets_min": 527 |
| }, |
| { |
| "epoch": 2.7751937984496124, |
| "grad_norm": 0.40427238608967736, |
| "learning_rate": 3.0231232679416088e-05, |
| "loss": 0.1932, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2058807611465454, |
| "step": 1790, |
| "valid_targets_mean": 4991.1, |
| "valid_targets_min": 2320 |
| }, |
| { |
| "epoch": 2.7829457364341086, |
| "grad_norm": 0.3958864673220442, |
| "learning_rate": 3.0164717723178976e-05, |
| "loss": 0.1758, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1790355145931244, |
| "step": 1795, |
| "valid_targets_mean": 4758.6, |
| "valid_targets_min": 623 |
| }, |
| { |
| "epoch": 2.7906976744186047, |
| "grad_norm": 0.3482330544899987, |
| "learning_rate": 3.0098050837867755e-05, |
| "loss": 0.183, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15739408135414124, |
| "step": 1800, |
| "valid_targets_mean": 5299.1, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 2.798449612403101, |
| "grad_norm": 0.41439611401362086, |
| "learning_rate": 3.003123301993295e-05, |
| "loss": 0.171, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16220103204250336, |
| "step": 1805, |
| "valid_targets_mean": 4676.3, |
| "valid_targets_min": 1825 |
| }, |
| { |
| "epoch": 2.806201550387597, |
| "grad_norm": 0.41973002932333475, |
| "learning_rate": 2.9964265268081e-05, |
| "loss": 0.1814, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15398794412612915, |
| "step": 1810, |
| "valid_targets_mean": 3951.7, |
| "valid_targets_min": 308 |
| }, |
| { |
| "epoch": 2.813953488372093, |
| "grad_norm": 0.41316632273979337, |
| "learning_rate": 2.9897148583259386e-05, |
| "loss": 0.1996, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21641714870929718, |
| "step": 1815, |
| "valid_targets_mean": 4523.2, |
| "valid_targets_min": 630 |
| }, |
| { |
| "epoch": 2.8217054263565893, |
| "grad_norm": 0.44522140399389565, |
| "learning_rate": 2.982988396864165e-05, |
| "loss": 0.1832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18898218870162964, |
| "step": 1820, |
| "valid_targets_mean": 4400.8, |
| "valid_targets_min": 996 |
| }, |
| { |
| "epoch": 2.8294573643410854, |
| "grad_norm": 0.3738531998626034, |
| "learning_rate": 2.9762472429612375e-05, |
| "loss": 0.1813, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15361550450325012, |
| "step": 1825, |
| "valid_targets_mean": 4821.5, |
| "valid_targets_min": 978 |
| }, |
| { |
| "epoch": 2.8372093023255816, |
| "grad_norm": 0.43083740204233706, |
| "learning_rate": 2.9694914973752194e-05, |
| "loss": 0.1722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1844104826450348, |
| "step": 1830, |
| "valid_targets_mean": 3693.3, |
| "valid_targets_min": 527 |
| }, |
| { |
| "epoch": 2.8449612403100772, |
| "grad_norm": 0.3659912670375286, |
| "learning_rate": 2.962721261082272e-05, |
| "loss": 0.1889, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20017662644386292, |
| "step": 1835, |
| "valid_targets_mean": 6980.4, |
| "valid_targets_min": 3136 |
| }, |
| { |
| "epoch": 2.8527131782945734, |
| "grad_norm": 0.4567000170536253, |
| "learning_rate": 2.9559366352751445e-05, |
| "loss": 0.1919, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23465114831924438, |
| "step": 1840, |
| "valid_targets_mean": 4588.8, |
| "valid_targets_min": 2486 |
| }, |
| { |
| "epoch": 2.8604651162790695, |
| "grad_norm": 0.40929029223114577, |
| "learning_rate": 2.9491377213616618e-05, |
| "loss": 0.1747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18239933252334595, |
| "step": 1845, |
| "valid_targets_mean": 4133.6, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 2.8682170542635657, |
| "grad_norm": 0.40525101121640406, |
| "learning_rate": 2.94232462096321e-05, |
| "loss": 0.1865, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1767432689666748, |
| "step": 1850, |
| "valid_targets_mean": 4216.1, |
| "valid_targets_min": 516 |
| }, |
| { |
| "epoch": 2.875968992248062, |
| "grad_norm": 0.4366325773783958, |
| "learning_rate": 2.9354974359132135e-05, |
| "loss": 0.1826, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19949214160442352, |
| "step": 1855, |
| "valid_targets_mean": 4033.6, |
| "valid_targets_min": 1922 |
| }, |
| { |
| "epoch": 2.883720930232558, |
| "grad_norm": 0.42935985240712937, |
| "learning_rate": 2.92865626825562e-05, |
| "loss": 0.1783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18675842881202698, |
| "step": 1860, |
| "valid_targets_mean": 4010.4, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 2.891472868217054, |
| "grad_norm": 0.31457168919286277, |
| "learning_rate": 2.921801220243368e-05, |
| "loss": 0.1585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13208898901939392, |
| "step": 1865, |
| "valid_targets_mean": 6431.9, |
| "valid_targets_min": 2510 |
| }, |
| { |
| "epoch": 2.89922480620155, |
| "grad_norm": 0.39154537620319585, |
| "learning_rate": 2.9149323943368635e-05, |
| "loss": 0.1779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15021896362304688, |
| "step": 1870, |
| "valid_targets_mean": 5320.4, |
| "valid_targets_min": 2104 |
| }, |
| { |
| "epoch": 2.9069767441860463, |
| "grad_norm": 0.4215081843896084, |
| "learning_rate": 2.9080498932024462e-05, |
| "loss": 0.1708, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19808581471443176, |
| "step": 1875, |
| "valid_targets_mean": 4261.8, |
| "valid_targets_min": 434 |
| }, |
| { |
| "epoch": 2.9147286821705425, |
| "grad_norm": 0.48180287200478444, |
| "learning_rate": 2.901153819710855e-05, |
| "loss": 0.1831, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20577339828014374, |
| "step": 1880, |
| "valid_targets_mean": 3915.2, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 2.9224806201550386, |
| "grad_norm": 0.4046284897843421, |
| "learning_rate": 2.8942442769356896e-05, |
| "loss": 0.1648, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20008404552936554, |
| "step": 1885, |
| "valid_targets_mean": 5054.2, |
| "valid_targets_min": 2545 |
| }, |
| { |
| "epoch": 2.9302325581395348, |
| "grad_norm": 0.3202021785981192, |
| "learning_rate": 2.8873213681518747e-05, |
| "loss": 0.1676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14765912294387817, |
| "step": 1890, |
| "valid_targets_mean": 5971.2, |
| "valid_targets_min": 1835 |
| }, |
| { |
| "epoch": 2.937984496124031, |
| "grad_norm": 0.3975741557425795, |
| "learning_rate": 2.8803851968341092e-05, |
| "loss": 0.1965, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17159457504749298, |
| "step": 1895, |
| "valid_targets_mean": 4565.2, |
| "valid_targets_min": 1942 |
| }, |
| { |
| "epoch": 2.945736434108527, |
| "grad_norm": 0.46251815005036806, |
| "learning_rate": 2.873435866655326e-05, |
| "loss": 0.1843, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24192339181900024, |
| "step": 1900, |
| "valid_targets_mean": 4237.6, |
| "valid_targets_min": 326 |
| }, |
| { |
| "epoch": 2.953488372093023, |
| "grad_norm": 0.41403119618696854, |
| "learning_rate": 2.8664734814851377e-05, |
| "loss": 0.1783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18902885913848877, |
| "step": 1905, |
| "valid_targets_mean": 4557.3, |
| "valid_targets_min": 849 |
| }, |
| { |
| "epoch": 2.9612403100775193, |
| "grad_norm": 0.44851409111675167, |
| "learning_rate": 2.8594981453882874e-05, |
| "loss": 0.1656, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20263975858688354, |
| "step": 1910, |
| "valid_targets_mean": 3717.8, |
| "valid_targets_min": 926 |
| }, |
| { |
| "epoch": 2.9689922480620154, |
| "grad_norm": 0.42903678457431993, |
| "learning_rate": 2.85250996262309e-05, |
| "loss": 0.1957, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23578867316246033, |
| "step": 1915, |
| "valid_targets_mean": 4934.7, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 2.9767441860465116, |
| "grad_norm": 0.7267563478310851, |
| "learning_rate": 2.8455090376398783e-05, |
| "loss": 0.1792, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18642187118530273, |
| "step": 1920, |
| "valid_targets_mean": 4939.8, |
| "valid_targets_min": 2461 |
| }, |
| { |
| "epoch": 2.9844961240310077, |
| "grad_norm": 0.45652911775394833, |
| "learning_rate": 2.8384954750794383e-05, |
| "loss": 0.1679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1863420158624649, |
| "step": 1925, |
| "valid_targets_mean": 4101.9, |
| "valid_targets_min": 386 |
| }, |
| { |
| "epoch": 2.992248062015504, |
| "grad_norm": 0.4162197137776795, |
| "learning_rate": 2.8314693797714453e-05, |
| "loss": 0.1786, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16806048154830933, |
| "step": 1930, |
| "valid_targets_mean": 3889.9, |
| "valid_targets_min": 266 |
| }, |
| { |
| "epoch": 3.0, |
| "grad_norm": 0.4173426583399949, |
| "learning_rate": 2.8244308567328995e-05, |
| "loss": 0.1705, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1593976765871048, |
| "step": 1935, |
| "valid_targets_mean": 3841.9, |
| "valid_targets_min": 725 |
| }, |
| { |
| "epoch": 3.007751937984496, |
| "grad_norm": 0.31143453647713937, |
| "learning_rate": 2.8173800111665534e-05, |
| "loss": 0.1603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1310623288154602, |
| "step": 1940, |
| "valid_targets_mean": 6594.8, |
| "valid_targets_min": 3125 |
| }, |
| { |
| "epoch": 3.0155038759689923, |
| "grad_norm": 0.37798360065942155, |
| "learning_rate": 2.8103169484593408e-05, |
| "loss": 0.1671, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14523474872112274, |
| "step": 1945, |
| "valid_targets_mean": 4545.6, |
| "valid_targets_min": 391 |
| }, |
| { |
| "epoch": 3.0232558139534884, |
| "grad_norm": 0.4193657818911918, |
| "learning_rate": 2.8032417741808026e-05, |
| "loss": 0.1825, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19101709127426147, |
| "step": 1950, |
| "valid_targets_mean": 4638.9, |
| "valid_targets_min": 1098 |
| }, |
| { |
| "epoch": 3.0310077519379846, |
| "grad_norm": 0.4292392293342452, |
| "learning_rate": 2.7961545940815073e-05, |
| "loss": 0.1683, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14101950824260712, |
| "step": 1955, |
| "valid_targets_mean": 4463.8, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 3.0387596899224807, |
| "grad_norm": 0.445566159385126, |
| "learning_rate": 2.7890555140914712e-05, |
| "loss": 0.1761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15082740783691406, |
| "step": 1960, |
| "valid_targets_mean": 4373.4, |
| "valid_targets_min": 196 |
| }, |
| { |
| "epoch": 3.046511627906977, |
| "grad_norm": 0.3879287131571122, |
| "learning_rate": 2.7819446403185737e-05, |
| "loss": 0.1633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.155793234705925, |
| "step": 1965, |
| "valid_targets_mean": 4823.5, |
| "valid_targets_min": 424 |
| }, |
| { |
| "epoch": 3.054263565891473, |
| "grad_norm": 0.4580658977138339, |
| "learning_rate": 2.774822079046973e-05, |
| "loss": 0.1615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1928856372833252, |
| "step": 1970, |
| "valid_targets_mean": 4411.8, |
| "valid_targets_min": 994 |
| }, |
| { |
| "epoch": 3.062015503875969, |
| "grad_norm": 0.37791164078529926, |
| "learning_rate": 2.7676879367355182e-05, |
| "loss": 0.1947, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22396092116832733, |
| "step": 1975, |
| "valid_targets_mean": 6053.8, |
| "valid_targets_min": 341 |
| }, |
| { |
| "epoch": 3.0697674418604652, |
| "grad_norm": 0.5813711025395043, |
| "learning_rate": 2.7605423200161544e-05, |
| "loss": 0.1766, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20629319548606873, |
| "step": 1980, |
| "valid_targets_mean": 2834.8, |
| "valid_targets_min": 594 |
| }, |
| { |
| "epoch": 3.0775193798449614, |
| "grad_norm": 0.5229150181707595, |
| "learning_rate": 2.753385335692334e-05, |
| "loss": 0.1801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19532498717308044, |
| "step": 1985, |
| "valid_targets_mean": 5435.9, |
| "valid_targets_min": 2333 |
| }, |
| { |
| "epoch": 3.0852713178294575, |
| "grad_norm": 0.5039292916210872, |
| "learning_rate": 2.7462170907374152e-05, |
| "loss": 0.2046, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2393975555896759, |
| "step": 1990, |
| "valid_targets_mean": 3852.1, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 3.0930232558139537, |
| "grad_norm": 0.4334986389248226, |
| "learning_rate": 2.7390376922930676e-05, |
| "loss": 0.1536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2017873227596283, |
| "step": 1995, |
| "valid_targets_mean": 4789.2, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 3.10077519379845, |
| "grad_norm": 0.48940426768725165, |
| "learning_rate": 2.7318472476676678e-05, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20767296850681305, |
| "step": 2000, |
| "valid_targets_mean": 4572.1, |
| "valid_targets_min": 564 |
| }, |
| { |
| "epoch": 3.108527131782946, |
| "grad_norm": 0.45021483225829007, |
| "learning_rate": 2.7246458643346954e-05, |
| "loss": 0.1722, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19874969124794006, |
| "step": 2005, |
| "valid_targets_mean": 4382.3, |
| "valid_targets_min": 400 |
| }, |
| { |
| "epoch": 3.116279069767442, |
| "grad_norm": 0.39974386281581625, |
| "learning_rate": 2.7174336499311306e-05, |
| "loss": 0.1615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15649522840976715, |
| "step": 2010, |
| "valid_targets_mean": 4884.1, |
| "valid_targets_min": 1197 |
| }, |
| { |
| "epoch": 3.124031007751938, |
| "grad_norm": 0.4810534052770901, |
| "learning_rate": 2.7102107122558388e-05, |
| "loss": 0.1697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.196878120303154, |
| "step": 2015, |
| "valid_targets_mean": 4465.6, |
| "valid_targets_min": 422 |
| }, |
| { |
| "epoch": 3.1317829457364343, |
| "grad_norm": 0.4405420076380904, |
| "learning_rate": 2.7029771592679667e-05, |
| "loss": 0.1832, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2112666368484497, |
| "step": 2020, |
| "valid_targets_mean": 4233.7, |
| "valid_targets_min": 2211 |
| }, |
| { |
| "epoch": 3.13953488372093, |
| "grad_norm": 0.435544733463545, |
| "learning_rate": 2.695733099085322e-05, |
| "loss": 0.1738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1643523871898651, |
| "step": 2025, |
| "valid_targets_mean": 4607.8, |
| "valid_targets_min": 313 |
| }, |
| { |
| "epoch": 3.147286821705426, |
| "grad_norm": 0.39286659071704916, |
| "learning_rate": 2.6884786399827617e-05, |
| "loss": 0.1654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1477556824684143, |
| "step": 2030, |
| "valid_targets_mean": 4724.6, |
| "valid_targets_min": 1978 |
| }, |
| { |
| "epoch": 3.1550387596899223, |
| "grad_norm": 0.3724002460323432, |
| "learning_rate": 2.6812138903905725e-05, |
| "loss": 0.1646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16990327835083008, |
| "step": 2035, |
| "valid_targets_mean": 4912.9, |
| "valid_targets_min": 2789 |
| }, |
| { |
| "epoch": 3.1627906976744184, |
| "grad_norm": 0.3944253467485725, |
| "learning_rate": 2.6739389588928496e-05, |
| "loss": 0.1538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15294812619686127, |
| "step": 2040, |
| "valid_targets_mean": 4411.3, |
| "valid_targets_min": 470 |
| }, |
| { |
| "epoch": 3.1705426356589146, |
| "grad_norm": 0.4077204261905621, |
| "learning_rate": 2.6666539542258742e-05, |
| "loss": 0.1918, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2099585086107254, |
| "step": 2045, |
| "valid_targets_mean": 5898.4, |
| "valid_targets_min": 2703 |
| }, |
| { |
| "epoch": 3.1782945736434107, |
| "grad_norm": 0.3700464997656355, |
| "learning_rate": 2.6593589852764886e-05, |
| "loss": 0.1866, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17447850108146667, |
| "step": 2050, |
| "valid_targets_mean": 5101.3, |
| "valid_targets_min": 242 |
| }, |
| { |
| "epoch": 3.186046511627907, |
| "grad_norm": 0.4095360723042356, |
| "learning_rate": 2.6520541610804688e-05, |
| "loss": 0.1655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18860718607902527, |
| "step": 2055, |
| "valid_targets_mean": 4771.2, |
| "valid_targets_min": 2471 |
| }, |
| { |
| "epoch": 3.193798449612403, |
| "grad_norm": 0.42170127535958324, |
| "learning_rate": 2.6447395908208933e-05, |
| "loss": 0.1719, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19056911766529083, |
| "step": 2060, |
| "valid_targets_mean": 4609.7, |
| "valid_targets_min": 487 |
| }, |
| { |
| "epoch": 3.201550387596899, |
| "grad_norm": 0.3731793258953492, |
| "learning_rate": 2.6374153838265117e-05, |
| "loss": 0.1551, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14581088721752167, |
| "step": 2065, |
| "valid_targets_mean": 4326.2, |
| "valid_targets_min": 282 |
| }, |
| { |
| "epoch": 3.2093023255813953, |
| "grad_norm": 0.39762533461899896, |
| "learning_rate": 2.6300816495701124e-05, |
| "loss": 0.1697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15880948305130005, |
| "step": 2070, |
| "valid_targets_mean": 4789.0, |
| "valid_targets_min": 1925 |
| }, |
| { |
| "epoch": 3.2170542635658914, |
| "grad_norm": 0.44748063624921613, |
| "learning_rate": 2.6227384976668848e-05, |
| "loss": 0.1763, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.170176699757576, |
| "step": 2075, |
| "valid_targets_mean": 3995.2, |
| "valid_targets_min": 1668 |
| }, |
| { |
| "epoch": 3.2248062015503876, |
| "grad_norm": 0.36135621157101455, |
| "learning_rate": 2.6153860378727805e-05, |
| "loss": 0.1568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1492878496646881, |
| "step": 2080, |
| "valid_targets_mean": 4992.2, |
| "valid_targets_min": 330 |
| }, |
| { |
| "epoch": 3.2325581395348837, |
| "grad_norm": 0.4154124841987222, |
| "learning_rate": 2.6080243800828742e-05, |
| "loss": 0.1655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17003397643566132, |
| "step": 2085, |
| "valid_targets_mean": 4658.8, |
| "valid_targets_min": 1209 |
| }, |
| { |
| "epoch": 3.24031007751938, |
| "grad_norm": 0.37368780763861736, |
| "learning_rate": 2.600653634329719e-05, |
| "loss": 0.1793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1633392572402954, |
| "step": 2090, |
| "valid_targets_mean": 4566.2, |
| "valid_targets_min": 2411 |
| }, |
| { |
| "epoch": 3.248062015503876, |
| "grad_norm": 0.3979676356096421, |
| "learning_rate": 2.593273910781705e-05, |
| "loss": 0.1634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17785364389419556, |
| "step": 2095, |
| "valid_targets_mean": 4691.6, |
| "valid_targets_min": 432 |
| }, |
| { |
| "epoch": 3.255813953488372, |
| "grad_norm": 0.4225515784722321, |
| "learning_rate": 2.585885319741409e-05, |
| "loss": 0.1782, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18224605917930603, |
| "step": 2100, |
| "valid_targets_mean": 4253.3, |
| "valid_targets_min": 756 |
| }, |
| { |
| "epoch": 3.2635658914728682, |
| "grad_norm": 0.38016881244736056, |
| "learning_rate": 2.5784879716439495e-05, |
| "loss": 0.1527, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12859958410263062, |
| "step": 2105, |
| "valid_targets_mean": 3910.2, |
| "valid_targets_min": 549 |
| }, |
| { |
| "epoch": 3.2713178294573644, |
| "grad_norm": 0.5201402499872219, |
| "learning_rate": 2.5710819770553322e-05, |
| "loss": 0.1521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15190503001213074, |
| "step": 2110, |
| "valid_targets_mean": 4282.5, |
| "valid_targets_min": 460 |
| }, |
| { |
| "epoch": 3.2790697674418605, |
| "grad_norm": 0.36744579209677214, |
| "learning_rate": 2.5636674466708002e-05, |
| "loss": 0.1595, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14565041661262512, |
| "step": 2115, |
| "valid_targets_mean": 4384.2, |
| "valid_targets_min": 328 |
| }, |
| { |
| "epoch": 3.2868217054263567, |
| "grad_norm": 0.41793705033807765, |
| "learning_rate": 2.5562444913131802e-05, |
| "loss": 0.1838, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16959373652935028, |
| "step": 2120, |
| "valid_targets_mean": 4006.3, |
| "valid_targets_min": 412 |
| }, |
| { |
| "epoch": 3.294573643410853, |
| "grad_norm": 0.4168288113393459, |
| "learning_rate": 2.548813221931221e-05, |
| "loss": 0.1637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15278933942317963, |
| "step": 2125, |
| "valid_targets_mean": 4835.8, |
| "valid_targets_min": 1716 |
| }, |
| { |
| "epoch": 3.302325581395349, |
| "grad_norm": 0.43979678843894293, |
| "learning_rate": 2.5413737495979426e-05, |
| "loss": 0.1674, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16088305413722992, |
| "step": 2130, |
| "valid_targets_mean": 4291.2, |
| "valid_targets_min": 2104 |
| }, |
| { |
| "epoch": 3.310077519379845, |
| "grad_norm": 0.3934052531036587, |
| "learning_rate": 2.5339261855089694e-05, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15298032760620117, |
| "step": 2135, |
| "valid_targets_mean": 4588.1, |
| "valid_targets_min": 329 |
| }, |
| { |
| "epoch": 3.317829457364341, |
| "grad_norm": 0.36169781906861537, |
| "learning_rate": 2.5264706409808725e-05, |
| "loss": 0.1795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16061750054359436, |
| "step": 2140, |
| "valid_targets_mean": 5402.7, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 3.3255813953488373, |
| "grad_norm": 0.4010813470774762, |
| "learning_rate": 2.5190072274495028e-05, |
| "loss": 0.1711, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1538451462984085, |
| "step": 2145, |
| "valid_targets_mean": 4433.6, |
| "valid_targets_min": 339 |
| }, |
| { |
| "epoch": 3.3333333333333335, |
| "grad_norm": 0.3582230333794788, |
| "learning_rate": 2.511536056468328e-05, |
| "loss": 0.1496, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13346490263938904, |
| "step": 2150, |
| "valid_targets_mean": 4958.1, |
| "valid_targets_min": 676 |
| }, |
| { |
| "epoch": 3.3410852713178296, |
| "grad_norm": 0.4020066100217078, |
| "learning_rate": 2.5040572397067645e-05, |
| "loss": 0.1679, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19228683412075043, |
| "step": 2155, |
| "valid_targets_mean": 5232.5, |
| "valid_targets_min": 760 |
| }, |
| { |
| "epoch": 3.3488372093023258, |
| "grad_norm": 0.3855313842797188, |
| "learning_rate": 2.4965708889485062e-05, |
| "loss": 0.1718, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17724131047725677, |
| "step": 2160, |
| "valid_targets_mean": 4920.0, |
| "valid_targets_min": 1946 |
| }, |
| { |
| "epoch": 3.356589147286822, |
| "grad_norm": 0.4532744687578762, |
| "learning_rate": 2.489077116089858e-05, |
| "loss": 0.1914, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22503584623336792, |
| "step": 2165, |
| "valid_targets_mean": 4651.2, |
| "valid_targets_min": 272 |
| }, |
| { |
| "epoch": 3.3643410852713176, |
| "grad_norm": 0.4366754770288092, |
| "learning_rate": 2.4815760331380578e-05, |
| "loss": 0.1911, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2072749137878418, |
| "step": 2170, |
| "valid_targets_mean": 4974.6, |
| "valid_targets_min": 450 |
| }, |
| { |
| "epoch": 3.3720930232558137, |
| "grad_norm": 0.5215057560813444, |
| "learning_rate": 2.4740677522096078e-05, |
| "loss": 0.1689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2247978001832962, |
| "step": 2175, |
| "valid_targets_mean": 3434.2, |
| "valid_targets_min": 352 |
| }, |
| { |
| "epoch": 3.37984496124031, |
| "grad_norm": 0.43695153967165795, |
| "learning_rate": 2.4665523855285954e-05, |
| "loss": 0.163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1621866375207901, |
| "step": 2180, |
| "valid_targets_mean": 3792.3, |
| "valid_targets_min": 364 |
| }, |
| { |
| "epoch": 3.387596899224806, |
| "grad_norm": 0.40940303711183107, |
| "learning_rate": 2.4590300454250164e-05, |
| "loss": 0.1444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14481836557388306, |
| "step": 2185, |
| "valid_targets_mean": 4906.2, |
| "valid_targets_min": 2115 |
| }, |
| { |
| "epoch": 3.395348837209302, |
| "grad_norm": 0.41242022872473294, |
| "learning_rate": 2.4515008443330963e-05, |
| "loss": 0.1706, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16337113082408905, |
| "step": 2190, |
| "valid_targets_mean": 4234.1, |
| "valid_targets_min": 339 |
| }, |
| { |
| "epoch": 3.4031007751937983, |
| "grad_norm": 0.34565747520342643, |
| "learning_rate": 2.4439648947896103e-05, |
| "loss": 0.1771, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14244988560676575, |
| "step": 2195, |
| "valid_targets_mean": 5911.4, |
| "valid_targets_min": 216 |
| }, |
| { |
| "epoch": 3.4108527131782944, |
| "grad_norm": 0.47813710313391616, |
| "learning_rate": 2.4364223094322004e-05, |
| "loss": 0.1674, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16893121600151062, |
| "step": 2200, |
| "valid_targets_mean": 4232.1, |
| "valid_targets_min": 284 |
| }, |
| { |
| "epoch": 3.4186046511627906, |
| "grad_norm": 0.41110932893026, |
| "learning_rate": 2.4288732009976928e-05, |
| "loss": 0.1566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14816223084926605, |
| "step": 2205, |
| "valid_targets_mean": 4381.5, |
| "valid_targets_min": 2163 |
| }, |
| { |
| "epoch": 3.4263565891472867, |
| "grad_norm": 0.4329916569520111, |
| "learning_rate": 2.4213176823204103e-05, |
| "loss": 0.1709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15532240271568298, |
| "step": 2210, |
| "valid_targets_mean": 3792.0, |
| "valid_targets_min": 575 |
| }, |
| { |
| "epoch": 3.434108527131783, |
| "grad_norm": 0.47293777686859195, |
| "learning_rate": 2.4137558663304907e-05, |
| "loss": 0.1868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17490163445472717, |
| "step": 2215, |
| "valid_targets_mean": 4627.6, |
| "valid_targets_min": 304 |
| }, |
| { |
| "epoch": 3.441860465116279, |
| "grad_norm": 0.42026578348250343, |
| "learning_rate": 2.4061878660521927e-05, |
| "loss": 0.1764, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14874975383281708, |
| "step": 2220, |
| "valid_targets_mean": 3723.0, |
| "valid_targets_min": 2346 |
| }, |
| { |
| "epoch": 3.449612403100775, |
| "grad_norm": 0.5448600259555658, |
| "learning_rate": 2.3986137946022132e-05, |
| "loss": 0.1755, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.23847255110740662, |
| "step": 2225, |
| "valid_targets_mean": 3648.1, |
| "valid_targets_min": 556 |
| }, |
| { |
| "epoch": 3.4573643410852712, |
| "grad_norm": 0.3526959052609803, |
| "learning_rate": 2.3910337651879902e-05, |
| "loss": 0.1745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15136197209358215, |
| "step": 2230, |
| "valid_targets_mean": 5305.6, |
| "valid_targets_min": 632 |
| }, |
| { |
| "epoch": 3.4651162790697674, |
| "grad_norm": 0.4609105179523114, |
| "learning_rate": 2.3834478911060144e-05, |
| "loss": 0.1824, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1996048092842102, |
| "step": 2235, |
| "valid_targets_mean": 4194.4, |
| "valid_targets_min": 628 |
| }, |
| { |
| "epoch": 3.4728682170542635, |
| "grad_norm": 0.3632917288631249, |
| "learning_rate": 2.3758562857401365e-05, |
| "loss": 0.1818, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14042022824287415, |
| "step": 2240, |
| "valid_targets_mean": 4892.4, |
| "valid_targets_min": 431 |
| }, |
| { |
| "epoch": 3.4806201550387597, |
| "grad_norm": 0.3596297602071797, |
| "learning_rate": 2.3682590625598682e-05, |
| "loss": 0.1664, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1568746566772461, |
| "step": 2245, |
| "valid_targets_mean": 5468.7, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 3.488372093023256, |
| "grad_norm": 0.36656096196128835, |
| "learning_rate": 2.360656335118692e-05, |
| "loss": 0.1764, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15595552325248718, |
| "step": 2250, |
| "valid_targets_mean": 4770.1, |
| "valid_targets_min": 330 |
| }, |
| { |
| "epoch": 3.496124031007752, |
| "grad_norm": 0.4048396000613103, |
| "learning_rate": 2.3530482170523604e-05, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2218673974275589, |
| "step": 2255, |
| "valid_targets_mean": 4977.7, |
| "valid_targets_min": 346 |
| }, |
| { |
| "epoch": 3.503875968992248, |
| "grad_norm": 0.4120002351387735, |
| "learning_rate": 2.3454348220771966e-05, |
| "loss": 0.1876, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1626529097557068, |
| "step": 2260, |
| "valid_targets_mean": 4942.2, |
| "valid_targets_min": 1938 |
| }, |
| { |
| "epoch": 3.511627906976744, |
| "grad_norm": 0.46155281185784397, |
| "learning_rate": 2.337816263988397e-05, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2315581887960434, |
| "step": 2265, |
| "valid_targets_mean": 5495.6, |
| "valid_targets_min": 1092 |
| }, |
| { |
| "epoch": 3.5193798449612403, |
| "grad_norm": 0.4144849480419605, |
| "learning_rate": 2.3301926566583292e-05, |
| "loss": 0.1816, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.166578471660614, |
| "step": 2270, |
| "valid_targets_mean": 4457.1, |
| "valid_targets_min": 2280 |
| }, |
| { |
| "epoch": 3.5271317829457365, |
| "grad_norm": 0.4109601135912686, |
| "learning_rate": 2.3225641140348306e-05, |
| "loss": 0.1701, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17378325760364532, |
| "step": 2275, |
| "valid_targets_mean": 4608.7, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 3.5348837209302326, |
| "grad_norm": 0.4582644976154119, |
| "learning_rate": 2.3149307501395056e-05, |
| "loss": 0.1446, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15773174166679382, |
| "step": 2280, |
| "valid_targets_mean": 4992.6, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 3.5426356589147288, |
| "grad_norm": 0.46360151480816175, |
| "learning_rate": 2.3072926790660203e-05, |
| "loss": 0.1964, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20285546779632568, |
| "step": 2285, |
| "valid_targets_mean": 4078.0, |
| "valid_targets_min": 532 |
| }, |
| { |
| "epoch": 3.550387596899225, |
| "grad_norm": 0.4408826537960868, |
| "learning_rate": 2.2996500149783973e-05, |
| "loss": 0.1868, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13840195536613464, |
| "step": 2290, |
| "valid_targets_mean": 4301.3, |
| "valid_targets_min": 606 |
| }, |
| { |
| "epoch": 3.558139534883721, |
| "grad_norm": 0.41302173935323416, |
| "learning_rate": 2.292002872109309e-05, |
| "loss": 0.1806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19090792536735535, |
| "step": 2295, |
| "valid_targets_mean": 4607.9, |
| "valid_targets_min": 1945 |
| }, |
| { |
| "epoch": 3.565891472868217, |
| "grad_norm": 0.48709929421908504, |
| "learning_rate": 2.284351364758373e-05, |
| "loss": 0.1747, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16162961721420288, |
| "step": 2300, |
| "valid_targets_mean": 2969.8, |
| "valid_targets_min": 411 |
| }, |
| { |
| "epoch": 3.5736434108527133, |
| "grad_norm": 0.34907911319518736, |
| "learning_rate": 2.2766956072904397e-05, |
| "loss": 0.1637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16097891330718994, |
| "step": 2305, |
| "valid_targets_mean": 5617.7, |
| "valid_targets_min": 343 |
| }, |
| { |
| "epoch": 3.5813953488372094, |
| "grad_norm": 0.41643473859763513, |
| "learning_rate": 2.2690357141338853e-05, |
| "loss": 0.1923, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16287288069725037, |
| "step": 2310, |
| "valid_targets_mean": 4270.3, |
| "valid_targets_min": 1388 |
| }, |
| { |
| "epoch": 3.5891472868217056, |
| "grad_norm": 0.36847179752276477, |
| "learning_rate": 2.2613717997789016e-05, |
| "loss": 0.1762, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1488853245973587, |
| "step": 2315, |
| "valid_targets_mean": 4785.6, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 3.5968992248062017, |
| "grad_norm": 0.41943679729107547, |
| "learning_rate": 2.2537039787757817e-05, |
| "loss": 0.1956, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19536623358726501, |
| "step": 2320, |
| "valid_targets_mean": 4583.6, |
| "valid_targets_min": 2379 |
| }, |
| { |
| "epoch": 3.604651162790698, |
| "grad_norm": 0.3773107032307372, |
| "learning_rate": 2.2460323657332138e-05, |
| "loss": 0.1756, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13412323594093323, |
| "step": 2325, |
| "valid_targets_mean": 4938.5, |
| "valid_targets_min": 766 |
| }, |
| { |
| "epoch": 3.612403100775194, |
| "grad_norm": 0.41099143457360815, |
| "learning_rate": 2.2383570753165615e-05, |
| "loss": 0.1752, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.146214097738266, |
| "step": 2330, |
| "valid_targets_mean": 4063.8, |
| "valid_targets_min": 520 |
| }, |
| { |
| "epoch": 3.62015503875969, |
| "grad_norm": 0.3494048218491353, |
| "learning_rate": 2.2306782222461547e-05, |
| "loss": 0.16, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1244577169418335, |
| "step": 2335, |
| "valid_targets_mean": 4674.1, |
| "valid_targets_min": 516 |
| }, |
| { |
| "epoch": 3.6279069767441863, |
| "grad_norm": 0.4137755237450408, |
| "learning_rate": 2.2229959212955735e-05, |
| "loss": 0.1557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1691616028547287, |
| "step": 2340, |
| "valid_targets_mean": 4078.2, |
| "valid_targets_min": 957 |
| }, |
| { |
| "epoch": 3.6356589147286824, |
| "grad_norm": 0.41202438782783035, |
| "learning_rate": 2.2153102872899313e-05, |
| "loss": 0.181, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19243177771568298, |
| "step": 2345, |
| "valid_targets_mean": 5443.7, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 3.6434108527131785, |
| "grad_norm": 0.4168252301471801, |
| "learning_rate": 2.20762143510416e-05, |
| "loss": 0.1601, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1762881577014923, |
| "step": 2350, |
| "valid_targets_mean": 4094.8, |
| "valid_targets_min": 436 |
| }, |
| { |
| "epoch": 3.6511627906976747, |
| "grad_norm": 0.3658382509380567, |
| "learning_rate": 2.1999294796612926e-05, |
| "loss": 0.1635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13929161429405212, |
| "step": 2355, |
| "valid_targets_mean": 5087.1, |
| "valid_targets_min": 2622 |
| }, |
| { |
| "epoch": 3.6589147286821704, |
| "grad_norm": 0.806554291125336, |
| "learning_rate": 2.1922345359307468e-05, |
| "loss": 0.1862, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.24180075526237488, |
| "step": 2360, |
| "valid_targets_mean": 3961.2, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 3.6666666666666665, |
| "grad_norm": 0.4010351294747989, |
| "learning_rate": 2.184536718926604e-05, |
| "loss": 0.1856, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15781967341899872, |
| "step": 2365, |
| "valid_targets_mean": 4302.3, |
| "valid_targets_min": 481 |
| }, |
| { |
| "epoch": 3.6744186046511627, |
| "grad_norm": 0.4910349746865378, |
| "learning_rate": 2.1768361437058924e-05, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15803927183151245, |
| "step": 2370, |
| "valid_targets_mean": 5285.8, |
| "valid_targets_min": 1922 |
| }, |
| { |
| "epoch": 3.682170542635659, |
| "grad_norm": 0.5033930845464233, |
| "learning_rate": 2.1691329253668657e-05, |
| "loss": 0.1773, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16929282248020172, |
| "step": 2375, |
| "valid_targets_mean": 3518.6, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 3.689922480620155, |
| "grad_norm": 0.4812536807942641, |
| "learning_rate": 2.1614271790472835e-05, |
| "loss": 0.1666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16329653561115265, |
| "step": 2380, |
| "valid_targets_mean": 3963.1, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 3.697674418604651, |
| "grad_norm": 0.4106493741878364, |
| "learning_rate": 2.1537190199226917e-05, |
| "loss": 0.1822, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15833979845046997, |
| "step": 2385, |
| "valid_targets_mean": 4434.0, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 3.705426356589147, |
| "grad_norm": 0.42703025254446647, |
| "learning_rate": 2.1460085632046983e-05, |
| "loss": 0.1842, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19955435395240784, |
| "step": 2390, |
| "valid_targets_mean": 4425.7, |
| "valid_targets_min": 268 |
| }, |
| { |
| "epoch": 3.7131782945736433, |
| "grad_norm": 0.3400275265721782, |
| "learning_rate": 2.138295924139253e-05, |
| "loss": 0.1584, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13872955739498138, |
| "step": 2395, |
| "valid_targets_mean": 5467.9, |
| "valid_targets_min": 319 |
| }, |
| { |
| "epoch": 3.7209302325581395, |
| "grad_norm": 0.3682059763421827, |
| "learning_rate": 2.1305812180049258e-05, |
| "loss": 0.1697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14761081337928772, |
| "step": 2400, |
| "valid_targets_mean": 5667.8, |
| "valid_targets_min": 2894 |
| }, |
| { |
| "epoch": 3.7286821705426356, |
| "grad_norm": 0.3974454201846236, |
| "learning_rate": 2.12286456011118e-05, |
| "loss": 0.1629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18874874711036682, |
| "step": 2405, |
| "valid_targets_mean": 5224.0, |
| "valid_targets_min": 3081 |
| }, |
| { |
| "epoch": 3.7364341085271318, |
| "grad_norm": 0.39427590403656537, |
| "learning_rate": 2.1151460657966543e-05, |
| "loss": 0.1731, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14733751118183136, |
| "step": 2410, |
| "valid_targets_mean": 4060.3, |
| "valid_targets_min": 2348 |
| }, |
| { |
| "epoch": 3.744186046511628, |
| "grad_norm": 0.4347000971418473, |
| "learning_rate": 2.1074258504274324e-05, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16277927160263062, |
| "step": 2415, |
| "valid_targets_mean": 4161.8, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 3.751937984496124, |
| "grad_norm": 0.46642613155184653, |
| "learning_rate": 2.099704029395325e-05, |
| "loss": 0.1635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17865529656410217, |
| "step": 2420, |
| "valid_targets_mean": 3506.7, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 3.75968992248062, |
| "grad_norm": 0.36926786871608897, |
| "learning_rate": 2.0919807181161413e-05, |
| "loss": 0.182, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1872124969959259, |
| "step": 2425, |
| "valid_targets_mean": 5992.2, |
| "valid_targets_min": 2637 |
| }, |
| { |
| "epoch": 3.7674418604651163, |
| "grad_norm": 0.40797959752050406, |
| "learning_rate": 2.0842560320279647e-05, |
| "loss": 0.1795, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13483797013759613, |
| "step": 2430, |
| "valid_targets_mean": 3735.1, |
| "valid_targets_min": 396 |
| }, |
| { |
| "epoch": 3.7751937984496124, |
| "grad_norm": 0.3569093694297914, |
| "learning_rate": 2.0765300865894273e-05, |
| "loss": 0.1709, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16950270533561707, |
| "step": 2435, |
| "valid_targets_mean": 5004.4, |
| "valid_targets_min": 341 |
| }, |
| { |
| "epoch": 3.7829457364341086, |
| "grad_norm": 0.489744210232547, |
| "learning_rate": 2.068802997277984e-05, |
| "loss": 0.1676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14903788268566132, |
| "step": 2440, |
| "valid_targets_mean": 4375.1, |
| "valid_targets_min": 613 |
| }, |
| { |
| "epoch": 3.7906976744186047, |
| "grad_norm": 0.4631630261801319, |
| "learning_rate": 2.061074879588187e-05, |
| "loss": 0.1761, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17495691776275635, |
| "step": 2445, |
| "valid_targets_mean": 4443.9, |
| "valid_targets_min": 2333 |
| }, |
| { |
| "epoch": 3.798449612403101, |
| "grad_norm": 0.381627105046557, |
| "learning_rate": 2.0533458490299608e-05, |
| "loss": 0.172, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19416113197803497, |
| "step": 2450, |
| "valid_targets_mean": 5910.8, |
| "valid_targets_min": 813 |
| }, |
| { |
| "epoch": 3.806201550387597, |
| "grad_norm": 0.3672369381288124, |
| "learning_rate": 2.0456160211268726e-05, |
| "loss": 0.1523, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15462546050548553, |
| "step": 2455, |
| "valid_targets_mean": 4590.2, |
| "valid_targets_min": 425 |
| }, |
| { |
| "epoch": 3.813953488372093, |
| "grad_norm": 0.36355092211128553, |
| "learning_rate": 2.037885511414408e-05, |
| "loss": 0.1685, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1489698588848114, |
| "step": 2460, |
| "valid_targets_mean": 4814.1, |
| "valid_targets_min": 250 |
| }, |
| { |
| "epoch": 3.8217054263565893, |
| "grad_norm": 0.5834913333456886, |
| "learning_rate": 2.030154435438243e-05, |
| "loss": 0.1806, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17469245195388794, |
| "step": 2465, |
| "valid_targets_mean": 4683.1, |
| "valid_targets_min": 227 |
| }, |
| { |
| "epoch": 3.8294573643410854, |
| "grad_norm": 0.3750569957368585, |
| "learning_rate": 2.0224229087525176e-05, |
| "loss": 0.1638, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16605322062969208, |
| "step": 2470, |
| "valid_targets_mean": 5050.2, |
| "valid_targets_min": 2206 |
| }, |
| { |
| "epoch": 3.8372093023255816, |
| "grad_norm": 0.4159111267532109, |
| "learning_rate": 2.0146910469181083e-05, |
| "loss": 0.1798, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16885146498680115, |
| "step": 2475, |
| "valid_targets_mean": 4601.3, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 3.8449612403100772, |
| "grad_norm": 0.3729264179998901, |
| "learning_rate": 2.006958965500901e-05, |
| "loss": 0.1699, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15141122043132782, |
| "step": 2480, |
| "valid_targets_mean": 4849.9, |
| "valid_targets_min": 2352 |
| }, |
| { |
| "epoch": 3.8527131782945734, |
| "grad_norm": 0.5766276206946744, |
| "learning_rate": 1.9992267800700643e-05, |
| "loss": 0.1783, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19176653027534485, |
| "step": 2485, |
| "valid_targets_mean": 3846.1, |
| "valid_targets_min": 731 |
| }, |
| { |
| "epoch": 3.8604651162790695, |
| "grad_norm": 0.3706800726667539, |
| "learning_rate": 1.991494606196321e-05, |
| "loss": 0.1515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1340998411178589, |
| "step": 2490, |
| "valid_targets_mean": 4474.6, |
| "valid_targets_min": 269 |
| }, |
| { |
| "epoch": 3.8682170542635657, |
| "grad_norm": 0.44584862226366007, |
| "learning_rate": 1.98376255945022e-05, |
| "loss": 0.1778, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16283494234085083, |
| "step": 2495, |
| "valid_targets_mean": 4311.2, |
| "valid_targets_min": 1115 |
| }, |
| { |
| "epoch": 3.875968992248062, |
| "grad_norm": 0.3592938976849822, |
| "learning_rate": 1.9760307554004122e-05, |
| "loss": 0.1524, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18098889291286469, |
| "step": 2500, |
| "valid_targets_mean": 5765.5, |
| "valid_targets_min": 528 |
| }, |
| { |
| "epoch": 3.883720930232558, |
| "grad_norm": 0.4223273599027322, |
| "learning_rate": 1.9682993096119197e-05, |
| "loss": 0.1693, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16485443711280823, |
| "step": 2505, |
| "valid_targets_mean": 4137.4, |
| "valid_targets_min": 901 |
| }, |
| { |
| "epoch": 3.891472868217054, |
| "grad_norm": 0.4448395910223574, |
| "learning_rate": 1.9605683376444086e-05, |
| "loss": 0.1817, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1999254673719406, |
| "step": 2510, |
| "valid_targets_mean": 3733.8, |
| "valid_targets_min": 266 |
| }, |
| { |
| "epoch": 3.89922480620155, |
| "grad_norm": 0.44711782753625473, |
| "learning_rate": 1.9528379550504663e-05, |
| "loss": 0.1975, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2123761773109436, |
| "step": 2515, |
| "valid_targets_mean": 3842.1, |
| "valid_targets_min": 489 |
| }, |
| { |
| "epoch": 3.9069767441860463, |
| "grad_norm": 0.3585629672419737, |
| "learning_rate": 1.945108277373869e-05, |
| "loss": 0.1668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16551396250724792, |
| "step": 2520, |
| "valid_targets_mean": 5320.1, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 3.9147286821705425, |
| "grad_norm": 0.38593055920198166, |
| "learning_rate": 1.9373794201478554e-05, |
| "loss": 0.1681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17138083279132843, |
| "step": 2525, |
| "valid_targets_mean": 4754.8, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 3.9224806201550386, |
| "grad_norm": 0.34993836610858403, |
| "learning_rate": 1.9296514988934018e-05, |
| "loss": 0.1532, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13611240684986115, |
| "step": 2530, |
| "valid_targets_mean": 4849.8, |
| "valid_targets_min": 299 |
| }, |
| { |
| "epoch": 3.9302325581395348, |
| "grad_norm": 0.38998762581393137, |
| "learning_rate": 1.921924629117498e-05, |
| "loss": 0.169, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16259539127349854, |
| "step": 2535, |
| "valid_targets_mean": 4528.8, |
| "valid_targets_min": 1955 |
| }, |
| { |
| "epoch": 3.937984496124031, |
| "grad_norm": 0.4406751870739783, |
| "learning_rate": 1.9141989263114136e-05, |
| "loss": 0.185, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1572207659482956, |
| "step": 2540, |
| "valid_targets_mean": 3975.7, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 3.945736434108527, |
| "grad_norm": 0.45031010235314506, |
| "learning_rate": 1.9064745059489774e-05, |
| "loss": 0.1841, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1765103042125702, |
| "step": 2545, |
| "valid_targets_mean": 3726.0, |
| "valid_targets_min": 282 |
| }, |
| { |
| "epoch": 3.953488372093023, |
| "grad_norm": 0.6078467791119643, |
| "learning_rate": 1.8987514834848503e-05, |
| "loss": 0.1611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17429549992084503, |
| "step": 2550, |
| "valid_targets_mean": 3989.9, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 3.9612403100775193, |
| "grad_norm": 0.3631710161577126, |
| "learning_rate": 1.8910299743527993e-05, |
| "loss": 0.1697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1885673701763153, |
| "step": 2555, |
| "valid_targets_mean": 5834.6, |
| "valid_targets_min": 585 |
| }, |
| { |
| "epoch": 3.9689922480620154, |
| "grad_norm": 0.49167632435325864, |
| "learning_rate": 1.8833100939639694e-05, |
| "loss": 0.1624, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20458854734897614, |
| "step": 2560, |
| "valid_targets_mean": 3560.4, |
| "valid_targets_min": 419 |
| }, |
| { |
| "epoch": 3.9767441860465116, |
| "grad_norm": 0.3634420862575136, |
| "learning_rate": 1.875591957705166e-05, |
| "loss": 0.1785, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13289107382297516, |
| "step": 2565, |
| "valid_targets_mean": 5413.6, |
| "valid_targets_min": 1805 |
| }, |
| { |
| "epoch": 3.9844961240310077, |
| "grad_norm": 0.4586334241085507, |
| "learning_rate": 1.867875680937122e-05, |
| "loss": 0.1691, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2052847146987915, |
| "step": 2570, |
| "valid_targets_mean": 4061.1, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 3.992248062015504, |
| "grad_norm": 0.43210061293605817, |
| "learning_rate": 1.860161378992778e-05, |
| "loss": 0.1779, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2044166624546051, |
| "step": 2575, |
| "valid_targets_mean": 4605.4, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 4.0, |
| "grad_norm": 0.37276933625985337, |
| "learning_rate": 1.8524491671755563e-05, |
| "loss": 0.1763, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1616727113723755, |
| "step": 2580, |
| "valid_targets_mean": 5067.4, |
| "valid_targets_min": 527 |
| }, |
| { |
| "epoch": 4.007751937984496, |
| "grad_norm": 0.36563074448629657, |
| "learning_rate": 1.8447391607576416e-05, |
| "loss": 0.1441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13933786749839783, |
| "step": 2585, |
| "valid_targets_mean": 4913.7, |
| "valid_targets_min": 740 |
| }, |
| { |
| "epoch": 4.015503875968992, |
| "grad_norm": 0.4772926288066321, |
| "learning_rate": 1.8370314749782524e-05, |
| "loss": 0.1581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18599829077720642, |
| "step": 2590, |
| "valid_targets_mean": 4072.6, |
| "valid_targets_min": 666 |
| }, |
| { |
| "epoch": 4.023255813953488, |
| "grad_norm": 0.4964995939447069, |
| "learning_rate": 1.8293262250419215e-05, |
| "loss": 0.165, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16809843480587006, |
| "step": 2595, |
| "valid_targets_mean": 3508.6, |
| "valid_targets_min": 2368 |
| }, |
| { |
| "epoch": 4.0310077519379846, |
| "grad_norm": 0.5174597685405774, |
| "learning_rate": 1.8216235261167765e-05, |
| "loss": 0.1731, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2505348324775696, |
| "step": 2600, |
| "valid_targets_mean": 4262.7, |
| "valid_targets_min": 970 |
| }, |
| { |
| "epoch": 4.038759689922481, |
| "grad_norm": 0.40606990941323745, |
| "learning_rate": 1.8139234933328126e-05, |
| "loss": 0.1677, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.138991117477417, |
| "step": 2605, |
| "valid_targets_mean": 5074.9, |
| "valid_targets_min": 680 |
| }, |
| { |
| "epoch": 4.046511627906977, |
| "grad_norm": 0.4634993018273127, |
| "learning_rate": 1.8062262417801767e-05, |
| "loss": 0.1539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1454424411058426, |
| "step": 2610, |
| "valid_targets_mean": 4132.0, |
| "valid_targets_min": 315 |
| }, |
| { |
| "epoch": 4.054263565891473, |
| "grad_norm": 0.45594388080755227, |
| "learning_rate": 1.7985318865074445e-05, |
| "loss": 0.1558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13495397567749023, |
| "step": 2615, |
| "valid_targets_mean": 4592.6, |
| "valid_targets_min": 908 |
| }, |
| { |
| "epoch": 4.062015503875969, |
| "grad_norm": 0.3632193067972436, |
| "learning_rate": 1.790840542519903e-05, |
| "loss": 0.1581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14542677998542786, |
| "step": 2620, |
| "valid_targets_mean": 6443.2, |
| "valid_targets_min": 674 |
| }, |
| { |
| "epoch": 4.069767441860465, |
| "grad_norm": 0.4084216853540113, |
| "learning_rate": 1.7831523247778296e-05, |
| "loss": 0.1361, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15561866760253906, |
| "step": 2625, |
| "valid_targets_mean": 4696.6, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 4.077519379844961, |
| "grad_norm": 0.4622453535570728, |
| "learning_rate": 1.775467348194774e-05, |
| "loss": 0.1508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1541646271944046, |
| "step": 2630, |
| "valid_targets_mean": 4509.7, |
| "valid_targets_min": 585 |
| }, |
| { |
| "epoch": 4.0852713178294575, |
| "grad_norm": 0.36481781559899207, |
| "learning_rate": 1.767785727635843e-05, |
| "loss": 0.1445, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1567380130290985, |
| "step": 2635, |
| "valid_targets_mean": 6221.8, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 4.093023255813954, |
| "grad_norm": 0.3792078104165168, |
| "learning_rate": 1.7601075779159806e-05, |
| "loss": 0.1463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12530960142612457, |
| "step": 2640, |
| "valid_targets_mean": 4478.4, |
| "valid_targets_min": 361 |
| }, |
| { |
| "epoch": 4.10077519379845, |
| "grad_norm": 0.4219019340853787, |
| "learning_rate": 1.7524330137982524e-05, |
| "loss": 0.1563, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18058227002620697, |
| "step": 2645, |
| "valid_targets_mean": 4726.9, |
| "valid_targets_min": 2654 |
| }, |
| { |
| "epoch": 4.108527131782946, |
| "grad_norm": 0.42766284883408445, |
| "learning_rate": 1.7447621499921342e-05, |
| "loss": 0.1555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16935157775878906, |
| "step": 2650, |
| "valid_targets_mean": 4662.6, |
| "valid_targets_min": 2874 |
| }, |
| { |
| "epoch": 4.116279069767442, |
| "grad_norm": 0.4480590715700904, |
| "learning_rate": 1.7370951011517906e-05, |
| "loss": 0.159, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19573025405406952, |
| "step": 2655, |
| "valid_targets_mean": 4988.3, |
| "valid_targets_min": 887 |
| }, |
| { |
| "epoch": 4.124031007751938, |
| "grad_norm": 0.4647682503763762, |
| "learning_rate": 1.7294319818743677e-05, |
| "loss": 0.1599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1806863695383072, |
| "step": 2660, |
| "valid_targets_mean": 4018.7, |
| "valid_targets_min": 684 |
| }, |
| { |
| "epoch": 4.131782945736434, |
| "grad_norm": 0.33468042082332256, |
| "learning_rate": 1.7217729066982754e-05, |
| "loss": 0.1676, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13625994324684143, |
| "step": 2665, |
| "valid_targets_mean": 5762.8, |
| "valid_targets_min": 3241 |
| }, |
| { |
| "epoch": 4.1395348837209305, |
| "grad_norm": 0.35879066729195264, |
| "learning_rate": 1.7141179901014798e-05, |
| "loss": 0.151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1351138949394226, |
| "step": 2670, |
| "valid_targets_mean": 5373.6, |
| "valid_targets_min": 2492 |
| }, |
| { |
| "epoch": 4.147286821705427, |
| "grad_norm": 0.38289139539979355, |
| "learning_rate": 1.7064673464997885e-05, |
| "loss": 0.1507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14373061060905457, |
| "step": 2675, |
| "valid_targets_mean": 4701.4, |
| "valid_targets_min": 1523 |
| }, |
| { |
| "epoch": 4.155038759689923, |
| "grad_norm": 0.3514618484402962, |
| "learning_rate": 1.698821090245141e-05, |
| "loss": 0.1576, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12618312239646912, |
| "step": 2680, |
| "valid_targets_mean": 5099.0, |
| "valid_targets_min": 1436 |
| }, |
| { |
| "epoch": 4.162790697674419, |
| "grad_norm": 0.4029673695317988, |
| "learning_rate": 1.691179335623904e-05, |
| "loss": 0.151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15906205773353577, |
| "step": 2685, |
| "valid_targets_mean": 5508.1, |
| "valid_targets_min": 432 |
| }, |
| { |
| "epoch": 4.170542635658915, |
| "grad_norm": 0.4944425640026309, |
| "learning_rate": 1.6835421968551556e-05, |
| "loss": 0.1478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14945298433303833, |
| "step": 2690, |
| "valid_targets_mean": 3783.1, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 4.178294573643411, |
| "grad_norm": 0.4380361387817116, |
| "learning_rate": 1.675909788088984e-05, |
| "loss": 0.1737, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18563194572925568, |
| "step": 2695, |
| "valid_targets_mean": 4740.7, |
| "valid_targets_min": 2335 |
| }, |
| { |
| "epoch": 4.186046511627907, |
| "grad_norm": 0.4771028211600623, |
| "learning_rate": 1.6682822234047796e-05, |
| "loss": 0.1555, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1575438231229782, |
| "step": 2700, |
| "valid_targets_mean": 3456.6, |
| "valid_targets_min": 352 |
| }, |
| { |
| "epoch": 4.1937984496124034, |
| "grad_norm": 0.41423182041175527, |
| "learning_rate": 1.660659616809529e-05, |
| "loss": 0.1599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13387396931648254, |
| "step": 2705, |
| "valid_targets_mean": 4664.9, |
| "valid_targets_min": 1948 |
| }, |
| { |
| "epoch": 4.2015503875969, |
| "grad_norm": 0.530813584525465, |
| "learning_rate": 1.653042082236112e-05, |
| "loss": 0.1774, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.3004525601863861, |
| "step": 2710, |
| "valid_targets_mean": 4756.2, |
| "valid_targets_min": 332 |
| }, |
| { |
| "epoch": 4.209302325581396, |
| "grad_norm": 0.44640047447531017, |
| "learning_rate": 1.6454297335415975e-05, |
| "loss": 0.167, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1683686077594757, |
| "step": 2715, |
| "valid_targets_mean": 3983.3, |
| "valid_targets_min": 558 |
| }, |
| { |
| "epoch": 4.217054263565892, |
| "grad_norm": 0.4231137236979658, |
| "learning_rate": 1.6378226845055454e-05, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17019568383693695, |
| "step": 2720, |
| "valid_targets_mean": 4835.2, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 4.224806201550388, |
| "grad_norm": 0.386736159227142, |
| "learning_rate": 1.6302210488282993e-05, |
| "loss": 0.1633, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18334552645683289, |
| "step": 2725, |
| "valid_targets_mean": 5246.4, |
| "valid_targets_min": 479 |
| }, |
| { |
| "epoch": 4.232558139534884, |
| "grad_norm": 0.4229332730901514, |
| "learning_rate": 1.6226249401292932e-05, |
| "loss": 0.1447, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1335538774728775, |
| "step": 2730, |
| "valid_targets_mean": 4478.2, |
| "valid_targets_min": 265 |
| }, |
| { |
| "epoch": 4.24031007751938, |
| "grad_norm": 0.5239959011141749, |
| "learning_rate": 1.6150344719453513e-05, |
| "loss": 0.1599, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13435792922973633, |
| "step": 2735, |
| "valid_targets_mean": 4364.5, |
| "valid_targets_min": 389 |
| }, |
| { |
| "epoch": 4.248062015503876, |
| "grad_norm": 0.3585379143026963, |
| "learning_rate": 1.6074497577289893e-05, |
| "loss": 0.1428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12283202260732651, |
| "step": 2740, |
| "valid_targets_mean": 5174.9, |
| "valid_targets_min": 2143 |
| }, |
| { |
| "epoch": 4.2558139534883725, |
| "grad_norm": 0.41779854478657813, |
| "learning_rate": 1.599870910846721e-05, |
| "loss": 0.1634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13781797885894775, |
| "step": 2745, |
| "valid_targets_mean": 4340.5, |
| "valid_targets_min": 2348 |
| }, |
| { |
| "epoch": 4.263565891472869, |
| "grad_norm": 0.47639510138543717, |
| "learning_rate": 1.5922980445773618e-05, |
| "loss": 0.1688, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20977307856082916, |
| "step": 2750, |
| "valid_targets_mean": 4089.1, |
| "valid_targets_min": 570 |
| }, |
| { |
| "epoch": 4.271317829457364, |
| "grad_norm": 0.4321321807850601, |
| "learning_rate": 1.584731272110338e-05, |
| "loss": 0.1478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1279362142086029, |
| "step": 2755, |
| "valid_targets_mean": 4232.4, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 4.27906976744186, |
| "grad_norm": 0.4163782737967656, |
| "learning_rate": 1.5771707065439925e-05, |
| "loss": 0.1586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1572471261024475, |
| "step": 2760, |
| "valid_targets_mean": 4172.6, |
| "valid_targets_min": 362 |
| }, |
| { |
| "epoch": 4.286821705426356, |
| "grad_norm": 0.44476929142723237, |
| "learning_rate": 1.5696164608838957e-05, |
| "loss": 0.1492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12877783179283142, |
| "step": 2765, |
| "valid_targets_mean": 3667.2, |
| "valid_targets_min": 324 |
| }, |
| { |
| "epoch": 4.294573643410852, |
| "grad_norm": 0.44033521779323154, |
| "learning_rate": 1.5620686480411568e-05, |
| "loss": 0.1793, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1912871152162552, |
| "step": 2770, |
| "valid_targets_mean": 4556.9, |
| "valid_targets_min": 571 |
| }, |
| { |
| "epoch": 4.3023255813953485, |
| "grad_norm": 0.43835417771534674, |
| "learning_rate": 1.5545273808307358e-05, |
| "loss": 0.1762, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18065080046653748, |
| "step": 2775, |
| "valid_targets_mean": 4829.0, |
| "valid_targets_min": 701 |
| }, |
| { |
| "epoch": 4.310077519379845, |
| "grad_norm": 0.4359801265972791, |
| "learning_rate": 1.546992771969755e-05, |
| "loss": 0.1548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1816236674785614, |
| "step": 2780, |
| "valid_targets_mean": 4372.9, |
| "valid_targets_min": 313 |
| }, |
| { |
| "epoch": 4.317829457364341, |
| "grad_norm": 0.4410756401612138, |
| "learning_rate": 1.5394649340758184e-05, |
| "loss": 0.1483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15419849753379822, |
| "step": 2785, |
| "valid_targets_mean": 5035.1, |
| "valid_targets_min": 2134 |
| }, |
| { |
| "epoch": 4.325581395348837, |
| "grad_norm": 0.4559093303470707, |
| "learning_rate": 1.5319439796653258e-05, |
| "loss": 0.1586, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17408901453018188, |
| "step": 2790, |
| "valid_targets_mean": 4336.3, |
| "valid_targets_min": 1990 |
| }, |
| { |
| "epoch": 4.333333333333333, |
| "grad_norm": 0.3733614937743712, |
| "learning_rate": 1.5244300211517916e-05, |
| "loss": 0.1613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1421089917421341, |
| "step": 2795, |
| "valid_targets_mean": 4486.0, |
| "valid_targets_min": 266 |
| }, |
| { |
| "epoch": 4.341085271317829, |
| "grad_norm": 0.4384718248610877, |
| "learning_rate": 1.5169231708441625e-05, |
| "loss": 0.1641, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15485528111457825, |
| "step": 2800, |
| "valid_targets_mean": 4390.1, |
| "valid_targets_min": 458 |
| }, |
| { |
| "epoch": 4.348837209302325, |
| "grad_norm": 0.35486111522759517, |
| "learning_rate": 1.5094235409451452e-05, |
| "loss": 0.1567, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14936892688274384, |
| "step": 2805, |
| "valid_targets_mean": 5619.9, |
| "valid_targets_min": 2606 |
| }, |
| { |
| "epoch": 4.3565891472868215, |
| "grad_norm": 0.4641264262776539, |
| "learning_rate": 1.5019312435495215e-05, |
| "loss": 0.1681, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16389770805835724, |
| "step": 2810, |
| "valid_targets_mean": 4543.3, |
| "valid_targets_min": 531 |
| }, |
| { |
| "epoch": 4.364341085271318, |
| "grad_norm": 0.4095733450935873, |
| "learning_rate": 1.4944463906424773e-05, |
| "loss": 0.1602, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15087318420410156, |
| "step": 2815, |
| "valid_targets_mean": 5138.6, |
| "valid_targets_min": 2324 |
| }, |
| { |
| "epoch": 4.372093023255814, |
| "grad_norm": 0.43224144450256036, |
| "learning_rate": 1.486969094097929e-05, |
| "loss": 0.1864, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17015056312084198, |
| "step": 2820, |
| "valid_targets_mean": 4383.4, |
| "valid_targets_min": 196 |
| }, |
| { |
| "epoch": 4.37984496124031, |
| "grad_norm": 0.42039391089480094, |
| "learning_rate": 1.4794994656768485e-05, |
| "loss": 0.1835, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16320443153381348, |
| "step": 2825, |
| "valid_targets_mean": 4572.7, |
| "valid_targets_min": 1677 |
| }, |
| { |
| "epoch": 4.387596899224806, |
| "grad_norm": 0.4360528678353131, |
| "learning_rate": 1.4720376170255958e-05, |
| "loss": 0.1631, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17029808461666107, |
| "step": 2830, |
| "valid_targets_mean": 4660.2, |
| "valid_targets_min": 2294 |
| }, |
| { |
| "epoch": 4.395348837209302, |
| "grad_norm": 0.47146218786067823, |
| "learning_rate": 1.464583659674248e-05, |
| "loss": 0.1666, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19265028834342957, |
| "step": 2835, |
| "valid_targets_mean": 4134.2, |
| "valid_targets_min": 328 |
| }, |
| { |
| "epoch": 4.403100775193798, |
| "grad_norm": 0.44499692816713254, |
| "learning_rate": 1.4571377050349347e-05, |
| "loss": 0.1577, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16304971277713776, |
| "step": 2840, |
| "valid_targets_mean": 4391.5, |
| "valid_targets_min": 370 |
| }, |
| { |
| "epoch": 4.410852713178294, |
| "grad_norm": 0.46432590434836263, |
| "learning_rate": 1.44969986440017e-05, |
| "loss": 0.1707, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1540422886610031, |
| "step": 2845, |
| "valid_targets_mean": 4667.3, |
| "valid_targets_min": 335 |
| }, |
| { |
| "epoch": 4.4186046511627906, |
| "grad_norm": 0.4999077483071989, |
| "learning_rate": 1.4422702489411894e-05, |
| "loss": 0.162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18639114499092102, |
| "step": 2850, |
| "valid_targets_mean": 3962.9, |
| "valid_targets_min": 546 |
| }, |
| { |
| "epoch": 4.426356589147287, |
| "grad_norm": 0.405932784042207, |
| "learning_rate": 1.4348489697062925e-05, |
| "loss": 0.1603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1444004476070404, |
| "step": 2855, |
| "valid_targets_mean": 4650.3, |
| "valid_targets_min": 1526 |
| }, |
| { |
| "epoch": 4.434108527131783, |
| "grad_norm": 0.3934528365825335, |
| "learning_rate": 1.4274361376191767e-05, |
| "loss": 0.1516, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1553172767162323, |
| "step": 2860, |
| "valid_targets_mean": 5694.0, |
| "valid_targets_min": 2890 |
| }, |
| { |
| "epoch": 4.441860465116279, |
| "grad_norm": 0.40913794771831696, |
| "learning_rate": 1.420031863477283e-05, |
| "loss": 0.1581, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1494569182395935, |
| "step": 2865, |
| "valid_targets_mean": 4331.6, |
| "valid_targets_min": 319 |
| }, |
| { |
| "epoch": 4.449612403100775, |
| "grad_norm": 0.47285700783628626, |
| "learning_rate": 1.4126362579501401e-05, |
| "loss": 0.1612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15232403576374054, |
| "step": 2870, |
| "valid_targets_mean": 3542.6, |
| "valid_targets_min": 370 |
| }, |
| { |
| "epoch": 4.457364341085271, |
| "grad_norm": 0.4650848027329248, |
| "learning_rate": 1.4052494315777091e-05, |
| "loss": 0.1726, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1610431671142578, |
| "step": 2875, |
| "valid_targets_mean": 3635.2, |
| "valid_targets_min": 1079 |
| }, |
| { |
| "epoch": 4.465116279069767, |
| "grad_norm": 0.4653775809202961, |
| "learning_rate": 1.3978714947687308e-05, |
| "loss": 0.158, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20595189929008484, |
| "step": 2880, |
| "valid_targets_mean": 4235.9, |
| "valid_targets_min": 453 |
| }, |
| { |
| "epoch": 4.4728682170542635, |
| "grad_norm": 0.3856889005381559, |
| "learning_rate": 1.390502557799077e-05, |
| "loss": 0.1645, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14087346196174622, |
| "step": 2885, |
| "valid_targets_mean": 4527.4, |
| "valid_targets_min": 2189 |
| }, |
| { |
| "epoch": 4.48062015503876, |
| "grad_norm": 0.3945151120253326, |
| "learning_rate": 1.3831427308101021e-05, |
| "loss": 0.1623, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1581602394580841, |
| "step": 2890, |
| "valid_targets_mean": 4957.9, |
| "valid_targets_min": 1819 |
| }, |
| { |
| "epoch": 4.488372093023256, |
| "grad_norm": 0.40342280135663167, |
| "learning_rate": 1.375792123806996e-05, |
| "loss": 0.1669, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14058300852775574, |
| "step": 2895, |
| "valid_targets_mean": 4725.2, |
| "valid_targets_min": 643 |
| }, |
| { |
| "epoch": 4.496124031007752, |
| "grad_norm": 0.4036139924740885, |
| "learning_rate": 1.3684508466571385e-05, |
| "loss": 0.1639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18375971913337708, |
| "step": 2900, |
| "valid_targets_mean": 5136.7, |
| "valid_targets_min": 536 |
| }, |
| { |
| "epoch": 4.503875968992248, |
| "grad_norm": 0.5271710172062103, |
| "learning_rate": 1.3611190090884611e-05, |
| "loss": 0.1606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17250756919384003, |
| "step": 2905, |
| "valid_targets_mean": 3673.4, |
| "valid_targets_min": 249 |
| }, |
| { |
| "epoch": 4.511627906976744, |
| "grad_norm": 0.40659265968531066, |
| "learning_rate": 1.3537967206878036e-05, |
| "loss": 0.1541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15408380329608917, |
| "step": 2910, |
| "valid_targets_mean": 4791.4, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 4.51937984496124, |
| "grad_norm": 0.3722111335904797, |
| "learning_rate": 1.3464840908992768e-05, |
| "loss": 0.1553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12856316566467285, |
| "step": 2915, |
| "valid_targets_mean": 4795.7, |
| "valid_targets_min": 2420 |
| }, |
| { |
| "epoch": 4.5271317829457365, |
| "grad_norm": 0.4556137521413307, |
| "learning_rate": 1.3391812290226272e-05, |
| "loss": 0.187, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2201414704322815, |
| "step": 2920, |
| "valid_targets_mean": 4536.7, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 4.534883720930233, |
| "grad_norm": 0.4743449244975186, |
| "learning_rate": 1.3318882442116048e-05, |
| "loss": 0.1578, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21773910522460938, |
| "step": 2925, |
| "valid_targets_mean": 4512.2, |
| "valid_targets_min": 581 |
| }, |
| { |
| "epoch": 4.542635658914729, |
| "grad_norm": 0.47202078789113744, |
| "learning_rate": 1.3246052454723275e-05, |
| "loss": 0.1484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17931053042411804, |
| "step": 2930, |
| "valid_targets_mean": 4000.9, |
| "valid_targets_min": 683 |
| }, |
| { |
| "epoch": 4.550387596899225, |
| "grad_norm": 0.363075525223068, |
| "learning_rate": 1.3173323416616546e-05, |
| "loss": 0.1634, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1436081826686859, |
| "step": 2935, |
| "valid_targets_mean": 5052.1, |
| "valid_targets_min": 766 |
| }, |
| { |
| "epoch": 4.558139534883721, |
| "grad_norm": 0.4252120402864096, |
| "learning_rate": 1.310069641485562e-05, |
| "loss": 0.163, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1449616551399231, |
| "step": 2940, |
| "valid_targets_mean": 5067.6, |
| "valid_targets_min": 968 |
| }, |
| { |
| "epoch": 4.565891472868217, |
| "grad_norm": 0.41309349051810224, |
| "learning_rate": 1.3028172534975125e-05, |
| "loss": 0.1589, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15337392687797546, |
| "step": 2945, |
| "valid_targets_mean": 4410.0, |
| "valid_targets_min": 625 |
| }, |
| { |
| "epoch": 4.573643410852713, |
| "grad_norm": 0.5160731043484095, |
| "learning_rate": 1.2955752860968356e-05, |
| "loss": 0.1697, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1839904487133026, |
| "step": 2950, |
| "valid_targets_mean": 4195.2, |
| "valid_targets_min": 1004 |
| }, |
| { |
| "epoch": 4.5813953488372094, |
| "grad_norm": 0.39603413769839324, |
| "learning_rate": 1.2883438475271088e-05, |
| "loss": 0.1449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1449984461069107, |
| "step": 2955, |
| "valid_targets_mean": 4908.1, |
| "valid_targets_min": 1489 |
| }, |
| { |
| "epoch": 4.589147286821706, |
| "grad_norm": 0.4659985680055713, |
| "learning_rate": 1.2811230458745372e-05, |
| "loss": 0.1748, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21567106246948242, |
| "step": 2960, |
| "valid_targets_mean": 4454.5, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 4.596899224806202, |
| "grad_norm": 0.4523280898732182, |
| "learning_rate": 1.2739129890663386e-05, |
| "loss": 0.1546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15529918670654297, |
| "step": 2965, |
| "valid_targets_mean": 4419.5, |
| "valid_targets_min": 962 |
| }, |
| { |
| "epoch": 4.604651162790698, |
| "grad_norm": 0.3913593277889339, |
| "learning_rate": 1.266713784869131e-05, |
| "loss": 0.1801, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15807433426380157, |
| "step": 2970, |
| "valid_targets_mean": 4846.1, |
| "valid_targets_min": 734 |
| }, |
| { |
| "epoch": 4.612403100775194, |
| "grad_norm": 0.4182683219376584, |
| "learning_rate": 1.2595255408873232e-05, |
| "loss": 0.1507, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13988031446933746, |
| "step": 2975, |
| "valid_targets_mean": 4320.1, |
| "valid_targets_min": 523 |
| }, |
| { |
| "epoch": 4.62015503875969, |
| "grad_norm": 0.35362147101841246, |
| "learning_rate": 1.2523483645615031e-05, |
| "loss": 0.1435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11566026508808136, |
| "step": 2980, |
| "valid_targets_mean": 5738.1, |
| "valid_targets_min": 1805 |
| }, |
| { |
| "epoch": 4.627906976744186, |
| "grad_norm": 0.4359085932620926, |
| "learning_rate": 1.2451823631668333e-05, |
| "loss": 0.1734, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2180645763874054, |
| "step": 2985, |
| "valid_targets_mean": 5415.4, |
| "valid_targets_min": 1779 |
| }, |
| { |
| "epoch": 4.635658914728682, |
| "grad_norm": 0.4178432880182616, |
| "learning_rate": 1.2380276438114495e-05, |
| "loss": 0.1635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15357699990272522, |
| "step": 2990, |
| "valid_targets_mean": 3995.6, |
| "valid_targets_min": 921 |
| }, |
| { |
| "epoch": 4.6434108527131785, |
| "grad_norm": 0.3928742323402058, |
| "learning_rate": 1.2308843134348569e-05, |
| "loss": 0.1587, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14658121764659882, |
| "step": 2995, |
| "valid_targets_mean": 4797.7, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 4.651162790697675, |
| "grad_norm": 0.40724671685704517, |
| "learning_rate": 1.2237524788063335e-05, |
| "loss": 0.1494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13327175378799438, |
| "step": 3000, |
| "valid_targets_mean": 4289.8, |
| "valid_targets_min": 654 |
| }, |
| { |
| "epoch": 4.658914728682171, |
| "grad_norm": 0.38017870244977436, |
| "learning_rate": 1.2166322465233325e-05, |
| "loss": 0.1552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15827676653862, |
| "step": 3005, |
| "valid_targets_mean": 5934.4, |
| "valid_targets_min": 2154 |
| }, |
| { |
| "epoch": 4.666666666666667, |
| "grad_norm": 0.4241213390458187, |
| "learning_rate": 1.2095237230098925e-05, |
| "loss": 0.1513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15015850961208344, |
| "step": 3010, |
| "valid_targets_mean": 3942.2, |
| "valid_targets_min": 2726 |
| }, |
| { |
| "epoch": 4.674418604651163, |
| "grad_norm": 0.42983747059070593, |
| "learning_rate": 1.2024270145150428e-05, |
| "loss": 0.1529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1613459587097168, |
| "step": 3015, |
| "valid_targets_mean": 4662.0, |
| "valid_targets_min": 2112 |
| }, |
| { |
| "epoch": 4.682170542635659, |
| "grad_norm": 0.4541648568256799, |
| "learning_rate": 1.1953422271112171e-05, |
| "loss": 0.1533, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1784931868314743, |
| "step": 3020, |
| "valid_targets_mean": 4353.8, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 4.689922480620155, |
| "grad_norm": 0.37376376389283156, |
| "learning_rate": 1.1882694666926691e-05, |
| "loss": 0.1458, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10884034633636475, |
| "step": 3025, |
| "valid_targets_mean": 4409.1, |
| "valid_targets_min": 533 |
| }, |
| { |
| "epoch": 4.6976744186046515, |
| "grad_norm": 0.4214595584685805, |
| "learning_rate": 1.1812088389738875e-05, |
| "loss": 0.1558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21922525763511658, |
| "step": 3030, |
| "valid_targets_mean": 6067.9, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 4.705426356589148, |
| "grad_norm": 0.35642720118665594, |
| "learning_rate": 1.1741604494880177e-05, |
| "loss": 0.151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14536528289318085, |
| "step": 3035, |
| "valid_targets_mean": 5993.4, |
| "valid_targets_min": 752 |
| }, |
| { |
| "epoch": 4.713178294573644, |
| "grad_norm": 0.4788498710665514, |
| "learning_rate": 1.167124403585283e-05, |
| "loss": 0.1607, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16465994715690613, |
| "step": 3040, |
| "valid_targets_mean": 3857.6, |
| "valid_targets_min": 302 |
| }, |
| { |
| "epoch": 4.720930232558139, |
| "grad_norm": 0.46807401286424594, |
| "learning_rate": 1.1601008064314127e-05, |
| "loss": 0.1511, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17980757355690002, |
| "step": 3045, |
| "valid_targets_mean": 4050.8, |
| "valid_targets_min": 411 |
| }, |
| { |
| "epoch": 4.728682170542635, |
| "grad_norm": 0.3493024998293867, |
| "learning_rate": 1.1530897630060664e-05, |
| "loss": 0.1453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14402084052562714, |
| "step": 3050, |
| "valid_targets_mean": 5970.5, |
| "valid_targets_min": 3312 |
| }, |
| { |
| "epoch": 4.736434108527131, |
| "grad_norm": 1.1433311286570027, |
| "learning_rate": 1.146091378101267e-05, |
| "loss": 0.1612, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18359369039535522, |
| "step": 3055, |
| "valid_targets_mean": 5394.9, |
| "valid_targets_min": 2047 |
| }, |
| { |
| "epoch": 4.7441860465116275, |
| "grad_norm": 0.3656089625075003, |
| "learning_rate": 1.1391057563198352e-05, |
| "loss": 0.1568, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15548282861709595, |
| "step": 3060, |
| "valid_targets_mean": 5395.7, |
| "valid_targets_min": 1999 |
| }, |
| { |
| "epoch": 4.751937984496124, |
| "grad_norm": 0.3682957712457608, |
| "learning_rate": 1.1321330020738238e-05, |
| "loss": 0.1513, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12282656878232956, |
| "step": 3065, |
| "valid_targets_mean": 4505.5, |
| "valid_targets_min": 433 |
| }, |
| { |
| "epoch": 4.75968992248062, |
| "grad_norm": 0.41853152057960064, |
| "learning_rate": 1.1251732195829581e-05, |
| "loss": 0.1611, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13153740763664246, |
| "step": 3070, |
| "valid_targets_mean": 4470.2, |
| "valid_targets_min": 2352 |
| }, |
| { |
| "epoch": 4.767441860465116, |
| "grad_norm": 0.38423534152358596, |
| "learning_rate": 1.118226512873081e-05, |
| "loss": 0.1537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17503979802131653, |
| "step": 3075, |
| "valid_targets_mean": 4954.4, |
| "valid_targets_min": 307 |
| }, |
| { |
| "epoch": 4.775193798449612, |
| "grad_norm": 0.37157618329698217, |
| "learning_rate": 1.1112929857745924e-05, |
| "loss": 0.1463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13206711411476135, |
| "step": 3080, |
| "valid_targets_mean": 5568.5, |
| "valid_targets_min": 2292 |
| }, |
| { |
| "epoch": 4.782945736434108, |
| "grad_norm": 0.509246178657668, |
| "learning_rate": 1.1043727419209023e-05, |
| "loss": 0.1653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1961718052625656, |
| "step": 3085, |
| "valid_targets_mean": 3839.4, |
| "valid_targets_min": 266 |
| }, |
| { |
| "epoch": 4.790697674418604, |
| "grad_norm": 0.4608884016393757, |
| "learning_rate": 1.0974658847468775e-05, |
| "loss": 0.1639, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18118709325790405, |
| "step": 3090, |
| "valid_targets_mean": 4658.3, |
| "valid_targets_min": 609 |
| }, |
| { |
| "epoch": 4.7984496124031, |
| "grad_norm": 0.3407586601849243, |
| "learning_rate": 1.0905725174873021e-05, |
| "loss": 0.1508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13145892322063446, |
| "step": 3095, |
| "valid_targets_mean": 5481.1, |
| "valid_targets_min": 2463 |
| }, |
| { |
| "epoch": 4.8062015503875966, |
| "grad_norm": 0.44372721977998414, |
| "learning_rate": 1.0836927431753268e-05, |
| "loss": 0.1535, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1747463047504425, |
| "step": 3100, |
| "valid_targets_mean": 4381.4, |
| "valid_targets_min": 2634 |
| }, |
| { |
| "epoch": 4.813953488372093, |
| "grad_norm": 0.4313480237295467, |
| "learning_rate": 1.0768266646409331e-05, |
| "loss": 0.1725, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1479579210281372, |
| "step": 3105, |
| "valid_targets_mean": 3838.2, |
| "valid_targets_min": 558 |
| }, |
| { |
| "epoch": 4.821705426356589, |
| "grad_norm": 0.40712005319072236, |
| "learning_rate": 1.0699743845093977e-05, |
| "loss": 0.1807, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16829770803451538, |
| "step": 3110, |
| "valid_targets_mean": 5049.5, |
| "valid_targets_min": 635 |
| }, |
| { |
| "epoch": 4.829457364341085, |
| "grad_norm": 0.4038620874534929, |
| "learning_rate": 1.0631360051997545e-05, |
| "loss": 0.1504, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13558568060398102, |
| "step": 3115, |
| "valid_targets_mean": 4396.6, |
| "valid_targets_min": 477 |
| }, |
| { |
| "epoch": 4.837209302325581, |
| "grad_norm": 0.46074509090856464, |
| "learning_rate": 1.0563116289232664e-05, |
| "loss": 0.1389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13045081496238708, |
| "step": 3120, |
| "valid_targets_mean": 3530.9, |
| "valid_targets_min": 341 |
| }, |
| { |
| "epoch": 4.844961240310077, |
| "grad_norm": 0.43813490790924364, |
| "learning_rate": 1.0495013576818974e-05, |
| "loss": 0.1585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15511000156402588, |
| "step": 3125, |
| "valid_targets_mean": 4225.4, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 4.852713178294573, |
| "grad_norm": 0.4380047569329961, |
| "learning_rate": 1.0427052932667872e-05, |
| "loss": 0.1729, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19142797589302063, |
| "step": 3130, |
| "valid_targets_mean": 4649.4, |
| "valid_targets_min": 1866 |
| }, |
| { |
| "epoch": 4.8604651162790695, |
| "grad_norm": 0.3622958483592568, |
| "learning_rate": 1.0359235372567303e-05, |
| "loss": 0.1564, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16687515377998352, |
| "step": 3135, |
| "valid_targets_mean": 5099.6, |
| "valid_targets_min": 2400 |
| }, |
| { |
| "epoch": 4.868217054263566, |
| "grad_norm": 0.4538324825468118, |
| "learning_rate": 1.0291561910166575e-05, |
| "loss": 0.1508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1640026718378067, |
| "step": 3140, |
| "valid_targets_mean": 4020.4, |
| "valid_targets_min": 637 |
| }, |
| { |
| "epoch": 4.875968992248062, |
| "grad_norm": 0.3815270313643839, |
| "learning_rate": 1.0224033556961221e-05, |
| "loss": 0.1517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15679693222045898, |
| "step": 3145, |
| "valid_targets_mean": 5416.8, |
| "valid_targets_min": 2731 |
| }, |
| { |
| "epoch": 4.883720930232558, |
| "grad_norm": 0.37173879163162826, |
| "learning_rate": 1.0156651322277859e-05, |
| "loss": 0.1545, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15583065152168274, |
| "step": 3150, |
| "valid_targets_mean": 6000.7, |
| "valid_targets_min": 2168 |
| }, |
| { |
| "epoch": 4.891472868217054, |
| "grad_norm": 0.44542528707551793, |
| "learning_rate": 1.0089416213259109e-05, |
| "loss": 0.1655, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.2258930504322052, |
| "step": 3155, |
| "valid_targets_mean": 5374.3, |
| "valid_targets_min": 1335 |
| }, |
| { |
| "epoch": 4.89922480620155, |
| "grad_norm": 0.46872132575511044, |
| "learning_rate": 1.0022329234848568e-05, |
| "loss": 0.1745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20413146913051605, |
| "step": 3160, |
| "valid_targets_mean": 4518.1, |
| "valid_targets_min": 1923 |
| }, |
| { |
| "epoch": 4.906976744186046, |
| "grad_norm": 0.4064894961029224, |
| "learning_rate": 9.95539138977575e-06, |
| "loss": 0.1493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12033580243587494, |
| "step": 3165, |
| "valid_targets_mean": 4383.8, |
| "valid_targets_min": 606 |
| }, |
| { |
| "epoch": 4.9147286821705425, |
| "grad_norm": 0.3163430136720968, |
| "learning_rate": 9.88860367854112e-06, |
| "loss": 0.1449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14553579688072205, |
| "step": 3170, |
| "valid_targets_mean": 7166.2, |
| "valid_targets_min": 3325 |
| }, |
| { |
| "epoch": 4.922480620155039, |
| "grad_norm": 0.38091013274436497, |
| "learning_rate": 9.821967099401137e-06, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1597091257572174, |
| "step": 3175, |
| "valid_targets_mean": 5441.1, |
| "valid_targets_min": 1887 |
| }, |
| { |
| "epoch": 4.930232558139535, |
| "grad_norm": 0.34441694300189507, |
| "learning_rate": 9.755482648353335e-06, |
| "loss": 0.1646, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13708937168121338, |
| "step": 3180, |
| "valid_targets_mean": 5538.1, |
| "valid_targets_min": 2859 |
| }, |
| { |
| "epoch": 4.937984496124031, |
| "grad_norm": 0.37415077897828763, |
| "learning_rate": 9.689151319121433e-06, |
| "loss": 0.1629, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14037328958511353, |
| "step": 3185, |
| "valid_targets_mean": 5194.1, |
| "valid_targets_min": 2266 |
| }, |
| { |
| "epoch": 4.945736434108527, |
| "grad_norm": 0.44777782502419616, |
| "learning_rate": 9.62297410314047e-06, |
| "loss": 0.1678, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18096795678138733, |
| "step": 3190, |
| "valid_targets_mean": 4345.2, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 4.953488372093023, |
| "grad_norm": 0.38931181856536856, |
| "learning_rate": 9.556951989542032e-06, |
| "loss": 0.1541, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11744767427444458, |
| "step": 3195, |
| "valid_targets_mean": 4002.5, |
| "valid_targets_min": 462 |
| }, |
| { |
| "epoch": 4.961240310077519, |
| "grad_norm": 0.36948872010681133, |
| "learning_rate": 9.491085965139402e-06, |
| "loss": 0.1516, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12257242947816849, |
| "step": 3200, |
| "valid_targets_mean": 5256.6, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 4.9689922480620154, |
| "grad_norm": 0.41347264041909937, |
| "learning_rate": 9.425377014412848e-06, |
| "loss": 0.1556, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15283584594726562, |
| "step": 3205, |
| "valid_targets_mean": 4368.1, |
| "valid_targets_min": 891 |
| }, |
| { |
| "epoch": 4.976744186046512, |
| "grad_norm": 0.42750383797473995, |
| "learning_rate": 9.35982611949493e-06, |
| "loss": 0.1725, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18603989481925964, |
| "step": 3210, |
| "valid_targets_mean": 4814.5, |
| "valid_targets_min": 483 |
| }, |
| { |
| "epoch": 4.984496124031008, |
| "grad_norm": 0.43059647799726375, |
| "learning_rate": 9.294434260155765e-06, |
| "loss": 0.161, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22478413581848145, |
| "step": 3215, |
| "valid_targets_mean": 5452.1, |
| "valid_targets_min": 1531 |
| }, |
| { |
| "epoch": 4.992248062015504, |
| "grad_norm": 0.39768354831373554, |
| "learning_rate": 9.229202413788419e-06, |
| "loss": 0.1745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15155833959579468, |
| "step": 3220, |
| "valid_targets_mean": 4607.6, |
| "valid_targets_min": 2135 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 0.38185972751001357, |
| "learning_rate": 9.164131555394288e-06, |
| "loss": 0.1561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13077522814273834, |
| "step": 3225, |
| "valid_targets_mean": 4259.6, |
| "valid_targets_min": 380 |
| }, |
| { |
| "epoch": 5.007751937984496, |
| "grad_norm": 0.41906475146843863, |
| "learning_rate": 9.099222657568554e-06, |
| "loss": 0.1557, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15627771615982056, |
| "step": 3230, |
| "valid_targets_mean": 5040.4, |
| "valid_targets_min": 1940 |
| }, |
| { |
| "epoch": 5.015503875968992, |
| "grad_norm": 0.4052151818524859, |
| "learning_rate": 9.034476690485579e-06, |
| "loss": 0.1328, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13936452567577362, |
| "step": 3235, |
| "valid_targets_mean": 5023.8, |
| "valid_targets_min": 705 |
| }, |
| { |
| "epoch": 5.023255813953488, |
| "grad_norm": 0.37188613632576223, |
| "learning_rate": 8.969894621884467e-06, |
| "loss": 0.1426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12986522912979126, |
| "step": 3240, |
| "valid_targets_mean": 5463.1, |
| "valid_targets_min": 412 |
| }, |
| { |
| "epoch": 5.0310077519379846, |
| "grad_norm": 0.3919445371842698, |
| "learning_rate": 8.905477417054595e-06, |
| "loss": 0.1387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12915056943893433, |
| "step": 3245, |
| "valid_targets_mean": 5352.3, |
| "valid_targets_min": 2354 |
| }, |
| { |
| "epoch": 5.038759689922481, |
| "grad_norm": 0.40240515277621475, |
| "learning_rate": 8.841226038821147e-06, |
| "loss": 0.1414, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1427655816078186, |
| "step": 3250, |
| "valid_targets_mean": 4806.9, |
| "valid_targets_min": 927 |
| }, |
| { |
| "epoch": 5.046511627906977, |
| "grad_norm": 0.4482311614474207, |
| "learning_rate": 8.77714144753075e-06, |
| "loss": 0.1335, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1503133922815323, |
| "step": 3255, |
| "valid_targets_mean": 4343.8, |
| "valid_targets_min": 188 |
| }, |
| { |
| "epoch": 5.054263565891473, |
| "grad_norm": 0.41632602975114186, |
| "learning_rate": 8.713224601037116e-06, |
| "loss": 0.1424, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11666247993707657, |
| "step": 3260, |
| "valid_targets_mean": 3756.2, |
| "valid_targets_min": 412 |
| }, |
| { |
| "epoch": 5.062015503875969, |
| "grad_norm": 0.4421325070582108, |
| "learning_rate": 8.649476454686734e-06, |
| "loss": 0.1549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14591653645038605, |
| "step": 3265, |
| "valid_targets_mean": 4298.9, |
| "valid_targets_min": 2252 |
| }, |
| { |
| "epoch": 5.069767441860465, |
| "grad_norm": 0.3706889070551245, |
| "learning_rate": 8.58589796130457e-06, |
| "loss": 0.1448, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1363983452320099, |
| "step": 3270, |
| "valid_targets_mean": 5321.2, |
| "valid_targets_min": 435 |
| }, |
| { |
| "epoch": 5.077519379844961, |
| "grad_norm": 0.42292771021367553, |
| "learning_rate": 8.522490071179834e-06, |
| "loss": 0.1654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1678886115550995, |
| "step": 3275, |
| "valid_targets_mean": 4751.9, |
| "valid_targets_min": 610 |
| }, |
| { |
| "epoch": 5.0852713178294575, |
| "grad_norm": 0.5828499776845351, |
| "learning_rate": 8.459253732051793e-06, |
| "loss": 0.1661, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17978990077972412, |
| "step": 3280, |
| "valid_targets_mean": 4170.8, |
| "valid_targets_min": 267 |
| }, |
| { |
| "epoch": 5.093023255813954, |
| "grad_norm": 0.4615372722971231, |
| "learning_rate": 8.396189889095581e-06, |
| "loss": 0.1516, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18241898715496063, |
| "step": 3285, |
| "valid_targets_mean": 4325.0, |
| "valid_targets_min": 1860 |
| }, |
| { |
| "epoch": 5.10077519379845, |
| "grad_norm": 0.3817650649549942, |
| "learning_rate": 8.333299484908081e-06, |
| "loss": 0.1368, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1241084486246109, |
| "step": 3290, |
| "valid_targets_mean": 4798.9, |
| "valid_targets_min": 670 |
| }, |
| { |
| "epoch": 5.108527131782946, |
| "grad_norm": 0.4194147503687341, |
| "learning_rate": 8.27058345949384e-06, |
| "loss": 0.1484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14202088117599487, |
| "step": 3295, |
| "valid_targets_mean": 4392.2, |
| "valid_targets_min": 1724 |
| }, |
| { |
| "epoch": 5.116279069767442, |
| "grad_norm": 0.38881934176704125, |
| "learning_rate": 8.208042750251017e-06, |
| "loss": 0.1428, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12283352017402649, |
| "step": 3300, |
| "valid_targets_mean": 5001.8, |
| "valid_targets_min": 860 |
| }, |
| { |
| "epoch": 5.124031007751938, |
| "grad_norm": 0.41598556767284195, |
| "learning_rate": 8.14567829195737e-06, |
| "loss": 0.1498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12442460656166077, |
| "step": 3305, |
| "valid_targets_mean": 4178.7, |
| "valid_targets_min": 1866 |
| }, |
| { |
| "epoch": 5.131782945736434, |
| "grad_norm": 0.5128407487191675, |
| "learning_rate": 8.083491016756282e-06, |
| "loss": 0.1501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17859122157096863, |
| "step": 3310, |
| "valid_targets_mean": 3686.2, |
| "valid_targets_min": 761 |
| }, |
| { |
| "epoch": 5.1395348837209305, |
| "grad_norm": 0.3758183019008081, |
| "learning_rate": 8.021481854142843e-06, |
| "loss": 0.1487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14447617530822754, |
| "step": 3315, |
| "valid_targets_mean": 5073.4, |
| "valid_targets_min": 1295 |
| }, |
| { |
| "epoch": 5.147286821705427, |
| "grad_norm": 0.47801726631549907, |
| "learning_rate": 7.959651730949938e-06, |
| "loss": 0.14, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1533583104610443, |
| "step": 3320, |
| "valid_targets_mean": 3810.4, |
| "valid_targets_min": 688 |
| }, |
| { |
| "epoch": 5.155038759689923, |
| "grad_norm": 0.3860929841594393, |
| "learning_rate": 7.898001571334393e-06, |
| "loss": 0.148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14451035857200623, |
| "step": 3325, |
| "valid_targets_mean": 5514.4, |
| "valid_targets_min": 587 |
| }, |
| { |
| "epoch": 5.162790697674419, |
| "grad_norm": 0.3927336266773621, |
| "learning_rate": 7.836532296763195e-06, |
| "loss": 0.15, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14219003915786743, |
| "step": 3330, |
| "valid_targets_mean": 5720.4, |
| "valid_targets_min": 854 |
| }, |
| { |
| "epoch": 5.170542635658915, |
| "grad_norm": 0.4701871029698711, |
| "learning_rate": 7.775244825999674e-06, |
| "loss": 0.1506, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13866694271564484, |
| "step": 3335, |
| "valid_targets_mean": 4240.4, |
| "valid_targets_min": 327 |
| }, |
| { |
| "epoch": 5.178294573643411, |
| "grad_norm": 0.5611394213445632, |
| "learning_rate": 7.7141400750898e-06, |
| "loss": 0.1537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1594468057155609, |
| "step": 3340, |
| "valid_targets_mean": 3598.9, |
| "valid_targets_min": 332 |
| }, |
| { |
| "epoch": 5.186046511627907, |
| "grad_norm": 0.46697871764537624, |
| "learning_rate": 7.653218957348478e-06, |
| "loss": 0.1625, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17361919581890106, |
| "step": 3345, |
| "valid_targets_mean": 4588.7, |
| "valid_targets_min": 750 |
| }, |
| { |
| "epoch": 5.1937984496124034, |
| "grad_norm": 0.40704733172155627, |
| "learning_rate": 7.592482383345905e-06, |
| "loss": 0.1715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16594815254211426, |
| "step": 3350, |
| "valid_targets_mean": 5162.1, |
| "valid_targets_min": 2503 |
| }, |
| { |
| "epoch": 5.2015503875969, |
| "grad_norm": 0.43347382037931187, |
| "learning_rate": 7.531931260893956e-06, |
| "loss": 0.1481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12546521425247192, |
| "step": 3355, |
| "valid_targets_mean": 4259.8, |
| "valid_targets_min": 2493 |
| }, |
| { |
| "epoch": 5.209302325581396, |
| "grad_norm": 0.451832191981657, |
| "learning_rate": 7.47156649503261e-06, |
| "loss": 0.1444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14870810508728027, |
| "step": 3360, |
| "valid_targets_mean": 4736.9, |
| "valid_targets_min": 2527 |
| }, |
| { |
| "epoch": 5.217054263565892, |
| "grad_norm": 0.5092134368319543, |
| "learning_rate": 7.411388988016444e-06, |
| "loss": 0.1464, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18897545337677002, |
| "step": 3365, |
| "valid_targets_mean": 4291.3, |
| "valid_targets_min": 1979 |
| }, |
| { |
| "epoch": 5.224806201550388, |
| "grad_norm": 0.3992712621608886, |
| "learning_rate": 7.351399639301116e-06, |
| "loss": 0.1433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16864998638629913, |
| "step": 3370, |
| "valid_targets_mean": 5468.9, |
| "valid_targets_min": 2411 |
| }, |
| { |
| "epoch": 5.232558139534884, |
| "grad_norm": 0.43818725229100414, |
| "learning_rate": 7.291599345529936e-06, |
| "loss": 0.1517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14088185131549835, |
| "step": 3375, |
| "valid_targets_mean": 4397.0, |
| "valid_targets_min": 227 |
| }, |
| { |
| "epoch": 5.24031007751938, |
| "grad_norm": 0.42669853677221803, |
| "learning_rate": 7.231989000520485e-06, |
| "loss": 0.1637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16974776983261108, |
| "step": 3380, |
| "valid_targets_mean": 5304.2, |
| "valid_targets_min": 818 |
| }, |
| { |
| "epoch": 5.248062015503876, |
| "grad_norm": 0.42231966887434225, |
| "learning_rate": 7.172569495251214e-06, |
| "loss": 0.1525, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15044859051704407, |
| "step": 3385, |
| "valid_targets_mean": 4793.6, |
| "valid_targets_min": 893 |
| }, |
| { |
| "epoch": 5.2558139534883725, |
| "grad_norm": 0.3774758090043144, |
| "learning_rate": 7.113341717848154e-06, |
| "loss": 0.1478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14274142682552338, |
| "step": 3390, |
| "valid_targets_mean": 5430.0, |
| "valid_targets_min": 567 |
| }, |
| { |
| "epoch": 5.263565891472869, |
| "grad_norm": 0.4221322079184396, |
| "learning_rate": 7.05430655357163e-06, |
| "loss": 0.1356, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1326403170824051, |
| "step": 3395, |
| "valid_targets_mean": 4851.8, |
| "valid_targets_min": 1855 |
| }, |
| { |
| "epoch": 5.271317829457364, |
| "grad_norm": 0.41865340457663663, |
| "learning_rate": 6.995464884803056e-06, |
| "loss": 0.1605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15016970038414001, |
| "step": 3400, |
| "valid_targets_mean": 4839.2, |
| "valid_targets_min": 685 |
| }, |
| { |
| "epoch": 5.27906976744186, |
| "grad_norm": 0.37620910591252854, |
| "learning_rate": 6.936817591031704e-06, |
| "loss": 0.1553, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11961726099252701, |
| "step": 3405, |
| "valid_targets_mean": 5236.1, |
| "valid_targets_min": 263 |
| }, |
| { |
| "epoch": 5.286821705426356, |
| "grad_norm": 0.41396399132639294, |
| "learning_rate": 6.878365548841583e-06, |
| "loss": 0.1667, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15676863491535187, |
| "step": 3410, |
| "valid_targets_mean": 5105.6, |
| "valid_targets_min": 434 |
| }, |
| { |
| "epoch": 5.294573643410852, |
| "grad_norm": 0.37430857448740984, |
| "learning_rate": 6.820109631898337e-06, |
| "loss": 0.1537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13516280055046082, |
| "step": 3415, |
| "valid_targets_mean": 5407.8, |
| "valid_targets_min": 361 |
| }, |
| { |
| "epoch": 5.3023255813953485, |
| "grad_norm": 0.39609033417068207, |
| "learning_rate": 6.7620507109361876e-06, |
| "loss": 0.1416, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11794918775558472, |
| "step": 3420, |
| "valid_targets_mean": 4567.0, |
| "valid_targets_min": 770 |
| }, |
| { |
| "epoch": 5.310077519379845, |
| "grad_norm": 0.6118599264333754, |
| "learning_rate": 6.704189653744897e-06, |
| "loss": 0.1615, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1839725375175476, |
| "step": 3425, |
| "valid_targets_mean": 4516.2, |
| "valid_targets_min": 484 |
| }, |
| { |
| "epoch": 5.317829457364341, |
| "grad_norm": 0.4381562079932628, |
| "learning_rate": 6.646527325156842e-06, |
| "loss": 0.1412, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16818967461585999, |
| "step": 3430, |
| "valid_targets_mean": 4886.8, |
| "valid_targets_min": 420 |
| }, |
| { |
| "epoch": 5.325581395348837, |
| "grad_norm": 0.4226204361999147, |
| "learning_rate": 6.5890645870340445e-06, |
| "loss": 0.1548, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1639600247144699, |
| "step": 3435, |
| "valid_targets_mean": 5103.1, |
| "valid_targets_min": 696 |
| }, |
| { |
| "epoch": 5.333333333333333, |
| "grad_norm": 0.3710849263141366, |
| "learning_rate": 6.531802298255303e-06, |
| "loss": 0.1499, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12949195504188538, |
| "step": 3440, |
| "valid_targets_mean": 4989.1, |
| "valid_targets_min": 2837 |
| }, |
| { |
| "epoch": 5.341085271317829, |
| "grad_norm": 0.4435129156035455, |
| "learning_rate": 6.474741314703359e-06, |
| "loss": 0.1478, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15639318525791168, |
| "step": 3445, |
| "valid_targets_mean": 4721.8, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 5.348837209302325, |
| "grad_norm": 0.3625818524554749, |
| "learning_rate": 6.417882489252123e-06, |
| "loss": 0.1402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12721361219882965, |
| "step": 3450, |
| "valid_targets_mean": 5639.6, |
| "valid_targets_min": 3016 |
| }, |
| { |
| "epoch": 5.3565891472868215, |
| "grad_norm": 0.4323434478569545, |
| "learning_rate": 6.361226671753881e-06, |
| "loss": 0.1493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1502252072095871, |
| "step": 3455, |
| "valid_targets_mean": 5072.4, |
| "valid_targets_min": 346 |
| }, |
| { |
| "epoch": 5.364341085271318, |
| "grad_norm": 0.37196863493668914, |
| "learning_rate": 6.304774709026633e-06, |
| "loss": 0.1474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12962721288204193, |
| "step": 3460, |
| "valid_targets_mean": 5211.2, |
| "valid_targets_min": 2412 |
| }, |
| { |
| "epoch": 5.372093023255814, |
| "grad_norm": 0.4392929005011265, |
| "learning_rate": 6.248527444841417e-06, |
| "loss": 0.1469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15446701645851135, |
| "step": 3465, |
| "valid_targets_mean": 4372.7, |
| "valid_targets_min": 2320 |
| }, |
| { |
| "epoch": 5.37984496124031, |
| "grad_norm": 0.45498046007325976, |
| "learning_rate": 6.1924857199097e-06, |
| "loss": 0.1653, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1651144027709961, |
| "step": 3470, |
| "valid_targets_mean": 4883.4, |
| "valid_targets_min": 936 |
| }, |
| { |
| "epoch": 5.387596899224806, |
| "grad_norm": 0.42317989191246896, |
| "learning_rate": 6.136650371870816e-06, |
| "loss": 0.1391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12391775101423264, |
| "step": 3475, |
| "valid_targets_mean": 6439.6, |
| "valid_targets_min": 2368 |
| }, |
| { |
| "epoch": 5.395348837209302, |
| "grad_norm": 0.4440482712927205, |
| "learning_rate": 6.081022235279439e-06, |
| "loss": 0.1509, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13077440857887268, |
| "step": 3480, |
| "valid_targets_mean": 4186.4, |
| "valid_targets_min": 2293 |
| }, |
| { |
| "epoch": 5.403100775193798, |
| "grad_norm": 0.45472821818832726, |
| "learning_rate": 6.025602141593128e-06, |
| "loss": 0.1387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13112467527389526, |
| "step": 3485, |
| "valid_targets_mean": 4406.1, |
| "valid_targets_min": 454 |
| }, |
| { |
| "epoch": 5.410852713178294, |
| "grad_norm": 0.3962937912503978, |
| "learning_rate": 5.970390919159872e-06, |
| "loss": 0.1493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16544798016548157, |
| "step": 3490, |
| "valid_targets_mean": 5308.0, |
| "valid_targets_min": 797 |
| }, |
| { |
| "epoch": 5.4186046511627906, |
| "grad_norm": 0.3643941673945403, |
| "learning_rate": 5.915389393205717e-06, |
| "loss": 0.1608, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11564834415912628, |
| "step": 3495, |
| "valid_targets_mean": 4933.6, |
| "valid_targets_min": 573 |
| }, |
| { |
| "epoch": 5.426356589147287, |
| "grad_norm": 0.42998784565296494, |
| "learning_rate": 5.86059838582246e-06, |
| "loss": 0.1413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15233772993087769, |
| "step": 3500, |
| "valid_targets_mean": 4981.4, |
| "valid_targets_min": 269 |
| }, |
| { |
| "epoch": 5.434108527131783, |
| "grad_norm": 0.41822740876158127, |
| "learning_rate": 5.806018715955317e-06, |
| "loss": 0.1449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1299438178539276, |
| "step": 3505, |
| "valid_targets_mean": 4537.4, |
| "valid_targets_min": 1080 |
| }, |
| { |
| "epoch": 5.441860465116279, |
| "grad_norm": 0.4528399940397294, |
| "learning_rate": 5.751651199390704e-06, |
| "loss": 0.1558, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16579484939575195, |
| "step": 3510, |
| "valid_targets_mean": 4755.4, |
| "valid_targets_min": 2776 |
| }, |
| { |
| "epoch": 5.449612403100775, |
| "grad_norm": 0.4684592080080512, |
| "learning_rate": 5.697496648744063e-06, |
| "loss": 0.1353, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.143550843000412, |
| "step": 3515, |
| "valid_targets_mean": 3519.6, |
| "valid_targets_min": 530 |
| }, |
| { |
| "epoch": 5.457364341085271, |
| "grad_norm": 0.45674225562117354, |
| "learning_rate": 5.643555873447677e-06, |
| "loss": 0.1408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14884954690933228, |
| "step": 3520, |
| "valid_targets_mean": 4183.1, |
| "valid_targets_min": 764 |
| }, |
| { |
| "epoch": 5.465116279069767, |
| "grad_norm": 0.4035257697649145, |
| "learning_rate": 5.589829679738597e-06, |
| "loss": 0.1605, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1421164870262146, |
| "step": 3525, |
| "valid_targets_mean": 5205.2, |
| "valid_targets_min": 2073 |
| }, |
| { |
| "epoch": 5.4728682170542635, |
| "grad_norm": 0.5117576530097852, |
| "learning_rate": 5.536318870646587e-06, |
| "loss": 0.145, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16778147220611572, |
| "step": 3530, |
| "valid_targets_mean": 5321.6, |
| "valid_targets_min": 639 |
| }, |
| { |
| "epoch": 5.48062015503876, |
| "grad_norm": 0.4104772923087062, |
| "learning_rate": 5.483024245982116e-06, |
| "loss": 0.1562, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13928261399269104, |
| "step": 3535, |
| "valid_targets_mean": 4891.7, |
| "valid_targets_min": 410 |
| }, |
| { |
| "epoch": 5.488372093023256, |
| "grad_norm": 0.4268402728473486, |
| "learning_rate": 5.429946602324414e-06, |
| "loss": 0.1467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1458597481250763, |
| "step": 3540, |
| "valid_targets_mean": 4448.0, |
| "valid_targets_min": 277 |
| }, |
| { |
| "epoch": 5.496124031007752, |
| "grad_norm": 0.4715412702854216, |
| "learning_rate": 5.377086733009551e-06, |
| "loss": 0.1421, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14967858791351318, |
| "step": 3545, |
| "valid_targets_mean": 4361.0, |
| "valid_targets_min": 704 |
| }, |
| { |
| "epoch": 5.503875968992248, |
| "grad_norm": 0.5279261179055396, |
| "learning_rate": 5.3244454281185984e-06, |
| "loss": 0.1689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20234504342079163, |
| "step": 3550, |
| "valid_targets_mean": 3873.4, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 5.511627906976744, |
| "grad_norm": 0.507981142775861, |
| "learning_rate": 5.272023474465799e-06, |
| "loss": 0.1552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1777733415365219, |
| "step": 3555, |
| "valid_targets_mean": 3797.2, |
| "valid_targets_min": 472 |
| }, |
| { |
| "epoch": 5.51937984496124, |
| "grad_norm": 0.3833421328022469, |
| "learning_rate": 5.219821655586821e-06, |
| "loss": 0.1471, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16572965681552887, |
| "step": 3560, |
| "valid_targets_mean": 5526.5, |
| "valid_targets_min": 551 |
| }, |
| { |
| "epoch": 5.5271317829457365, |
| "grad_norm": 0.43394338581146247, |
| "learning_rate": 5.167840751727034e-06, |
| "loss": 0.1497, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15046624839305878, |
| "step": 3565, |
| "valid_targets_mean": 4108.6, |
| "valid_targets_min": 536 |
| }, |
| { |
| "epoch": 5.534883720930233, |
| "grad_norm": 0.40622205843630427, |
| "learning_rate": 5.116081539829874e-06, |
| "loss": 0.1362, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16226355731487274, |
| "step": 3570, |
| "valid_targets_mean": 6044.9, |
| "valid_targets_min": 1779 |
| }, |
| { |
| "epoch": 5.542635658914729, |
| "grad_norm": 0.4029911479453827, |
| "learning_rate": 5.064544793525192e-06, |
| "loss": 0.1668, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14648669958114624, |
| "step": 3575, |
| "valid_targets_mean": 5268.5, |
| "valid_targets_min": 249 |
| }, |
| { |
| "epoch": 5.550387596899225, |
| "grad_norm": 0.5364248446568755, |
| "learning_rate": 5.013231283117723e-06, |
| "loss": 0.1486, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14924436807632446, |
| "step": 3580, |
| "valid_targets_mean": 4603.7, |
| "valid_targets_min": 2372 |
| }, |
| { |
| "epoch": 5.558139534883721, |
| "grad_norm": 0.40849395379526177, |
| "learning_rate": 4.962141775575553e-06, |
| "loss": 0.1457, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1340319961309433, |
| "step": 3585, |
| "valid_targets_mean": 4452.3, |
| "valid_targets_min": 2157 |
| }, |
| { |
| "epoch": 5.565891472868217, |
| "grad_norm": 0.3507387441886511, |
| "learning_rate": 4.9112770345186664e-06, |
| "loss": 0.1308, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10928727686405182, |
| "step": 3590, |
| "valid_targets_mean": 5409.7, |
| "valid_targets_min": 2109 |
| }, |
| { |
| "epoch": 5.573643410852713, |
| "grad_norm": 0.4457364584152074, |
| "learning_rate": 4.8606378202075215e-06, |
| "loss": 0.1421, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13773344457149506, |
| "step": 3595, |
| "valid_targets_mean": 4546.3, |
| "valid_targets_min": 327 |
| }, |
| { |
| "epoch": 5.5813953488372094, |
| "grad_norm": 0.4973298360537683, |
| "learning_rate": 4.81022488953171e-06, |
| "loss": 0.1382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1543937474489212, |
| "step": 3600, |
| "valid_targets_mean": 4128.4, |
| "valid_targets_min": 349 |
| }, |
| { |
| "epoch": 5.589147286821706, |
| "grad_norm": 0.36859713218728013, |
| "learning_rate": 4.760038995998612e-06, |
| "loss": 0.1597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14406907558441162, |
| "step": 3605, |
| "valid_targets_mean": 5601.7, |
| "valid_targets_min": 2213 |
| }, |
| { |
| "epoch": 5.596899224806202, |
| "grad_norm": 0.3775608828670771, |
| "learning_rate": 4.710080889722157e-06, |
| "loss": 0.1379, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11484645307064056, |
| "step": 3610, |
| "valid_targets_mean": 4418.9, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 5.604651162790698, |
| "grad_norm": 0.5585581576269192, |
| "learning_rate": 4.660351317411598e-06, |
| "loss": 0.1546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16293855011463165, |
| "step": 3615, |
| "valid_targets_mean": 3673.5, |
| "valid_targets_min": 853 |
| }, |
| { |
| "epoch": 5.612403100775194, |
| "grad_norm": 0.40317305487140387, |
| "learning_rate": 4.610851022360372e-06, |
| "loss": 0.1472, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16022725403308868, |
| "step": 3620, |
| "valid_targets_mean": 5046.8, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 5.62015503875969, |
| "grad_norm": 0.46629312553258945, |
| "learning_rate": 4.561580744434962e-06, |
| "loss": 0.1363, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16484293341636658, |
| "step": 3625, |
| "valid_targets_mean": 4345.7, |
| "valid_targets_min": 719 |
| }, |
| { |
| "epoch": 5.627906976744186, |
| "grad_norm": 0.4517994866451772, |
| "learning_rate": 4.512541220063849e-06, |
| "loss": 0.1583, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1768956333398819, |
| "step": 3630, |
| "valid_targets_mean": 5144.0, |
| "valid_targets_min": 1570 |
| }, |
| { |
| "epoch": 5.635658914728682, |
| "grad_norm": 0.4266612314681182, |
| "learning_rate": 4.463733182226526e-06, |
| "loss": 0.1441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12670007348060608, |
| "step": 3635, |
| "valid_targets_mean": 4100.2, |
| "valid_targets_min": 2116 |
| }, |
| { |
| "epoch": 5.6434108527131785, |
| "grad_norm": 0.4680346659273191, |
| "learning_rate": 4.415157360442517e-06, |
| "loss": 0.16, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17845088243484497, |
| "step": 3640, |
| "valid_targets_mean": 4356.6, |
| "valid_targets_min": 322 |
| }, |
| { |
| "epoch": 5.651162790697675, |
| "grad_norm": 0.3890028520850903, |
| "learning_rate": 4.366814480760461e-06, |
| "loss": 0.1435, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12099163234233856, |
| "step": 3645, |
| "valid_targets_mean": 5003.2, |
| "valid_targets_min": 2596 |
| }, |
| { |
| "epoch": 5.658914728682171, |
| "grad_norm": 0.5488303595169921, |
| "learning_rate": 4.318705265747298e-06, |
| "loss": 0.1572, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1828697919845581, |
| "step": 3650, |
| "valid_targets_mean": 3999.2, |
| "valid_targets_min": 528 |
| }, |
| { |
| "epoch": 5.666666666666667, |
| "grad_norm": 0.42060572333330015, |
| "learning_rate": 4.2708304344774554e-06, |
| "loss": 0.1384, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13645608723163605, |
| "step": 3655, |
| "valid_targets_mean": 4687.2, |
| "valid_targets_min": 2741 |
| }, |
| { |
| "epoch": 5.674418604651163, |
| "grad_norm": 0.4387274771557827, |
| "learning_rate": 4.223190702522084e-06, |
| "loss": 0.1453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14829561114311218, |
| "step": 3660, |
| "valid_targets_mean": 4422.6, |
| "valid_targets_min": 757 |
| }, |
| { |
| "epoch": 5.682170542635659, |
| "grad_norm": 0.38684240070794124, |
| "learning_rate": 4.1757867819383695e-06, |
| "loss": 0.1485, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15705367922782898, |
| "step": 3665, |
| "valid_targets_mean": 5591.4, |
| "valid_targets_min": 2183 |
| }, |
| { |
| "epoch": 5.689922480620155, |
| "grad_norm": 0.3924859326932451, |
| "learning_rate": 4.128619381258914e-06, |
| "loss": 0.1559, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1718716323375702, |
| "step": 3670, |
| "valid_targets_mean": 5566.4, |
| "valid_targets_min": 344 |
| }, |
| { |
| "epoch": 5.6976744186046515, |
| "grad_norm": 0.4255325828911711, |
| "learning_rate": 4.081689205481103e-06, |
| "loss": 0.1409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15730968117713928, |
| "step": 3675, |
| "valid_targets_mean": 4940.1, |
| "valid_targets_min": 2527 |
| }, |
| { |
| "epoch": 5.705426356589148, |
| "grad_norm": 0.4523673615926739, |
| "learning_rate": 4.034996956056596e-06, |
| "loss": 0.1613, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17630687355995178, |
| "step": 3680, |
| "valid_targets_mean": 4730.1, |
| "valid_targets_min": 836 |
| }, |
| { |
| "epoch": 5.713178294573644, |
| "grad_norm": 0.3996998930591703, |
| "learning_rate": 3.988543330880852e-06, |
| "loss": 0.1287, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12216873466968536, |
| "step": 3685, |
| "valid_targets_mean": 4865.8, |
| "valid_targets_min": 2765 |
| }, |
| { |
| "epoch": 5.720930232558139, |
| "grad_norm": 0.47040209067719235, |
| "learning_rate": 3.942329024282665e-06, |
| "loss": 0.1516, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16137559711933136, |
| "step": 3690, |
| "valid_targets_mean": 4531.0, |
| "valid_targets_min": 730 |
| }, |
| { |
| "epoch": 5.728682170542635, |
| "grad_norm": 0.3630897503273467, |
| "learning_rate": 3.896354727013811e-06, |
| "loss": 0.1532, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12590524554252625, |
| "step": 3695, |
| "valid_targets_mean": 5248.6, |
| "valid_targets_min": 2452 |
| }, |
| { |
| "epoch": 5.736434108527131, |
| "grad_norm": 0.4715032977447836, |
| "learning_rate": 3.850621126238716e-06, |
| "loss": 0.1437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15132960677146912, |
| "step": 3700, |
| "valid_targets_mean": 3941.0, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 5.7441860465116275, |
| "grad_norm": 0.4654118997053404, |
| "learning_rate": 3.8051289055241825e-06, |
| "loss": 0.162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1751362681388855, |
| "step": 3705, |
| "valid_targets_mean": 4353.2, |
| "valid_targets_min": 2659 |
| }, |
| { |
| "epoch": 5.751937984496124, |
| "grad_norm": 0.5227568375922278, |
| "learning_rate": 3.759878744829182e-06, |
| "loss": 0.16, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18965643644332886, |
| "step": 3710, |
| "valid_targets_mean": 4459.4, |
| "valid_targets_min": 733 |
| }, |
| { |
| "epoch": 5.75968992248062, |
| "grad_norm": 0.4609905003497403, |
| "learning_rate": 3.7148713204946752e-06, |
| "loss": 0.147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1515987515449524, |
| "step": 3715, |
| "valid_targets_mean": 4371.8, |
| "valid_targets_min": 621 |
| }, |
| { |
| "epoch": 5.767441860465116, |
| "grad_norm": 0.3918991200592125, |
| "learning_rate": 3.67010730523353e-06, |
| "loss": 0.1618, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12248925864696503, |
| "step": 3720, |
| "valid_targets_mean": 4360.6, |
| "valid_targets_min": 370 |
| }, |
| { |
| "epoch": 5.775193798449612, |
| "grad_norm": 0.467773056692704, |
| "learning_rate": 3.6255873681204332e-06, |
| "loss": 0.1566, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17771819233894348, |
| "step": 3725, |
| "valid_targets_mean": 4304.9, |
| "valid_targets_min": 288 |
| }, |
| { |
| "epoch": 5.782945736434108, |
| "grad_norm": 0.377912933539592, |
| "learning_rate": 3.5813121745819144e-06, |
| "loss": 0.1529, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14115823805332184, |
| "step": 3730, |
| "valid_targets_mean": 4955.0, |
| "valid_targets_min": 285 |
| }, |
| { |
| "epoch": 5.790697674418604, |
| "grad_norm": 0.3996511259289835, |
| "learning_rate": 3.537282386386387e-06, |
| "loss": 0.1561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13390158116817474, |
| "step": 3735, |
| "valid_targets_mean": 4518.8, |
| "valid_targets_min": 339 |
| }, |
| { |
| "epoch": 5.7984496124031, |
| "grad_norm": 0.3701488362865712, |
| "learning_rate": 3.4934986616342737e-06, |
| "loss": 0.1768, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14555737376213074, |
| "step": 3740, |
| "valid_targets_mean": 5657.8, |
| "valid_targets_min": 2347 |
| }, |
| { |
| "epoch": 5.8062015503875966, |
| "grad_norm": 0.45199830351728787, |
| "learning_rate": 3.449961654748146e-06, |
| "loss": 0.1487, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.150042325258255, |
| "step": 3745, |
| "valid_targets_mean": 4127.3, |
| "valid_targets_min": 2290 |
| }, |
| { |
| "epoch": 5.813953488372093, |
| "grad_norm": 0.4369336909116495, |
| "learning_rate": 3.406672016462964e-06, |
| "loss": 0.1463, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13401828706264496, |
| "step": 3750, |
| "valid_targets_mean": 4274.8, |
| "valid_targets_min": 1856 |
| }, |
| { |
| "epoch": 5.821705426356589, |
| "grad_norm": 0.4834110812261461, |
| "learning_rate": 3.363630393816335e-06, |
| "loss": 0.1402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15827834606170654, |
| "step": 3755, |
| "valid_targets_mean": 3873.9, |
| "valid_targets_min": 2432 |
| }, |
| { |
| "epoch": 5.829457364341085, |
| "grad_norm": 0.4597445261763014, |
| "learning_rate": 3.3208374301388504e-06, |
| "loss": 0.1627, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17994539439678192, |
| "step": 3760, |
| "valid_targets_mean": 4758.0, |
| "valid_targets_min": 1984 |
| }, |
| { |
| "epoch": 5.837209302325581, |
| "grad_norm": 0.42360510165536924, |
| "learning_rate": 3.278293765044469e-06, |
| "loss": 0.1546, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13492318987846375, |
| "step": 3765, |
| "valid_targets_mean": 4426.1, |
| "valid_targets_min": 233 |
| }, |
| { |
| "epoch": 5.844961240310077, |
| "grad_norm": 0.48922365457669503, |
| "learning_rate": 3.236000034420963e-06, |
| "loss": 0.1498, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14569556713104248, |
| "step": 3770, |
| "valid_targets_mean": 3687.8, |
| "valid_targets_min": 242 |
| }, |
| { |
| "epoch": 5.852713178294573, |
| "grad_norm": 0.4033773146053126, |
| "learning_rate": 3.193956870420396e-06, |
| "loss": 0.1738, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18744111061096191, |
| "step": 3775, |
| "valid_targets_mean": 5528.1, |
| "valid_targets_min": 611 |
| }, |
| { |
| "epoch": 5.8604651162790695, |
| "grad_norm": 0.34857475686830064, |
| "learning_rate": 3.1521649014496925e-06, |
| "loss": 0.155, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13359975814819336, |
| "step": 3780, |
| "valid_targets_mean": 5863.0, |
| "valid_targets_min": 2553 |
| }, |
| { |
| "epoch": 5.868217054263566, |
| "grad_norm": 0.4313376511492457, |
| "learning_rate": 3.110624752161229e-06, |
| "loss": 0.1689, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13781484961509705, |
| "step": 3785, |
| "valid_targets_mean": 5246.6, |
| "valid_targets_min": 578 |
| }, |
| { |
| "epoch": 5.875968992248062, |
| "grad_norm": 0.35972262523748805, |
| "learning_rate": 3.069337043443523e-06, |
| "loss": 0.1552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1296289563179016, |
| "step": 3790, |
| "valid_targets_mean": 5488.9, |
| "valid_targets_min": 1966 |
| }, |
| { |
| "epoch": 5.883720930232558, |
| "grad_norm": 0.46395239595319404, |
| "learning_rate": 3.0283023924119236e-06, |
| "loss": 0.1425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1438305675983429, |
| "step": 3795, |
| "valid_targets_mean": 5045.4, |
| "valid_targets_min": 548 |
| }, |
| { |
| "epoch": 5.891472868217054, |
| "grad_norm": 0.4216115298877531, |
| "learning_rate": 2.9875214123993967e-06, |
| "loss": 0.1489, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13032379746437073, |
| "step": 3800, |
| "valid_targets_mean": 5036.0, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 5.89922480620155, |
| "grad_norm": 0.369645204601132, |
| "learning_rate": 2.94699471294738e-06, |
| "loss": 0.1474, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10359348356723785, |
| "step": 3805, |
| "valid_targets_mean": 4782.0, |
| "valid_targets_min": 395 |
| }, |
| { |
| "epoch": 5.906976744186046, |
| "grad_norm": 0.4329223252021753, |
| "learning_rate": 2.9067228997966347e-06, |
| "loss": 0.1488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14920011162757874, |
| "step": 3810, |
| "valid_targets_mean": 4213.8, |
| "valid_targets_min": 265 |
| }, |
| { |
| "epoch": 5.9147286821705425, |
| "grad_norm": 0.38061473387366296, |
| "learning_rate": 2.8667065748782177e-06, |
| "loss": 0.1552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11807483434677124, |
| "step": 3815, |
| "valid_targets_mean": 4682.1, |
| "valid_targets_min": 2866 |
| }, |
| { |
| "epoch": 5.922480620155039, |
| "grad_norm": 0.4630422264492311, |
| "learning_rate": 2.826946336304481e-06, |
| "loss": 0.1606, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1536155343055725, |
| "step": 3820, |
| "valid_targets_mean": 4259.2, |
| "valid_targets_min": 826 |
| }, |
| { |
| "epoch": 5.930232558139535, |
| "grad_norm": 0.4336604749432643, |
| "learning_rate": 2.7874427783601234e-06, |
| "loss": 0.1443, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13880223035812378, |
| "step": 3825, |
| "valid_targets_mean": 4519.3, |
| "valid_targets_min": 609 |
| }, |
| { |
| "epoch": 5.937984496124031, |
| "grad_norm": 0.5243528481538801, |
| "learning_rate": 2.7481964914933157e-06, |
| "loss": 0.1604, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17028310894966125, |
| "step": 3830, |
| "valid_targets_mean": 3623.1, |
| "valid_targets_min": 591 |
| }, |
| { |
| "epoch": 5.945736434108527, |
| "grad_norm": 0.4789980300582059, |
| "learning_rate": 2.7092080623068674e-06, |
| "loss": 0.1745, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1756812334060669, |
| "step": 3835, |
| "valid_targets_mean": 4744.0, |
| "valid_targets_min": 772 |
| }, |
| { |
| "epoch": 5.953488372093023, |
| "grad_norm": 0.45611253393283935, |
| "learning_rate": 2.6704780735494784e-06, |
| "loss": 0.1441, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1426219344139099, |
| "step": 3840, |
| "valid_targets_mean": 4248.6, |
| "valid_targets_min": 525 |
| }, |
| { |
| "epoch": 5.961240310077519, |
| "grad_norm": 0.3857782088985867, |
| "learning_rate": 2.6320071041070018e-06, |
| "loss": 0.1479, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11612827330827713, |
| "step": 3845, |
| "valid_targets_mean": 4773.6, |
| "valid_targets_min": 2511 |
| }, |
| { |
| "epoch": 5.9689922480620154, |
| "grad_norm": 0.4166115486481006, |
| "learning_rate": 2.593795728993804e-06, |
| "loss": 0.1544, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18450096249580383, |
| "step": 3850, |
| "valid_targets_mean": 5148.2, |
| "valid_targets_min": 2061 |
| }, |
| { |
| "epoch": 5.976744186046512, |
| "grad_norm": 0.4335144952819728, |
| "learning_rate": 2.555844519344186e-06, |
| "loss": 0.1444, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1622152328491211, |
| "step": 3855, |
| "valid_targets_mean": 5090.6, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 5.984496124031008, |
| "grad_norm": 0.3565273610492274, |
| "learning_rate": 2.518154042403813e-06, |
| "loss": 0.1408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12373974919319153, |
| "step": 3860, |
| "valid_targets_mean": 5277.1, |
| "valid_targets_min": 2691 |
| }, |
| { |
| "epoch": 5.992248062015504, |
| "grad_norm": 0.36972590062662825, |
| "learning_rate": 2.480724861521264e-06, |
| "loss": 0.1588, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10760015994310379, |
| "step": 3865, |
| "valid_targets_mean": 4705.8, |
| "valid_targets_min": 2256 |
| }, |
| { |
| "epoch": 6.0, |
| "grad_norm": 0.3774316986540542, |
| "learning_rate": 2.443557536139598e-06, |
| "loss": 0.1449, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13823938369750977, |
| "step": 3870, |
| "valid_targets_mean": 5121.6, |
| "valid_targets_min": 2951 |
| }, |
| { |
| "epoch": 6.007751937984496, |
| "grad_norm": 0.4491491812525188, |
| "learning_rate": 2.406652621787999e-06, |
| "loss": 0.1461, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1544957160949707, |
| "step": 3875, |
| "valid_targets_mean": 3907.7, |
| "valid_targets_min": 472 |
| }, |
| { |
| "epoch": 6.015503875968992, |
| "grad_norm": 0.39058530830234023, |
| "learning_rate": 2.3700106700734705e-06, |
| "loss": 0.1501, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11147475242614746, |
| "step": 3880, |
| "valid_targets_mean": 4658.1, |
| "valid_targets_min": 412 |
| }, |
| { |
| "epoch": 6.023255813953488, |
| "grad_norm": 0.4764404360508427, |
| "learning_rate": 2.3336322286725823e-06, |
| "loss": 0.1365, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1638670563697815, |
| "step": 3885, |
| "valid_targets_mean": 3920.1, |
| "valid_targets_min": 792 |
| }, |
| { |
| "epoch": 6.0310077519379846, |
| "grad_norm": 0.41031515357008064, |
| "learning_rate": 2.2975178413233047e-06, |
| "loss": 0.1426, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11806363612413406, |
| "step": 3890, |
| "valid_targets_mean": 4190.1, |
| "valid_targets_min": 2164 |
| }, |
| { |
| "epoch": 6.038759689922481, |
| "grad_norm": 0.4080067588790369, |
| "learning_rate": 2.261668047816863e-06, |
| "loss": 0.1442, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16606493294239044, |
| "step": 3895, |
| "valid_targets_mean": 5487.4, |
| "valid_targets_min": 272 |
| }, |
| { |
| "epoch": 6.046511627906977, |
| "grad_norm": 0.4182771476362144, |
| "learning_rate": 2.226083383989668e-06, |
| "loss": 0.1454, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12919700145721436, |
| "step": 3900, |
| "valid_targets_mean": 4410.3, |
| "valid_targets_min": 453 |
| }, |
| { |
| "epoch": 6.054263565891473, |
| "grad_norm": 0.465578156889018, |
| "learning_rate": 2.1907643817153313e-06, |
| "loss": 0.1429, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1524408608675003, |
| "step": 3905, |
| "valid_targets_mean": 4006.7, |
| "valid_targets_min": 402 |
| }, |
| { |
| "epoch": 6.062015503875969, |
| "grad_norm": 0.49003831755013766, |
| "learning_rate": 2.1557115688966835e-06, |
| "loss": 0.1466, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15983235836029053, |
| "step": 3910, |
| "valid_targets_mean": 3748.0, |
| "valid_targets_min": 1984 |
| }, |
| { |
| "epoch": 6.069767441860465, |
| "grad_norm": 0.4793985294195704, |
| "learning_rate": 2.120925469457904e-06, |
| "loss": 0.1492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1331721544265747, |
| "step": 3915, |
| "valid_targets_mean": 3765.6, |
| "valid_targets_min": 1989 |
| }, |
| { |
| "epoch": 6.077519379844961, |
| "grad_norm": 0.4857730761757885, |
| "learning_rate": 2.086406603336686e-06, |
| "loss": 0.162, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.223957359790802, |
| "step": 3920, |
| "valid_targets_mean": 4345.2, |
| "valid_targets_min": 487 |
| }, |
| { |
| "epoch": 6.0852713178294575, |
| "grad_norm": 0.38478031129260776, |
| "learning_rate": 2.052155486476466e-06, |
| "loss": 0.1401, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.141106978058815, |
| "step": 3925, |
| "valid_targets_mean": 5665.4, |
| "valid_targets_min": 1766 |
| }, |
| { |
| "epoch": 6.093023255813954, |
| "grad_norm": 0.572101341083877, |
| "learning_rate": 2.0181726308187044e-06, |
| "loss": 0.1537, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16148856282234192, |
| "step": 3930, |
| "valid_targets_mean": 3327.9, |
| "valid_targets_min": 393 |
| }, |
| { |
| "epoch": 6.10077519379845, |
| "grad_norm": 0.5702565613060158, |
| "learning_rate": 1.984458544295247e-06, |
| "loss": 0.1491, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15981945395469666, |
| "step": 3935, |
| "valid_targets_mean": 3374.9, |
| "valid_targets_min": 665 |
| }, |
| { |
| "epoch": 6.108527131782946, |
| "grad_norm": 0.41153314259954854, |
| "learning_rate": 1.9510137308207187e-06, |
| "loss": 0.144, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14380812644958496, |
| "step": 3940, |
| "valid_targets_mean": 4357.6, |
| "valid_targets_min": 343 |
| }, |
| { |
| "epoch": 6.116279069767442, |
| "grad_norm": 0.42473098729111763, |
| "learning_rate": 1.9178386902850033e-06, |
| "loss": 0.1416, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12821288406848907, |
| "step": 3945, |
| "valid_targets_mean": 3923.3, |
| "valid_targets_min": 266 |
| }, |
| { |
| "epoch": 6.124031007751938, |
| "grad_norm": 0.4233818856902045, |
| "learning_rate": 1.884933918545766e-06, |
| "loss": 0.1382, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14326541125774384, |
| "step": 3950, |
| "valid_targets_mean": 4490.9, |
| "valid_targets_min": 513 |
| }, |
| { |
| "epoch": 6.131782945736434, |
| "grad_norm": 0.4075534532593769, |
| "learning_rate": 1.8522999074210357e-06, |
| "loss": 0.1425, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13676217198371887, |
| "step": 3955, |
| "valid_targets_mean": 5278.7, |
| "valid_targets_min": 773 |
| }, |
| { |
| "epoch": 6.1395348837209305, |
| "grad_norm": 0.4831447381224601, |
| "learning_rate": 1.819937144681876e-06, |
| "loss": 0.1481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14638128876686096, |
| "step": 3960, |
| "valid_targets_mean": 4841.4, |
| "valid_targets_min": 1843 |
| }, |
| { |
| "epoch": 6.147286821705427, |
| "grad_norm": 0.5692373377592979, |
| "learning_rate": 1.7878461140450709e-06, |
| "loss": 0.146, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17473667860031128, |
| "step": 3965, |
| "valid_targets_mean": 3916.5, |
| "valid_targets_min": 1954 |
| }, |
| { |
| "epoch": 6.155038759689923, |
| "grad_norm": 0.4411787512540076, |
| "learning_rate": 1.7560272951659007e-06, |
| "loss": 0.1499, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16196417808532715, |
| "step": 3970, |
| "valid_targets_mean": 4841.2, |
| "valid_targets_min": 681 |
| }, |
| { |
| "epoch": 6.162790697674419, |
| "grad_norm": 0.4144797822314153, |
| "learning_rate": 1.7244811636309865e-06, |
| "loss": 0.1459, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12838700413703918, |
| "step": 3975, |
| "valid_targets_mean": 5786.5, |
| "valid_targets_min": 536 |
| }, |
| { |
| "epoch": 6.170542635658915, |
| "grad_norm": 0.4579031301080518, |
| "learning_rate": 1.693208190951159e-06, |
| "loss": 0.148, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1469820737838745, |
| "step": 3980, |
| "valid_targets_mean": 4262.1, |
| "valid_targets_min": 2558 |
| }, |
| { |
| "epoch": 6.178294573643411, |
| "grad_norm": 0.35185050016875424, |
| "learning_rate": 1.6622088445544337e-06, |
| "loss": 0.1488, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.129560187458992, |
| "step": 3985, |
| "valid_targets_mean": 5511.1, |
| "valid_targets_min": 710 |
| }, |
| { |
| "epoch": 6.186046511627907, |
| "grad_norm": 0.41851723149449205, |
| "learning_rate": 1.6314835877790035e-06, |
| "loss": 0.141, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15272796154022217, |
| "step": 3990, |
| "valid_targets_mean": 4655.8, |
| "valid_targets_min": 332 |
| }, |
| { |
| "epoch": 6.1937984496124034, |
| "grad_norm": 0.40076139878422207, |
| "learning_rate": 1.6010328798663332e-06, |
| "loss": 0.1481, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12933820486068726, |
| "step": 3995, |
| "valid_targets_mean": 5362.1, |
| "valid_targets_min": 3053 |
| }, |
| { |
| "epoch": 6.2015503875969, |
| "grad_norm": 0.45341665170317824, |
| "learning_rate": 1.570857175954279e-06, |
| "loss": 0.1637, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12798666954040527, |
| "step": 4000, |
| "valid_targets_mean": 4509.7, |
| "valid_targets_min": 489 |
| }, |
| { |
| "epoch": 6.209302325581396, |
| "grad_norm": 0.3607620367511857, |
| "learning_rate": 1.540956927070294e-06, |
| "loss": 0.128, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11347877979278564, |
| "step": 4005, |
| "valid_targets_mean": 5619.4, |
| "valid_targets_min": 2424 |
| }, |
| { |
| "epoch": 6.217054263565892, |
| "grad_norm": 0.5026070546003747, |
| "learning_rate": 1.5113325801246914e-06, |
| "loss": 0.1531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18720689415931702, |
| "step": 4010, |
| "valid_targets_mean": 4427.4, |
| "valid_targets_min": 1430 |
| }, |
| { |
| "epoch": 6.224806201550388, |
| "grad_norm": 0.43575139062965373, |
| "learning_rate": 1.4819845779039477e-06, |
| "loss": 0.1657, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1679738312959671, |
| "step": 4015, |
| "valid_targets_mean": 5928.5, |
| "valid_targets_min": 808 |
| }, |
| { |
| "epoch": 6.232558139534884, |
| "grad_norm": 0.42143605193627004, |
| "learning_rate": 1.4529133590641009e-06, |
| "loss": 0.1343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13898807764053345, |
| "step": 4020, |
| "valid_targets_mean": 4824.2, |
| "valid_targets_min": 1828 |
| }, |
| { |
| "epoch": 6.24031007751938, |
| "grad_norm": 0.4220444192180161, |
| "learning_rate": 1.4241193581241964e-06, |
| "loss": 0.1369, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12464825809001923, |
| "step": 4025, |
| "valid_targets_mean": 4312.4, |
| "valid_targets_min": 280 |
| }, |
| { |
| "epoch": 6.248062015503876, |
| "grad_norm": 0.4246528594263321, |
| "learning_rate": 1.395603005459769e-06, |
| "loss": 0.1514, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11180758476257324, |
| "step": 4030, |
| "valid_targets_mean": 5064.3, |
| "valid_targets_min": 268 |
| }, |
| { |
| "epoch": 6.2558139534883725, |
| "grad_norm": 0.4601989305033969, |
| "learning_rate": 1.367364727296434e-06, |
| "loss": 0.1391, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17486141622066498, |
| "step": 4035, |
| "valid_targets_mean": 4553.9, |
| "valid_targets_min": 455 |
| }, |
| { |
| "epoch": 6.263565891472869, |
| "grad_norm": 0.41743085880863806, |
| "learning_rate": 1.3394049457035063e-06, |
| "loss": 0.1271, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11269478499889374, |
| "step": 4040, |
| "valid_targets_mean": 4022.4, |
| "valid_targets_min": 396 |
| }, |
| { |
| "epoch": 6.271317829457364, |
| "grad_norm": 0.3957905593683059, |
| "learning_rate": 1.3117240785876994e-06, |
| "loss": 0.1397, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1279354691505432, |
| "step": 4045, |
| "valid_targets_mean": 4760.3, |
| "valid_targets_min": 573 |
| }, |
| { |
| "epoch": 6.27906976744186, |
| "grad_norm": 0.46939606376712706, |
| "learning_rate": 1.2843225396868707e-06, |
| "loss": 0.1278, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14345014095306396, |
| "step": 4050, |
| "valid_targets_mean": 3840.0, |
| "valid_targets_min": 977 |
| }, |
| { |
| "epoch": 6.286821705426356, |
| "grad_norm": 0.45118172267262807, |
| "learning_rate": 1.2572007385638264e-06, |
| "loss": 0.1409, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13466718792915344, |
| "step": 4055, |
| "valid_targets_mean": 5589.4, |
| "valid_targets_min": 2910 |
| }, |
| { |
| "epoch": 6.294573643410852, |
| "grad_norm": 0.47093501864092696, |
| "learning_rate": 1.2303590806002341e-06, |
| "loss": 0.138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17266318202018738, |
| "step": 4060, |
| "valid_targets_mean": 4088.8, |
| "valid_targets_min": 1934 |
| }, |
| { |
| "epoch": 6.3023255813953485, |
| "grad_norm": 0.43593257987581496, |
| "learning_rate": 1.2037979669905341e-06, |
| "loss": 0.1462, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1565391570329666, |
| "step": 4065, |
| "valid_targets_mean": 5561.3, |
| "valid_targets_min": 2171 |
| }, |
| { |
| "epoch": 6.310077519379845, |
| "grad_norm": 0.38442258109857474, |
| "learning_rate": 1.1775177947359472e-06, |
| "loss": 0.1469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.120355024933815, |
| "step": 4070, |
| "valid_targets_mean": 5508.9, |
| "valid_targets_min": 600 |
| }, |
| { |
| "epoch": 6.317829457364341, |
| "grad_norm": 0.5116245670615639, |
| "learning_rate": 1.1515189566385598e-06, |
| "loss": 0.1536, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15075933933258057, |
| "step": 4075, |
| "valid_targets_mean": 3669.8, |
| "valid_targets_min": 289 |
| }, |
| { |
| "epoch": 6.325581395348837, |
| "grad_norm": 0.519726609280829, |
| "learning_rate": 1.125801841295422e-06, |
| "loss": 0.1538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1663362681865692, |
| "step": 4080, |
| "valid_targets_mean": 3507.8, |
| "valid_targets_min": 755 |
| }, |
| { |
| "epoch": 6.333333333333333, |
| "grad_norm": 0.5066281048339958, |
| "learning_rate": 1.1003668330927674e-06, |
| "loss": 0.1561, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17226609587669373, |
| "step": 4085, |
| "valid_targets_mean": 3913.7, |
| "valid_targets_min": 891 |
| }, |
| { |
| "epoch": 6.341085271317829, |
| "grad_norm": 0.4168253714412732, |
| "learning_rate": 1.0752143122002502e-06, |
| "loss": 0.1549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13902395963668823, |
| "step": 4090, |
| "valid_targets_mean": 4731.2, |
| "valid_targets_min": 310 |
| }, |
| { |
| "epoch": 6.348837209302325, |
| "grad_norm": 0.3943285404063543, |
| "learning_rate": 1.0503446545652718e-06, |
| "loss": 0.1437, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13005225360393524, |
| "step": 4095, |
| "valid_targets_mean": 4982.7, |
| "valid_targets_min": 575 |
| }, |
| { |
| "epoch": 6.3565891472868215, |
| "grad_norm": 0.4120867129337237, |
| "learning_rate": 1.0257582319073612e-06, |
| "loss": 0.1276, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11511364579200745, |
| "step": 4100, |
| "valid_targets_mean": 4254.6, |
| "valid_targets_min": 869 |
| }, |
| { |
| "epoch": 6.364341085271318, |
| "grad_norm": 0.44941410097724094, |
| "learning_rate": 1.001455411712613e-06, |
| "loss": 0.1475, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14647594094276428, |
| "step": 4105, |
| "valid_targets_mean": 4231.6, |
| "valid_targets_min": 709 |
| }, |
| { |
| "epoch": 6.372093023255814, |
| "grad_norm": 0.38228475170706705, |
| "learning_rate": 9.774365572281973e-07, |
| "loss": 0.1393, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12529915571212769, |
| "step": 4110, |
| "valid_targets_mean": 5377.4, |
| "valid_targets_min": 2890 |
| }, |
| { |
| "epoch": 6.37984496124031, |
| "grad_norm": 0.40870796264529896, |
| "learning_rate": 9.537020274569376e-07, |
| "loss": 0.1378, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1220163106918335, |
| "step": 4115, |
| "valid_targets_mean": 4960.4, |
| "valid_targets_min": 617 |
| }, |
| { |
| "epoch": 6.387596899224806, |
| "grad_norm": 0.4785371009759146, |
| "learning_rate": 9.302521771519291e-07, |
| "loss": 0.1724, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15229693055152893, |
| "step": 4120, |
| "valid_targets_mean": 4179.5, |
| "valid_targets_min": 794 |
| }, |
| { |
| "epoch": 6.395348837209302, |
| "grad_norm": 0.5482438722247103, |
| "learning_rate": 9.070873568112537e-07, |
| "loss": 0.1715, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.20323488116264343, |
| "step": 4125, |
| "valid_targets_mean": 3866.2, |
| "valid_targets_min": 528 |
| }, |
| { |
| "epoch": 6.403100775193798, |
| "grad_norm": 0.34393102511247997, |
| "learning_rate": 8.842079126727365e-07, |
| "loss": 0.1438, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17043393850326538, |
| "step": 4130, |
| "valid_targets_mean": 8063.3, |
| "valid_targets_min": 1395 |
| }, |
| { |
| "epoch": 6.410852713178294, |
| "grad_norm": 0.48778735386271366, |
| "learning_rate": 8.616141867087569e-07, |
| "loss": 0.1415, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1254102885723114, |
| "step": 4135, |
| "valid_targets_mean": 4153.1, |
| "valid_targets_min": 497 |
| }, |
| { |
| "epoch": 6.4186046511627906, |
| "grad_norm": 0.42788835357838334, |
| "learning_rate": 8.393065166211544e-07, |
| "loss": 0.1385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1304156631231308, |
| "step": 4140, |
| "valid_targets_mean": 4457.7, |
| "valid_targets_min": 1134 |
| }, |
| { |
| "epoch": 6.426356589147287, |
| "grad_norm": 0.39619956994694927, |
| "learning_rate": 8.172852358361782e-07, |
| "loss": 0.1455, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1729072630405426, |
| "step": 4145, |
| "valid_targets_mean": 5565.4, |
| "valid_targets_min": 629 |
| }, |
| { |
| "epoch": 6.434108527131783, |
| "grad_norm": 0.4776261582174204, |
| "learning_rate": 7.955506734994922e-07, |
| "loss": 0.139, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17891857028007507, |
| "step": 4150, |
| "valid_targets_mean": 4085.9, |
| "valid_targets_min": 482 |
| }, |
| { |
| "epoch": 6.441860465116279, |
| "grad_norm": 0.4278671968152442, |
| "learning_rate": 7.741031544712663e-07, |
| "loss": 0.1358, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12771019339561462, |
| "step": 4155, |
| "valid_targets_mean": 4428.9, |
| "valid_targets_min": 479 |
| }, |
| { |
| "epoch": 6.449612403100775, |
| "grad_norm": 0.37776538158237155, |
| "learning_rate": 7.529429993213222e-07, |
| "loss": 0.1423, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12023401260375977, |
| "step": 4160, |
| "valid_targets_mean": 5098.1, |
| "valid_targets_min": 994 |
| }, |
| { |
| "epoch": 6.457364341085271, |
| "grad_norm": 0.43694272212869895, |
| "learning_rate": 7.320705243243287e-07, |
| "loss": 0.1405, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14688435196876526, |
| "step": 4165, |
| "valid_targets_mean": 5080.8, |
| "valid_targets_min": 675 |
| }, |
| { |
| "epoch": 6.465116279069767, |
| "grad_norm": 0.4225966998298987, |
| "learning_rate": 7.114860414550917e-07, |
| "loss": 0.1385, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14561529457569122, |
| "step": 4170, |
| "valid_targets_mean": 5137.9, |
| "valid_targets_min": 2089 |
| }, |
| { |
| "epoch": 6.4728682170542635, |
| "grad_norm": 0.4688876624797445, |
| "learning_rate": 6.911898583838738e-07, |
| "loss": 0.151, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15033042430877686, |
| "step": 4175, |
| "valid_targets_mean": 4029.8, |
| "valid_targets_min": 661 |
| }, |
| { |
| "epoch": 6.48062015503876, |
| "grad_norm": 0.4340667422133109, |
| "learning_rate": 6.711822784718158e-07, |
| "loss": 0.1515, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15977023541927338, |
| "step": 4180, |
| "valid_targets_mean": 4863.2, |
| "valid_targets_min": 2046 |
| }, |
| { |
| "epoch": 6.488372093023256, |
| "grad_norm": 0.4569382782087973, |
| "learning_rate": 6.5146360076638e-07, |
| "loss": 0.1623, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1681194007396698, |
| "step": 4185, |
| "valid_targets_mean": 4351.9, |
| "valid_targets_min": 315 |
| }, |
| { |
| "epoch": 6.496124031007752, |
| "grad_norm": 0.4554589036178452, |
| "learning_rate": 6.320341199968982e-07, |
| "loss": 0.1476, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15873485803604126, |
| "step": 4190, |
| "valid_targets_mean": 4564.2, |
| "valid_targets_min": 658 |
| }, |
| { |
| "epoch": 6.503875968992248, |
| "grad_norm": 0.49218409403445584, |
| "learning_rate": 6.128941265701627e-07, |
| "loss": 0.1387, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1481098085641861, |
| "step": 4195, |
| "valid_targets_mean": 3601.8, |
| "valid_targets_min": 352 |
| }, |
| { |
| "epoch": 6.511627906976744, |
| "grad_norm": 0.4096283466727092, |
| "learning_rate": 5.94043906566073e-07, |
| "loss": 0.1333, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13861069083213806, |
| "step": 4200, |
| "valid_targets_mean": 4857.5, |
| "valid_targets_min": 326 |
| }, |
| { |
| "epoch": 6.51937984496124, |
| "grad_norm": 0.46885200416042144, |
| "learning_rate": 5.754837417333781e-07, |
| "loss": 0.1389, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14652873575687408, |
| "step": 4205, |
| "valid_targets_mean": 3894.9, |
| "valid_targets_min": 906 |
| }, |
| { |
| "epoch": 6.5271317829457365, |
| "grad_norm": 0.3885968728101716, |
| "learning_rate": 5.572139094854478e-07, |
| "loss": 0.1482, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12030985951423645, |
| "step": 4210, |
| "valid_targets_mean": 4954.5, |
| "valid_targets_min": 2183 |
| }, |
| { |
| "epoch": 6.534883720930233, |
| "grad_norm": 0.37139089742268966, |
| "learning_rate": 5.392346828961504e-07, |
| "loss": 0.1401, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11080891638994217, |
| "step": 4215, |
| "valid_targets_mean": 5050.3, |
| "valid_targets_min": 298 |
| }, |
| { |
| "epoch": 6.542635658914729, |
| "grad_norm": 0.3853585068404549, |
| "learning_rate": 5.215463306957436e-07, |
| "loss": 0.1479, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13822655379772186, |
| "step": 4220, |
| "valid_targets_mean": 5455.0, |
| "valid_targets_min": 2416 |
| }, |
| { |
| "epoch": 6.550387596899225, |
| "grad_norm": 0.4726856345826331, |
| "learning_rate": 5.0414911726687e-07, |
| "loss": 0.1675, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.22890380024909973, |
| "step": 4225, |
| "valid_targets_mean": 5294.4, |
| "valid_targets_min": 781 |
| }, |
| { |
| "epoch": 6.558139534883721, |
| "grad_norm": 0.4031349839399349, |
| "learning_rate": 4.870433026406152e-07, |
| "loss": 0.1508, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13684213161468506, |
| "step": 4230, |
| "valid_targets_mean": 4680.8, |
| "valid_targets_min": 2718 |
| }, |
| { |
| "epoch": 6.565891472868217, |
| "grad_norm": 0.48960339790783236, |
| "learning_rate": 4.7022914249260197e-07, |
| "loss": 0.1597, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1440485715866089, |
| "step": 4235, |
| "valid_targets_mean": 4090.7, |
| "valid_targets_min": 2062 |
| }, |
| { |
| "epoch": 6.573643410852713, |
| "grad_norm": 0.48029936611780594, |
| "learning_rate": 4.537068881391848e-07, |
| "loss": 0.138, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15450087189674377, |
| "step": 4240, |
| "valid_targets_mean": 3792.6, |
| "valid_targets_min": 2354 |
| }, |
| { |
| "epoch": 6.5813953488372094, |
| "grad_norm": 0.411026213138413, |
| "learning_rate": 4.37476786533686e-07, |
| "loss": 0.1413, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11528407782316208, |
| "step": 4245, |
| "valid_targets_mean": 5034.7, |
| "valid_targets_min": 682 |
| }, |
| { |
| "epoch": 6.589147286821706, |
| "grad_norm": 0.3613114304130289, |
| "learning_rate": 4.2153908026270504e-07, |
| "loss": 0.1404, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11450152099132538, |
| "step": 4250, |
| "valid_targets_mean": 5106.2, |
| "valid_targets_min": 3567 |
| }, |
| { |
| "epoch": 6.596899224806202, |
| "grad_norm": 0.49968357376260497, |
| "learning_rate": 4.058940075424933e-07, |
| "loss": 0.1505, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1560279130935669, |
| "step": 4255, |
| "valid_targets_mean": 4061.5, |
| "valid_targets_min": 2069 |
| }, |
| { |
| "epoch": 6.604651162790698, |
| "grad_norm": 0.46911068601775274, |
| "learning_rate": 3.9054180221539394e-07, |
| "loss": 0.1538, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13993695378303528, |
| "step": 4260, |
| "valid_targets_mean": 3780.2, |
| "valid_targets_min": 790 |
| }, |
| { |
| "epoch": 6.612403100775194, |
| "grad_norm": 0.3917124798281757, |
| "learning_rate": 3.7548269374634736e-07, |
| "loss": 0.1344, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11809076368808746, |
| "step": 4265, |
| "valid_targets_mean": 4906.1, |
| "valid_targets_min": 253 |
| }, |
| { |
| "epoch": 6.62015503875969, |
| "grad_norm": 0.43882837837397076, |
| "learning_rate": 3.607169072194583e-07, |
| "loss": 0.1303, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13036519289016724, |
| "step": 4270, |
| "valid_targets_mean": 4900.6, |
| "valid_targets_min": 449 |
| }, |
| { |
| "epoch": 6.627906976744186, |
| "grad_norm": 0.3783203483240392, |
| "learning_rate": 3.4624466333464057e-07, |
| "loss": 0.1386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13775168359279633, |
| "step": 4275, |
| "valid_targets_mean": 5567.1, |
| "valid_targets_min": 523 |
| }, |
| { |
| "epoch": 6.635658914728682, |
| "grad_norm": 0.3505902467720475, |
| "learning_rate": 3.320661784043e-07, |
| "loss": 0.1366, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11130744218826294, |
| "step": 4280, |
| "valid_targets_mean": 6773.1, |
| "valid_targets_min": 3288 |
| }, |
| { |
| "epoch": 6.6434108527131785, |
| "grad_norm": 0.4364368560735114, |
| "learning_rate": 3.1818166435012563e-07, |
| "loss": 0.1503, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15424305200576782, |
| "step": 4285, |
| "valid_targets_mean": 4766.6, |
| "valid_targets_min": 605 |
| }, |
| { |
| "epoch": 6.651162790697675, |
| "grad_norm": 0.49428323333345386, |
| "learning_rate": 3.0459132869989914e-07, |
| "loss": 0.1635, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17941808700561523, |
| "step": 4290, |
| "valid_targets_mean": 4228.8, |
| "valid_targets_min": 575 |
| }, |
| { |
| "epoch": 6.658914728682171, |
| "grad_norm": 0.4532498891303768, |
| "learning_rate": 2.912953745844083e-07, |
| "loss": 0.1603, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16425731778144836, |
| "step": 4295, |
| "valid_targets_mean": 4930.4, |
| "valid_targets_min": 512 |
| }, |
| { |
| "epoch": 6.666666666666667, |
| "grad_norm": 0.4484218818013772, |
| "learning_rate": 2.7829400073440704e-07, |
| "loss": 0.147, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14921866357326508, |
| "step": 4300, |
| "valid_targets_mean": 4864.6, |
| "valid_targets_min": 2160 |
| }, |
| { |
| "epoch": 6.674418604651163, |
| "grad_norm": 0.5128051450701466, |
| "learning_rate": 2.655874014776427e-07, |
| "loss": 0.1484, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19552041590213776, |
| "step": 4305, |
| "valid_targets_mean": 4560.8, |
| "valid_targets_min": 324 |
| }, |
| { |
| "epoch": 6.682170542635659, |
| "grad_norm": 0.39420076435511847, |
| "learning_rate": 2.531757667359491e-07, |
| "loss": 0.1343, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11401358246803284, |
| "step": 4310, |
| "valid_targets_mean": 5222.8, |
| "valid_targets_min": 2452 |
| }, |
| { |
| "epoch": 6.689922480620155, |
| "grad_norm": 0.39424587927802124, |
| "learning_rate": 2.4105928202241557e-07, |
| "loss": 0.1313, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10992264747619629, |
| "step": 4315, |
| "valid_targets_mean": 4744.0, |
| "valid_targets_min": 946 |
| }, |
| { |
| "epoch": 6.6976744186046515, |
| "grad_norm": 0.4909208750282455, |
| "learning_rate": 2.2923812843861136e-07, |
| "loss": 0.1569, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1754213571548462, |
| "step": 4320, |
| "valid_targets_mean": 4488.9, |
| "valid_targets_min": 267 |
| }, |
| { |
| "epoch": 6.705426356589148, |
| "grad_norm": 0.46076430916005, |
| "learning_rate": 2.1771248267186795e-07, |
| "loss": 0.1439, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15366077423095703, |
| "step": 4325, |
| "valid_targets_mean": 3990.3, |
| "valid_targets_min": 412 |
| }, |
| { |
| "epoch": 6.713178294573644, |
| "grad_norm": 0.44837990403963107, |
| "learning_rate": 2.064825169926632e-07, |
| "loss": 0.1436, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14431065320968628, |
| "step": 4330, |
| "valid_targets_mean": 4223.2, |
| "valid_targets_min": 1821 |
| }, |
| { |
| "epoch": 6.720930232558139, |
| "grad_norm": 0.3689938810371774, |
| "learning_rate": 1.9554839925201686e-07, |
| "loss": 0.1333, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16173899173736572, |
| "step": 4335, |
| "valid_targets_mean": 6193.9, |
| "valid_targets_min": 3050 |
| }, |
| { |
| "epoch": 6.728682170542635, |
| "grad_norm": 0.3834490175252527, |
| "learning_rate": 1.849102928790014e-07, |
| "loss": 0.1465, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15902329981327057, |
| "step": 4340, |
| "valid_targets_mean": 5950.6, |
| "valid_targets_min": 532 |
| }, |
| { |
| "epoch": 6.736434108527131, |
| "grad_norm": 0.3806645179110598, |
| "learning_rate": 1.74568356878293e-07, |
| "loss": 0.1431, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15495096147060394, |
| "step": 4345, |
| "valid_targets_mean": 5389.5, |
| "valid_targets_min": 2093 |
| }, |
| { |
| "epoch": 6.7441860465116275, |
| "grad_norm": 0.5001568087478473, |
| "learning_rate": 1.6452274582779537e-07, |
| "loss": 0.1494, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14459748566150665, |
| "step": 4350, |
| "valid_targets_mean": 4592.8, |
| "valid_targets_min": 555 |
| }, |
| { |
| "epoch": 6.751937984496124, |
| "grad_norm": 0.5854439307900624, |
| "learning_rate": 1.5477360987633305e-07, |
| "loss": 0.166, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19409656524658203, |
| "step": 4355, |
| "valid_targets_mean": 3547.4, |
| "valid_targets_min": 529 |
| }, |
| { |
| "epoch": 6.75968992248062, |
| "grad_norm": 0.4665900083114806, |
| "learning_rate": 1.453210947413952e-07, |
| "loss": 0.1467, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1850074976682663, |
| "step": 4360, |
| "valid_targets_mean": 4564.8, |
| "valid_targets_min": 540 |
| }, |
| { |
| "epoch": 6.767441860465116, |
| "grad_norm": 0.48350023695445227, |
| "learning_rate": 1.3616534170697747e-07, |
| "loss": 0.1539, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15944364666938782, |
| "step": 4365, |
| "valid_targets_mean": 3584.8, |
| "valid_targets_min": 263 |
| }, |
| { |
| "epoch": 6.775193798449612, |
| "grad_norm": 0.45038375032977, |
| "learning_rate": 1.2730648762144804e-07, |
| "loss": 0.1552, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.18844370543956757, |
| "step": 4370, |
| "valid_targets_mean": 5290.8, |
| "valid_targets_min": 806 |
| }, |
| { |
| "epoch": 6.782945736434108, |
| "grad_norm": 0.4134945839078117, |
| "learning_rate": 1.1874466489551817e-07, |
| "loss": 0.1408, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15977919101715088, |
| "step": 4375, |
| "valid_targets_mean": 4978.0, |
| "valid_targets_min": 325 |
| }, |
| { |
| "epoch": 6.790697674418604, |
| "grad_norm": 0.40450500367697456, |
| "learning_rate": 1.1048000150025939e-07, |
| "loss": 0.1453, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13722053170204163, |
| "step": 4380, |
| "valid_targets_mean": 4658.6, |
| "valid_targets_min": 3135 |
| }, |
| { |
| "epoch": 6.7984496124031, |
| "grad_norm": 0.41715346551607424, |
| "learning_rate": 1.0251262096518499e-07, |
| "loss": 0.1402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.10508380830287933, |
| "step": 4385, |
| "valid_targets_mean": 4255.1, |
| "valid_targets_min": 250 |
| }, |
| { |
| "epoch": 6.8062015503875966, |
| "grad_norm": 0.5216272062569919, |
| "learning_rate": 9.484264237641372e-08, |
| "loss": 0.1549, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.21273067593574524, |
| "step": 4390, |
| "valid_targets_mean": 4022.2, |
| "valid_targets_min": 608 |
| }, |
| { |
| "epoch": 6.813953488372093, |
| "grad_norm": 0.39630599414920137, |
| "learning_rate": 8.747018037488009e-08, |
| "loss": 0.1337, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12072727829217911, |
| "step": 4395, |
| "valid_targets_mean": 4854.1, |
| "valid_targets_min": 233 |
| }, |
| { |
| "epoch": 6.821705426356589, |
| "grad_norm": 0.4277418685702825, |
| "learning_rate": 8.039534515462244e-08, |
| "loss": 0.129, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11388542503118515, |
| "step": 4400, |
| "valid_targets_mean": 4361.8, |
| "valid_targets_min": 821 |
| }, |
| { |
| "epoch": 6.829457364341085, |
| "grad_norm": 0.38765433024613494, |
| "learning_rate": 7.361824246114424e-08, |
| "loss": 0.1309, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13917176425457, |
| "step": 4405, |
| "valid_targets_mean": 5343.9, |
| "valid_targets_min": 1942 |
| }, |
| { |
| "epoch": 6.837209302325581, |
| "grad_norm": 0.34398297746177137, |
| "learning_rate": 6.713897358982202e-08, |
| "loss": 0.1493, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.113133504986763, |
| "step": 4410, |
| "valid_targets_mean": 5645.0, |
| "valid_targets_min": 678 |
| }, |
| { |
| "epoch": 6.844961240310077, |
| "grad_norm": 0.48279011534912997, |
| "learning_rate": 6.095763538440214e-08, |
| "loss": 0.1492, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12714777886867523, |
| "step": 4415, |
| "valid_targets_mean": 3936.2, |
| "valid_targets_min": 216 |
| }, |
| { |
| "epoch": 6.852713178294573, |
| "grad_norm": 0.4180463055838533, |
| "learning_rate": 5.507432023554637e-08, |
| "loss": 0.1469, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1416483223438263, |
| "step": 4420, |
| "valid_targets_mean": 4545.9, |
| "valid_targets_min": 1037 |
| }, |
| { |
| "epoch": 6.8604651162790695, |
| "grad_norm": 0.4294181180018212, |
| "learning_rate": 4.948911607945084e-08, |
| "loss": 0.1531, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.19967518746852875, |
| "step": 4425, |
| "valid_targets_mean": 5607.9, |
| "valid_targets_min": 615 |
| }, |
| { |
| "epoch": 6.868217054263566, |
| "grad_norm": 0.3477503979746384, |
| "learning_rate": 4.420210639653366e-08, |
| "loss": 0.1297, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1086292415857315, |
| "step": 4430, |
| "valid_targets_mean": 5510.9, |
| "valid_targets_min": 2659 |
| }, |
| { |
| "epoch": 6.875968992248062, |
| "grad_norm": 0.41768003376691165, |
| "learning_rate": 3.921337021018934e-08, |
| "loss": 0.1403, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1428183615207672, |
| "step": 4435, |
| "valid_targets_mean": 5068.1, |
| "valid_targets_min": 459 |
| }, |
| { |
| "epoch": 6.883720930232558, |
| "grad_norm": 0.490921604098694, |
| "learning_rate": 3.452298208560301e-08, |
| "loss": 0.1374, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.17244720458984375, |
| "step": 4440, |
| "valid_targets_mean": 4010.2, |
| "valid_targets_min": 669 |
| }, |
| { |
| "epoch": 6.891472868217054, |
| "grad_norm": 0.36536468948119627, |
| "learning_rate": 3.0131012128642445e-08, |
| "loss": 0.1521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.11829351633787155, |
| "step": 4445, |
| "valid_targets_mean": 5238.6, |
| "valid_targets_min": 573 |
| }, |
| { |
| "epoch": 6.89922480620155, |
| "grad_norm": 0.43543485475431953, |
| "learning_rate": 2.6037525984798918e-08, |
| "loss": 0.1592, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14736925065517426, |
| "step": 4450, |
| "valid_targets_mean": 4508.6, |
| "valid_targets_min": 2594 |
| }, |
| { |
| "epoch": 6.906976744186046, |
| "grad_norm": 0.457191809542186, |
| "learning_rate": 2.2242584838219062e-08, |
| "loss": 0.1419, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1291424185037613, |
| "step": 4455, |
| "valid_targets_mean": 4140.1, |
| "valid_targets_min": 363 |
| }, |
| { |
| "epoch": 6.9147286821705425, |
| "grad_norm": 0.3441924236982618, |
| "learning_rate": 1.8746245410781184e-08, |
| "loss": 0.1402, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.09382060170173645, |
| "step": 4460, |
| "valid_targets_mean": 5934.2, |
| "valid_targets_min": 2203 |
| }, |
| { |
| "epoch": 6.922480620155039, |
| "grad_norm": 0.46978533968904, |
| "learning_rate": 1.5548559961253707e-08, |
| "loss": 0.1517, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16701874136924744, |
| "step": 4465, |
| "valid_targets_mean": 4124.2, |
| "valid_targets_min": 435 |
| }, |
| { |
| "epoch": 6.930232558139535, |
| "grad_norm": 0.45884185400938543, |
| "learning_rate": 1.2649576284509135e-08, |
| "loss": 0.1654, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15522664785385132, |
| "step": 4470, |
| "valid_targets_mean": 4735.6, |
| "valid_targets_min": 748 |
| }, |
| { |
| "epoch": 6.937984496124031, |
| "grad_norm": 0.37304600716915987, |
| "learning_rate": 1.004933771080907e-08, |
| "loss": 0.1585, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.15063238143920898, |
| "step": 4475, |
| "valid_targets_mean": 5812.3, |
| "valid_targets_min": 1844 |
| }, |
| { |
| "epoch": 6.945736434108527, |
| "grad_norm": 0.4417268532948254, |
| "learning_rate": 7.747883105166942e-09, |
| "loss": 0.1483, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12845158576965332, |
| "step": 4480, |
| "valid_targets_mean": 3979.6, |
| "valid_targets_min": 329 |
| }, |
| { |
| "epoch": 6.953488372093023, |
| "grad_norm": 0.4206373369632711, |
| "learning_rate": 5.745246866748489e-09, |
| "loss": 0.1433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1285676211118698, |
| "step": 4485, |
| "valid_targets_mean": 4420.4, |
| "valid_targets_min": 864 |
| }, |
| { |
| "epoch": 6.961240310077519, |
| "grad_norm": 0.409189864441095, |
| "learning_rate": 4.041458928378816e-09, |
| "loss": 0.1433, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13274972140789032, |
| "step": 4490, |
| "valid_targets_mean": 5082.7, |
| "valid_targets_min": 2020 |
| }, |
| { |
| "epoch": 6.9689922480620154, |
| "grad_norm": 0.7633572465865676, |
| "learning_rate": 2.6365447560761093e-09, |
| "loss": 0.1471, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.1332360953092575, |
| "step": 4495, |
| "valid_targets_mean": 3844.5, |
| "valid_targets_min": 300 |
| }, |
| { |
| "epoch": 6.976744186046512, |
| "grad_norm": 0.4810580142176617, |
| "learning_rate": 1.5305253486852523e-09, |
| "loss": 0.1431, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.16817598044872284, |
| "step": 4500, |
| "valid_targets_mean": 4177.8, |
| "valid_targets_min": 529 |
| }, |
| { |
| "epoch": 6.984496124031008, |
| "grad_norm": 0.4276342091229402, |
| "learning_rate": 7.234172375558679e-10, |
| "loss": 0.1495, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.13658341765403748, |
| "step": 4505, |
| "valid_targets_mean": 4540.3, |
| "valid_targets_min": 1720 |
| }, |
| { |
| "epoch": 6.992248062015504, |
| "grad_norm": 0.41945236764032184, |
| "learning_rate": 2.1523248629806703e-10, |
| "loss": 0.1521, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.14896142482757568, |
| "step": 4510, |
| "valid_targets_mean": 4939.6, |
| "valid_targets_min": 694 |
| }, |
| { |
| "epoch": 7.0, |
| "grad_norm": 0.4017760557242996, |
| "learning_rate": 5.978690600372261e-12, |
| "loss": 0.1386, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12985655665397644, |
| "step": 4515, |
| "valid_targets_mean": 5961.6, |
| "valid_targets_min": 2002 |
| }, |
| { |
| "epoch": 7.0, |
| "loss_nan_ranks": 0, |
| "loss_rank_avg": 0.12985655665397644, |
| "step": 4515, |
| "total_flos": 1219521762033664.0, |
| "train_loss": 0.10701951415567831, |
| "train_runtime": 13204.5072, |
| "train_samples_per_second": 5.464, |
| "train_steps_per_second": 0.342, |
| "valid_targets_mean": 5961.6, |
| "valid_targets_min": 2002 |
| } |
| ], |
| "logging_steps": 5, |
| "max_steps": 4515, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 7, |
| "save_steps": 1500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": true |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 1219521762033664.0, |
| "train_batch_size": 1, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|